diff --git "a/wandb/run-20220504_142129-w4rlzz90/files/wandb-summary.json" "b/wandb/run-20220504_142129-w4rlzz90/files/wandb-summary.json" --- "a/wandb/run-20220504_142129-w4rlzz90/files/wandb-summary.json" +++ "b/wandb/run-20220504_142129-w4rlzz90/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.9735, "train/learning_rate": 9.739639080135741e-06, "train/epoch": 2.78, "train/global_step": 9000, "_runtime": 88903, "_timestamp": 1651762992, "_step": 9017, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 11.0, 59.0, 321.0, 395.0, 194.0, 36.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.493083953857422, -4.221606254577637, -2.9501290321350098, -1.6786515712738037, -0.40717411041259766, 0.8643035888671875, 2.1357808113098145, 3.4072580337524414, 4.678735733032227, 5.950213432312012, 7.221690654754639, 8.493167877197266, 9.76464557647705, 11.036123275756836, 12.307600021362305, 13.57907772064209, 14.850555419921875, 16.122032165527344, 17.393510818481445, 18.664987564086914, 19.936466217041016, 21.207942962646484, 22.479419708251953, 23.750896453857422, 25.022375106811523, 26.293851852416992, 27.565330505371094, 28.836807250976562, 30.10828399658203, 31.379762649536133, 32.651241302490234, 33.9227180480957, 35.194190979003906, 36.465667724609375, 37.737144470214844, 39.00862503051758, 40.28010177612305, 41.551578521728516, 42.823055267333984, 44.09453201293945, 45.36601257324219, 46.637489318847656, 47.908966064453125, 49.18044662475586, 50.45192337036133, 51.7234001159668, 52.994876861572266, 54.266353607177734, 55.5378303527832, 56.80930709838867, 58.08078384399414, 59.352264404296875, 60.623741149902344, 61.89521789550781, 63.16669464111328, 64.43817138671875, 65.70964813232422, 66.98112487792969, 68.25260162353516, 69.52407836914062, 70.7955551147461, 72.06703186035156, 73.33851623535156, 74.60999298095703, 75.8814697265625]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 6.0, 7.0, 7.0, 18.0, 13.0, 14.0, 20.0, 28.0, 33.0, 30.0, 33.0, 40.0, 36.0, 55.0, 36.0, 49.0, 51.0, 54.0, 48.0, 48.0, 40.0, 41.0, 49.0, 34.0, 33.0, 32.0, 37.0, 22.0, 14.0, 10.0, 20.0, 11.0, 4.0, 10.0, 6.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.991907119750977, -6.737341403961182, -6.482775688171387, -6.228209972381592, -5.973644256591797, -5.719078540802002, -5.464512825012207, -5.20994758605957, -4.955381393432617, -4.700815677642822, -4.446249961853027, -4.191684246063232, -3.9371185302734375, -3.6825528144836426, -3.4279873371124268, -3.173421621322632, -2.918856143951416, -2.664290428161621, -2.409724712371826, -2.1551589965820312, -1.9005934000015259, -1.646027684211731, -1.3914620876312256, -1.1368963718414307, -0.8823306560516357, -0.6277649402618408, -0.3731992840766907, -0.11863362789154053, 0.1359320878982544, 0.3904978036880493, 0.6450634002685547, 0.8996291160583496, 1.1541948318481445, 1.4087605476379395, 1.6633262634277344, 1.9178918600082397, 2.172457695007324, 2.427023410797119, 2.681588888168335, 2.93615460395813, 3.190720319747925, 3.4452860355377197, 3.6998517513275146, 3.9544172286987305, 4.208982944488525, 4.46354866027832, 4.718114376068115, 4.97268009185791, 5.227245807647705, 5.4818115234375, 5.736377239227295, 5.99094295501709, 6.245508670806885, 6.50007438659668, 6.754639625549316, 7.0092058181762695, 7.263771057128906, 7.518336772918701, 7.772902488708496, 8.027467727661133, 8.282033920288086, 8.536599159240723, 8.791165351867676, 9.045730590820312, 9.300296783447266]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 10.0, 9.0, 9.0, 19.0, 25.0, 17.0, 45.0, 67.0, 106.0, 206.0, 359.0, 654.0, 1240.0, 2326.0, 4634.0, 9028.0, 19975.0, 46274.0, 114597.0, 290061.0, 721117.0, 1434313.0, 924149.0, 378415.0, 144868.0, 56644.0, 23806.0, 10540.0, 5078.0, 2633.0, 1316.0, 712.0, 398.0, 244.0, 141.0, 64.0, 55.0, 42.0, 26.0, 17.0, 13.0, 5.0, 9.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0], "bins": [-9.796875, -9.52935791015625, -9.2618408203125, -8.99432373046875, -8.726806640625, -8.45928955078125, -8.1917724609375, -7.92425537109375, -7.65673828125, -7.38922119140625, -7.1217041015625, -6.85418701171875, -6.586669921875, -6.31915283203125, -6.0516357421875, -5.78411865234375, -5.5166015625, -5.24908447265625, -4.9815673828125, -4.71405029296875, -4.446533203125, -4.17901611328125, -3.9114990234375, -3.64398193359375, -3.37646484375, -3.10894775390625, -2.8414306640625, -2.57391357421875, -2.306396484375, -2.03887939453125, -1.7713623046875, -1.50384521484375, -1.236328125, -0.96881103515625, -0.7012939453125, -0.43377685546875, -0.166259765625, 0.10125732421875, 0.3687744140625, 0.63629150390625, 0.90380859375, 1.17132568359375, 1.4388427734375, 1.70635986328125, 1.973876953125, 2.24139404296875, 2.5089111328125, 2.77642822265625, 3.0439453125, 3.31146240234375, 3.5789794921875, 3.84649658203125, 4.114013671875, 4.38153076171875, 4.6490478515625, 4.91656494140625, 5.18408203125, 5.45159912109375, 5.7191162109375, 5.98663330078125, 6.254150390625, 6.52166748046875, 6.7891845703125, 7.05670166015625, 7.32421875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 4.0, 4.0, 6.0, 6.0, 4.0, 9.0, 11.0, 14.0, 24.0, 16.0, 16.0, 34.0, 35.0, 31.0, 28.0, 37.0, 39.0, 39.0, 46.0, 49.0, 43.0, 47.0, 38.0, 55.0, 46.0, 38.0, 37.0, 25.0, 30.0, 26.0, 25.0, 28.0, 17.0, 22.0, 12.0, 16.0, 7.0, 10.0, 10.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.4453125, -9.10009765625, -8.7548828125, -8.40966796875, -8.064453125, -7.71923828125, -7.3740234375, -7.02880859375, -6.68359375, -6.33837890625, -5.9931640625, -5.64794921875, -5.302734375, -4.95751953125, -4.6123046875, -4.26708984375, -3.921875, -3.57666015625, -3.2314453125, -2.88623046875, -2.541015625, -2.19580078125, -1.8505859375, -1.50537109375, -1.16015625, -0.81494140625, -0.4697265625, -0.12451171875, 0.220703125, 0.56591796875, 0.9111328125, 1.25634765625, 1.6015625, 1.94677734375, 2.2919921875, 2.63720703125, 2.982421875, 3.32763671875, 3.6728515625, 4.01806640625, 4.36328125, 4.70849609375, 5.0537109375, 5.39892578125, 5.744140625, 6.08935546875, 6.4345703125, 6.77978515625, 7.125, 7.47021484375, 7.8154296875, 8.16064453125, 8.505859375, 8.85107421875, 9.1962890625, 9.54150390625, 9.88671875, 10.23193359375, 10.5771484375, 10.92236328125, 11.267578125, 11.61279296875, 11.9580078125, 12.30322265625, 12.6484375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 5.0, 4.0, 14.0, 22.0, 40.0, 49.0, 92.0, 154.0, 270.0, 795.0, 198568.0, 3992532.0, 1025.0, 325.0, 138.0, 83.0, 53.0, 34.0, 24.0, 17.0, 12.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-210.375, -205.126953125, -199.87890625, -194.630859375, -189.3828125, -184.134765625, -178.88671875, -173.638671875, -168.390625, -163.142578125, -157.89453125, -152.646484375, -147.3984375, -142.150390625, -136.90234375, -131.654296875, -126.40625, -121.158203125, -115.91015625, -110.662109375, -105.4140625, -100.166015625, -94.91796875, -89.669921875, -84.421875, -79.173828125, -73.92578125, -68.677734375, -63.4296875, -58.181640625, -52.93359375, -47.685546875, -42.4375, -37.189453125, -31.94140625, -26.693359375, -21.4453125, -16.197265625, -10.94921875, -5.701171875, -0.453125, 4.794921875, 10.04296875, 15.291015625, 20.5390625, 25.787109375, 31.03515625, 36.283203125, 41.53125, 46.779296875, 52.02734375, 57.275390625, 62.5234375, 67.771484375, 73.01953125, 78.267578125, 83.515625, 88.763671875, 94.01171875, 99.259765625, 104.5078125, 109.755859375, 115.00390625, 120.251953125, 125.5]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 7.0, 7.0, 11.0, 15.0, 38.0, 61.0, 86.0, 141.0, 232.0, 420.0, 875.0, 1021.0, 507.0, 278.0, 138.0, 87.0, 56.0, 26.0, 26.0, 18.0, 6.0, 5.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.7578125, -8.5499267578125, -8.342041015625, -8.1341552734375, -7.92626953125, -7.7183837890625, -7.510498046875, -7.3026123046875, -7.0947265625, -6.8868408203125, -6.678955078125, -6.4710693359375, -6.26318359375, -6.0552978515625, -5.847412109375, -5.6395263671875, -5.431640625, -5.2237548828125, -5.015869140625, -4.8079833984375, -4.60009765625, -4.3922119140625, -4.184326171875, -3.9764404296875, -3.7685546875, -3.5606689453125, -3.352783203125, -3.1448974609375, -2.93701171875, -2.7291259765625, -2.521240234375, -2.3133544921875, -2.10546875, -1.8975830078125, -1.689697265625, -1.4818115234375, -1.27392578125, -1.0660400390625, -0.858154296875, -0.6502685546875, -0.4423828125, -0.2344970703125, -0.026611328125, 0.1812744140625, 0.38916015625, 0.5970458984375, 0.804931640625, 1.0128173828125, 1.220703125, 1.4285888671875, 1.636474609375, 1.8443603515625, 2.05224609375, 2.2601318359375, 2.468017578125, 2.6759033203125, 2.8837890625, 3.0916748046875, 3.299560546875, 3.5074462890625, 3.71533203125, 3.9232177734375, 4.131103515625, 4.3389892578125, 4.546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 3.0, 9.0, 8.0, 11.0, 18.0, 17.0, 18.0, 29.0, 35.0, 44.0, 42.0, 51.0, 58.0, 50.0, 57.0, 65.0, 64.0, 53.0, 54.0, 41.0, 41.0, 42.0, 37.0, 35.0, 16.0, 19.0, 24.0, 15.0, 8.0, 6.0, 7.0, 7.0, 1.0, 3.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.563047409057617, -15.172430038452148, -14.781813621520996, -14.391196250915527, -14.000578880310059, -13.609962463378906, -13.219345092773438, -12.828727722167969, -12.438111305236816, -12.047493934631348, -11.656877517700195, -11.266260147094727, -10.875642776489258, -10.485026359558105, -10.094408988952637, -9.703792572021484, -9.313175201416016, -8.922557830810547, -8.531941413879395, -8.141324043273926, -7.750707149505615, -7.360090255737305, -6.969472885131836, -6.578855991363525, -6.188238143920898, -5.797621250152588, -5.407003879547119, -5.016386985778809, -4.625770092010498, -4.2351531982421875, -3.8445358276367188, -3.453918933868408, -3.0633020401000977, -2.672684907913208, -2.2820680141448975, -1.8914508819580078, -1.5008338689804077, -1.1102168560028076, -0.719599723815918, -0.3289828300476074, 0.06163430213928223, 0.4522513449192047, 0.8428683876991272, 1.233485460281372, 1.6241024732589722, 2.0147194862365723, 2.405336618423462, 2.7959535121917725, 3.186570644378662, 3.5771877765655518, 3.9678046703338623, 4.358421802520752, 4.7490386962890625, 5.139656066894531, 5.530272960662842, 5.920889854431152, 6.311507225036621, 6.702124118804932, 7.0927414894104, 7.483358383178711, 7.8739752769470215, 8.264592170715332, 8.6552095413208, 9.045825958251953, 9.436443328857422]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 12.0, 9.0, 11.0, 13.0, 11.0, 18.0, 16.0, 26.0, 22.0, 24.0, 28.0, 28.0, 36.0, 39.0, 35.0, 49.0, 29.0, 32.0, 47.0, 47.0, 38.0, 44.0, 32.0, 38.0, 36.0, 28.0, 29.0, 32.0, 30.0, 17.0, 16.0, 17.0, 14.0, 17.0, 14.0, 10.0, 9.0, 7.0, 4.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-9.535484313964844, -9.235716819763184, -8.935949325561523, -8.636181831359863, -8.336414337158203, -8.03664779663086, -7.736880302429199, -7.437112808227539, -7.137345314025879, -6.837577819824219, -6.537810325622559, -6.238043308258057, -5.9382758140563965, -5.638508319854736, -5.338741302490234, -5.038973808288574, -4.739206314086914, -4.439438819885254, -4.139671325683594, -3.839904308319092, -3.5401368141174316, -3.2403693199157715, -2.9406020641326904, -2.6408348083496094, -2.341067314147949, -2.041299819946289, -1.741532564163208, -1.4417651891708374, -1.1419978141784668, -0.8422304391860962, -0.5424630641937256, -0.24269580841064453, 0.057071685791015625, 0.35683906078338623, 0.6566064357757568, 0.9563738107681274, 1.256141185760498, 1.5559085607528687, 1.8556759357452393, 2.1554431915283203, 2.4552106857299805, 2.7549781799316406, 3.0547454357147217, 3.3545126914978027, 3.654280185699463, 3.954047679901123, 4.253814697265625, 4.553582191467285, 4.853349685668945, 5.1531171798706055, 5.452884674072266, 5.752651691436768, 6.052419185638428, 6.352186679840088, 6.65195369720459, 6.95172119140625, 7.25148868560791, 7.55125617980957, 7.8510236740112305, 8.15079116821289, 8.450557708740234, 8.750325202941895, 9.050092697143555, 9.349860191345215, 9.649627685546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 6.0, 16.0, 19.0, 26.0, 22.0, 40.0, 77.0, 104.0, 175.0, 249.0, 391.0, 564.0, 866.0, 1362.0, 2169.0, 3486.0, 5715.0, 9698.0, 16483.0, 28643.0, 51222.0, 92494.0, 163333.0, 227880.0, 188363.0, 110828.0, 61225.0, 34304.0, 19534.0, 11528.0, 6634.0, 4076.0, 2514.0, 1569.0, 980.0, 612.0, 452.0, 282.0, 206.0, 118.0, 86.0, 55.0, 39.0, 36.0, 16.0, 16.0, 11.0, 7.0, 4.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.865234375, -2.771759033203125, -2.67828369140625, -2.584808349609375, -2.4913330078125, -2.397857666015625, -2.30438232421875, -2.210906982421875, -2.117431640625, -2.023956298828125, -1.93048095703125, -1.837005615234375, -1.7435302734375, -1.650054931640625, -1.55657958984375, -1.463104248046875, -1.36962890625, -1.276153564453125, -1.18267822265625, -1.089202880859375, -0.9957275390625, -0.902252197265625, -0.80877685546875, -0.715301513671875, -0.621826171875, -0.528350830078125, -0.43487548828125, -0.341400146484375, -0.2479248046875, -0.154449462890625, -0.06097412109375, 0.032501220703125, 0.1259765625, 0.219451904296875, 0.31292724609375, 0.406402587890625, 0.4998779296875, 0.593353271484375, 0.68682861328125, 0.780303955078125, 0.873779296875, 0.967254638671875, 1.06072998046875, 1.154205322265625, 1.2476806640625, 1.341156005859375, 1.43463134765625, 1.528106689453125, 1.62158203125, 1.715057373046875, 1.80853271484375, 1.902008056640625, 1.9954833984375, 2.088958740234375, 2.18243408203125, 2.275909423828125, 2.369384765625, 2.462860107421875, 2.55633544921875, 2.649810791015625, 2.7432861328125, 2.836761474609375, 2.93023681640625, 3.023712158203125, 3.1171875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 7.0, 7.0, 5.0, 6.0, 11.0, 12.0, 12.0, 16.0, 25.0, 29.0, 28.0, 36.0, 26.0, 44.0, 46.0, 45.0, 61.0, 44.0, 60.0, 49.0, 46.0, 55.0, 44.0, 52.0, 34.0, 31.0, 35.0, 26.0, 24.0, 20.0, 13.0, 9.0, 12.0, 9.0, 11.0, 3.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2265625, -8.9281005859375, -8.629638671875, -8.3311767578125, -8.03271484375, -7.7342529296875, -7.435791015625, -7.1373291015625, -6.8388671875, -6.5404052734375, -6.241943359375, -5.9434814453125, -5.64501953125, -5.3465576171875, -5.048095703125, -4.7496337890625, -4.451171875, -4.1527099609375, -3.854248046875, -3.5557861328125, -3.25732421875, -2.9588623046875, -2.660400390625, -2.3619384765625, -2.0634765625, -1.7650146484375, -1.466552734375, -1.1680908203125, -0.86962890625, -0.5711669921875, -0.272705078125, 0.0257568359375, 0.32421875, 0.6226806640625, 0.921142578125, 1.2196044921875, 1.51806640625, 1.8165283203125, 2.114990234375, 2.4134521484375, 2.7119140625, 3.0103759765625, 3.308837890625, 3.6072998046875, 3.90576171875, 4.2042236328125, 4.502685546875, 4.8011474609375, 5.099609375, 5.3980712890625, 5.696533203125, 5.9949951171875, 6.29345703125, 6.5919189453125, 6.890380859375, 7.1888427734375, 7.4873046875, 7.7857666015625, 8.084228515625, 8.3826904296875, 8.68115234375, 8.9796142578125, 9.278076171875, 9.5765380859375, 9.875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 6.0, 10.0, 14.0, 13.0, 25.0, 37.0, 38.0, 71.0, 119.0, 176.0, 325.0, 549.0, 1195.0, 2624.0, 7072.0, 21636.0, 78108.0, 317707.0, 439899.0, 128530.0, 33115.0, 10345.0, 3791.0, 1462.0, 704.0, 391.0, 206.0, 136.0, 93.0, 50.0, 23.0, 26.0, 17.0, 15.0, 9.0, 4.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08984375, -4.9091796875, -4.728515625, -4.5478515625, -4.3671875, -4.1865234375, -4.005859375, -3.8251953125, -3.64453125, -3.4638671875, -3.283203125, -3.1025390625, -2.921875, -2.7412109375, -2.560546875, -2.3798828125, -2.19921875, -2.0185546875, -1.837890625, -1.6572265625, -1.4765625, -1.2958984375, -1.115234375, -0.9345703125, -0.75390625, -0.5732421875, -0.392578125, -0.2119140625, -0.03125, 0.1494140625, 0.330078125, 0.5107421875, 0.69140625, 0.8720703125, 1.052734375, 1.2333984375, 1.4140625, 1.5947265625, 1.775390625, 1.9560546875, 2.13671875, 2.3173828125, 2.498046875, 2.6787109375, 2.859375, 3.0400390625, 3.220703125, 3.4013671875, 3.58203125, 3.7626953125, 3.943359375, 4.1240234375, 4.3046875, 4.4853515625, 4.666015625, 4.8466796875, 5.02734375, 5.2080078125, 5.388671875, 5.5693359375, 5.75, 5.9306640625, 6.111328125, 6.2919921875, 6.47265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 8.0, 7.0, 12.0, 9.0, 10.0, 15.0, 13.0, 21.0, 29.0, 36.0, 21.0, 40.0, 39.0, 51.0, 51.0, 38.0, 41.0, 48.0, 43.0, 42.0, 46.0, 54.0, 34.0, 41.0, 41.0, 37.0, 27.0, 23.0, 25.0, 15.0, 10.0, 16.0, 9.0, 10.0, 8.0, 4.0, 8.0, 5.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.734375, -16.178955078125, -15.62353515625, -15.068115234375, -14.5126953125, -13.957275390625, -13.40185546875, -12.846435546875, -12.291015625, -11.735595703125, -11.18017578125, -10.624755859375, -10.0693359375, -9.513916015625, -8.95849609375, -8.403076171875, -7.84765625, -7.292236328125, -6.73681640625, -6.181396484375, -5.6259765625, -5.070556640625, -4.51513671875, -3.959716796875, -3.404296875, -2.848876953125, -2.29345703125, -1.738037109375, -1.1826171875, -0.627197265625, -0.07177734375, 0.483642578125, 1.0390625, 1.594482421875, 2.14990234375, 2.705322265625, 3.2607421875, 3.816162109375, 4.37158203125, 4.927001953125, 5.482421875, 6.037841796875, 6.59326171875, 7.148681640625, 7.7041015625, 8.259521484375, 8.81494140625, 9.370361328125, 9.92578125, 10.481201171875, 11.03662109375, 11.592041015625, 12.1474609375, 12.702880859375, 13.25830078125, 13.813720703125, 14.369140625, 14.924560546875, 15.47998046875, 16.035400390625, 16.5908203125, 17.146240234375, 17.70166015625, 18.257080078125, 18.8125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 12.0, 8.0, 12.0, 17.0, 18.0, 41.0, 55.0, 86.0, 138.0, 188.0, 314.0, 535.0, 1037.0, 2125.0, 4642.0, 12724.0, 44580.0, 244387.0, 591877.0, 106164.0, 24782.0, 8064.0, 3248.0, 1550.0, 788.0, 410.0, 264.0, 165.0, 102.0, 67.0, 46.0, 23.0, 21.0, 14.0, 16.0, 15.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3671875, -3.26287841796875, -3.1585693359375, -3.05426025390625, -2.949951171875, -2.84564208984375, -2.7413330078125, -2.63702392578125, -2.53271484375, -2.42840576171875, -2.3240966796875, -2.21978759765625, -2.115478515625, -2.01116943359375, -1.9068603515625, -1.80255126953125, -1.6982421875, -1.59393310546875, -1.4896240234375, -1.38531494140625, -1.281005859375, -1.17669677734375, -1.0723876953125, -0.96807861328125, -0.86376953125, -0.75946044921875, -0.6551513671875, -0.55084228515625, -0.446533203125, -0.34222412109375, -0.2379150390625, -0.13360595703125, -0.029296875, 0.07501220703125, 0.1793212890625, 0.28363037109375, 0.387939453125, 0.49224853515625, 0.5965576171875, 0.70086669921875, 0.80517578125, 0.90948486328125, 1.0137939453125, 1.11810302734375, 1.222412109375, 1.32672119140625, 1.4310302734375, 1.53533935546875, 1.6396484375, 1.74395751953125, 1.8482666015625, 1.95257568359375, 2.056884765625, 2.16119384765625, 2.2655029296875, 2.36981201171875, 2.47412109375, 2.57843017578125, 2.6827392578125, 2.78704833984375, 2.891357421875, 2.99566650390625, 3.0999755859375, 3.20428466796875, 3.30859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 4.0, 6.0, 9.0, 10.0, 16.0, 19.0, 39.0, 57.0, 82.0, 111.0, 121.0, 143.0, 100.0, 99.0, 58.0, 36.0, 24.0, 11.0, 19.0, 8.0, 7.0, 9.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015745162963867188, -0.0015202164649963379, -0.001465916633605957, -0.0014116168022155762, -0.0013573169708251953, -0.0013030171394348145, -0.0012487173080444336, -0.0011944174766540527, -0.0011401176452636719, -0.001085817813873291, -0.0010315179824829102, -0.0009772181510925293, -0.0009229183197021484, -0.0008686184883117676, -0.0008143186569213867, -0.0007600188255310059, -0.000705718994140625, -0.0006514191627502441, -0.0005971193313598633, -0.0005428194999694824, -0.0004885196685791016, -0.0004342198371887207, -0.00037992000579833984, -0.000325620174407959, -0.0002713203430175781, -0.00021702051162719727, -0.0001627206802368164, -0.00010842084884643555, -5.412101745605469e-05, 1.7881393432617188e-07, 5.447864532470703e-05, 0.00010877847671508789, 0.00016307830810546875, 0.0002173781394958496, 0.00027167797088623047, 0.00032597780227661133, 0.0003802776336669922, 0.00043457746505737305, 0.0004888772964477539, 0.0005431771278381348, 0.0005974769592285156, 0.0006517767906188965, 0.0007060766220092773, 0.0007603764533996582, 0.0008146762847900391, 0.0008689761161804199, 0.0009232759475708008, 0.0009775757789611816, 0.0010318756103515625, 0.0010861754417419434, 0.0011404752731323242, 0.001194775104522705, 0.001249074935913086, 0.0013033747673034668, 0.0013576745986938477, 0.0014119744300842285, 0.0014662742614746094, 0.0015205740928649902, 0.001574873924255371, 0.001629173755645752, 0.0016834735870361328, 0.0017377734184265137, 0.0017920732498168945, 0.0018463730812072754, 0.0019006729125976562]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 9.0, 9.0, 18.0, 13.0, 20.0, 30.0, 56.0, 105.0, 295.0, 1889.0, 23666.0, 869755.0, 145799.0, 5874.0, 632.0, 162.0, 71.0, 33.0, 28.0, 15.0, 13.0, 11.0, 7.0, 8.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.0546875, -11.707763671875, -11.36083984375, -11.013916015625, -10.6669921875, -10.320068359375, -9.97314453125, -9.626220703125, -9.279296875, -8.932373046875, -8.58544921875, -8.238525390625, -7.8916015625, -7.544677734375, -7.19775390625, -6.850830078125, -6.50390625, -6.156982421875, -5.81005859375, -5.463134765625, -5.1162109375, -4.769287109375, -4.42236328125, -4.075439453125, -3.728515625, -3.381591796875, -3.03466796875, -2.687744140625, -2.3408203125, -1.993896484375, -1.64697265625, -1.300048828125, -0.953125, -0.606201171875, -0.25927734375, 0.087646484375, 0.4345703125, 0.781494140625, 1.12841796875, 1.475341796875, 1.822265625, 2.169189453125, 2.51611328125, 2.863037109375, 3.2099609375, 3.556884765625, 3.90380859375, 4.250732421875, 4.59765625, 4.944580078125, 5.29150390625, 5.638427734375, 5.9853515625, 6.332275390625, 6.67919921875, 7.026123046875, 7.373046875, 7.719970703125, 8.06689453125, 8.413818359375, 8.7607421875, 9.107666015625, 9.45458984375, 9.801513671875, 10.1484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 9.0, 14.0, 10.0, 15.0, 23.0, 28.0, 33.0, 50.0, 82.0, 87.0, 126.0, 91.0, 110.0, 80.0, 55.0, 44.0, 25.0, 29.0, 20.0, 13.0, 6.0, 7.0, 9.0, 3.0, 4.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.41796875, -1.3788909912109375, -1.339813232421875, -1.3007354736328125, -1.26165771484375, -1.2225799560546875, -1.183502197265625, -1.1444244384765625, -1.1053466796875, -1.0662689208984375, -1.027191162109375, -0.9881134033203125, -0.94903564453125, -0.9099578857421875, -0.870880126953125, -0.8318023681640625, -0.792724609375, -0.7536468505859375, -0.714569091796875, -0.6754913330078125, -0.63641357421875, -0.5973358154296875, -0.558258056640625, -0.5191802978515625, -0.4801025390625, -0.4410247802734375, -0.401947021484375, -0.3628692626953125, -0.32379150390625, -0.2847137451171875, -0.245635986328125, -0.2065582275390625, -0.16748046875, -0.1284027099609375, -0.089324951171875, -0.0502471923828125, -0.01116943359375, 0.0279083251953125, 0.066986083984375, 0.1060638427734375, 0.1451416015625, 0.1842193603515625, 0.223297119140625, 0.2623748779296875, 0.30145263671875, 0.3405303955078125, 0.379608154296875, 0.4186859130859375, 0.457763671875, 0.4968414306640625, 0.535919189453125, 0.5749969482421875, 0.61407470703125, 0.6531524658203125, 0.692230224609375, 0.7313079833984375, 0.7703857421875, 0.8094635009765625, 0.848541259765625, 0.8876190185546875, 0.92669677734375, 0.9657745361328125, 1.004852294921875, 1.0439300537109375, 1.0830078125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 5.0, 8.0, 10.0, 26.0, 44.0, 78.0, 103.0, 150.0, 135.0, 119.0, 92.0, 94.0, 50.0, 36.0, 19.0, 16.0, 7.0, 6.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.89997100830078, -29.245502471923828, -28.591035842895508, -27.936569213867188, -27.282100677490234, -26.62763214111328, -25.97316551208496, -25.31869888305664, -24.664230346679688, -24.009761810302734, -23.355295181274414, -22.700828552246094, -22.04636001586914, -21.391891479492188, -20.737424850463867, -20.082958221435547, -19.428489685058594, -18.77402114868164, -18.11955451965332, -17.465087890625, -16.810619354248047, -16.156150817871094, -15.501684188842773, -14.847216606140137, -14.1927490234375, -13.538281440734863, -12.883813858032227, -12.22934627532959, -11.574878692626953, -10.920411109924316, -10.26594352722168, -9.611475944519043, -8.957008361816406, -8.30254077911377, -7.648073196411133, -6.993605613708496, -6.339138031005859, -5.684670448303223, -5.030202865600586, -4.375735282897949, -3.7212677001953125, -3.066800117492676, -2.412332534790039, -1.7578649520874023, -1.1033973693847656, -0.4489297866821289, 0.2055377960205078, 0.8600053787231445, 1.5144729614257812, 2.168940544128418, 2.8234081268310547, 3.4778757095336914, 4.132343292236328, 4.786810874938965, 5.441278457641602, 6.095746040344238, 6.750213623046875, 7.404681205749512, 8.059148788452148, 8.713616371154785, 9.368083953857422, 10.022551536560059, 10.677019119262695, 11.331486701965332, 11.985954284667969]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 5.0, 8.0, 11.0, 2.0, 13.0, 22.0, 17.0, 22.0, 34.0, 33.0, 39.0, 41.0, 34.0, 50.0, 51.0, 59.0, 40.0, 44.0, 43.0, 41.0, 55.0, 46.0, 37.0, 39.0, 32.0, 34.0, 25.0, 17.0, 18.0, 22.0, 10.0, 9.0, 11.0, 11.0, 6.0, 6.0, 4.0, 5.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.189397811889648, -8.908153533935547, -8.626909255981445, -8.34566593170166, -8.064421653747559, -7.783177375793457, -7.501933574676514, -7.22068977355957, -6.939445495605469, -6.658201217651367, -6.376957416534424, -6.0957136154174805, -5.814469337463379, -5.533225059509277, -5.251981258392334, -4.970737457275391, -4.689493179321289, -4.4082489013671875, -4.127005100250244, -3.8457610607147217, -3.564517021179199, -3.2832729816436768, -3.0020289421081543, -2.720784902572632, -2.4395408630371094, -2.158296823501587, -1.8770527839660645, -1.595808744430542, -1.3145647048950195, -1.033320665359497, -0.7520766258239746, -0.47083258628845215, -0.18958759307861328, 0.09165644645690918, 0.37290048599243164, 0.6541445255279541, 0.9353885650634766, 1.216632604598999, 1.4978766441345215, 1.779120683670044, 2.0603647232055664, 2.341608762741089, 2.6228528022766113, 2.904096841812134, 3.1853408813476562, 3.4665849208831787, 3.747828960418701, 4.0290727615356445, 4.310317039489746, 4.591561317443848, 4.872805118560791, 5.154048919677734, 5.435293197631836, 5.7165374755859375, 5.997781276702881, 6.279025077819824, 6.560269355773926, 6.841513633728027, 7.122757434844971, 7.404001235961914, 7.685245513916016, 7.966489791870117, 8.247734069824219, 8.528977394104004, 8.810221672058105]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 9.0, 8.0, 11.0, 22.0, 13.0, 24.0, 53.0, 61.0, 101.0, 144.0, 184.0, 292.0, 481.0, 705.0, 1299.0, 2299.0, 4521.0, 9459.0, 22348.0, 56481.0, 149022.0, 319766.0, 281713.0, 119905.0, 45021.0, 17800.0, 7999.0, 3795.0, 1962.0, 1129.0, 697.0, 394.0, 266.0, 166.0, 125.0, 90.0, 46.0, 38.0, 35.0, 19.0, 24.0, 10.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.12109375, -5.9349365234375, -5.748779296875, -5.5626220703125, -5.37646484375, -5.1903076171875, -5.004150390625, -4.8179931640625, -4.6318359375, -4.4456787109375, -4.259521484375, -4.0733642578125, -3.88720703125, -3.7010498046875, -3.514892578125, -3.3287353515625, -3.142578125, -2.9564208984375, -2.770263671875, -2.5841064453125, -2.39794921875, -2.2117919921875, -2.025634765625, -1.8394775390625, -1.6533203125, -1.4671630859375, -1.281005859375, -1.0948486328125, -0.90869140625, -0.7225341796875, -0.536376953125, -0.3502197265625, -0.1640625, 0.0220947265625, 0.208251953125, 0.3944091796875, 0.58056640625, 0.7667236328125, 0.952880859375, 1.1390380859375, 1.3251953125, 1.5113525390625, 1.697509765625, 1.8836669921875, 2.06982421875, 2.2559814453125, 2.442138671875, 2.6282958984375, 2.814453125, 3.0006103515625, 3.186767578125, 3.3729248046875, 3.55908203125, 3.7452392578125, 3.931396484375, 4.1175537109375, 4.3037109375, 4.4898681640625, 4.676025390625, 4.8621826171875, 5.04833984375, 5.2344970703125, 5.420654296875, 5.6068115234375, 5.79296875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 0.0, 4.0, 9.0, 7.0, 12.0, 14.0, 10.0, 13.0, 27.0, 26.0, 30.0, 23.0, 44.0, 45.0, 42.0, 53.0, 57.0, 60.0, 72.0, 50.0, 53.0, 51.0, 57.0, 49.0, 23.0, 21.0, 36.0, 29.0, 8.0, 15.0, 13.0, 9.0, 11.0, 11.0, 1.0, 2.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-65.25, -63.29736328125, -61.3447265625, -59.39208984375, -57.439453125, -55.48681640625, -53.5341796875, -51.58154296875, -49.62890625, -47.67626953125, -45.7236328125, -43.77099609375, -41.818359375, -39.86572265625, -37.9130859375, -35.96044921875, -34.0078125, -32.05517578125, -30.1025390625, -28.14990234375, -26.197265625, -24.24462890625, -22.2919921875, -20.33935546875, -18.38671875, -16.43408203125, -14.4814453125, -12.52880859375, -10.576171875, -8.62353515625, -6.6708984375, -4.71826171875, -2.765625, -0.81298828125, 1.1396484375, 3.09228515625, 5.044921875, 6.99755859375, 8.9501953125, 10.90283203125, 12.85546875, 14.80810546875, 16.7607421875, 18.71337890625, 20.666015625, 22.61865234375, 24.5712890625, 26.52392578125, 28.4765625, 30.42919921875, 32.3818359375, 34.33447265625, 36.287109375, 38.23974609375, 40.1923828125, 42.14501953125, 44.09765625, 46.05029296875, 48.0029296875, 49.95556640625, 51.908203125, 53.86083984375, 55.8134765625, 57.76611328125, 59.71875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 10.0, 12.0, 17.0, 18.0, 26.0, 31.0, 40.0, 39.0, 57.0, 78.0, 85.0, 117.0, 170.0, 313.0, 662.0, 1919.0, 18169.0, 821780.0, 197488.0, 5130.0, 1059.0, 486.0, 256.0, 132.0, 111.0, 72.0, 53.0, 44.0, 43.0, 31.0, 26.0, 14.0, 12.0, 11.0, 11.0, 4.0, 4.0, 7.0, 4.0, 5.0, 2.0, 2.0], "bins": [-32.0, -31.195556640625, -30.39111328125, -29.586669921875, -28.7822265625, -27.977783203125, -27.17333984375, -26.368896484375, -25.564453125, -24.760009765625, -23.95556640625, -23.151123046875, -22.3466796875, -21.542236328125, -20.73779296875, -19.933349609375, -19.12890625, -18.324462890625, -17.52001953125, -16.715576171875, -15.9111328125, -15.106689453125, -14.30224609375, -13.497802734375, -12.693359375, -11.888916015625, -11.08447265625, -10.280029296875, -9.4755859375, -8.671142578125, -7.86669921875, -7.062255859375, -6.2578125, -5.453369140625, -4.64892578125, -3.844482421875, -3.0400390625, -2.235595703125, -1.43115234375, -0.626708984375, 0.177734375, 0.982177734375, 1.78662109375, 2.591064453125, 3.3955078125, 4.199951171875, 5.00439453125, 5.808837890625, 6.61328125, 7.417724609375, 8.22216796875, 9.026611328125, 9.8310546875, 10.635498046875, 11.43994140625, 12.244384765625, 13.048828125, 13.853271484375, 14.65771484375, 15.462158203125, 16.2666015625, 17.071044921875, 17.87548828125, 18.679931640625, 19.484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 6.0, 4.0, 8.0, 8.0, 9.0, 13.0, 14.0, 14.0, 20.0, 25.0, 19.0, 24.0, 22.0, 38.0, 33.0, 34.0, 44.0, 44.0, 32.0, 52.0, 55.0, 54.0, 37.0, 33.0, 49.0, 49.0, 38.0, 35.0, 23.0, 19.0, 28.0, 28.0, 13.0, 10.0, 17.0, 15.0, 11.0, 5.0, 11.0, 4.0, 6.0, 1.0, 0.0, 7.0, 0.0, 1.0, 1.0, 1.0], "bins": [-60.09375, -58.470703125, -56.84765625, -55.224609375, -53.6015625, -51.978515625, -50.35546875, -48.732421875, -47.109375, -45.486328125, -43.86328125, -42.240234375, -40.6171875, -38.994140625, -37.37109375, -35.748046875, -34.125, -32.501953125, -30.87890625, -29.255859375, -27.6328125, -26.009765625, -24.38671875, -22.763671875, -21.140625, -19.517578125, -17.89453125, -16.271484375, -14.6484375, -13.025390625, -11.40234375, -9.779296875, -8.15625, -6.533203125, -4.91015625, -3.287109375, -1.6640625, -0.041015625, 1.58203125, 3.205078125, 4.828125, 6.451171875, 8.07421875, 9.697265625, 11.3203125, 12.943359375, 14.56640625, 16.189453125, 17.8125, 19.435546875, 21.05859375, 22.681640625, 24.3046875, 25.927734375, 27.55078125, 29.173828125, 30.796875, 32.419921875, 34.04296875, 35.666015625, 37.2890625, 38.912109375, 40.53515625, 42.158203125, 43.78125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 5.0, 7.0, 22.0, 23.0, 24.0, 31.0, 54.0, 93.0, 137.0, 324.0, 688.0, 1373.0, 4278.0, 18319.0, 198682.0, 764154.0, 47936.0, 8105.0, 2359.0, 934.0, 449.0, 225.0, 114.0, 63.0, 46.0, 26.0, 23.0, 18.0, 13.0, 12.0, 1.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.734375, -2.649566650390625, -2.56475830078125, -2.479949951171875, -2.3951416015625, -2.310333251953125, -2.22552490234375, -2.140716552734375, -2.055908203125, -1.971099853515625, -1.88629150390625, -1.801483154296875, -1.7166748046875, -1.631866455078125, -1.54705810546875, -1.462249755859375, -1.37744140625, -1.292633056640625, -1.20782470703125, -1.123016357421875, -1.0382080078125, -0.953399658203125, -0.86859130859375, -0.783782958984375, -0.698974609375, -0.614166259765625, -0.52935791015625, -0.444549560546875, -0.3597412109375, -0.274932861328125, -0.19012451171875, -0.105316162109375, -0.0205078125, 0.064300537109375, 0.14910888671875, 0.233917236328125, 0.3187255859375, 0.403533935546875, 0.48834228515625, 0.573150634765625, 0.657958984375, 0.742767333984375, 0.82757568359375, 0.912384033203125, 0.9971923828125, 1.082000732421875, 1.16680908203125, 1.251617431640625, 1.33642578125, 1.421234130859375, 1.50604248046875, 1.590850830078125, 1.6756591796875, 1.760467529296875, 1.84527587890625, 1.930084228515625, 2.014892578125, 2.099700927734375, 2.18450927734375, 2.269317626953125, 2.3541259765625, 2.438934326171875, 2.52374267578125, 2.608551025390625, 2.693359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 9.0, 11.0, 25.0, 47.0, 131.0, 293.0, 279.0, 122.0, 46.0, 22.0, 13.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002815723419189453, -0.0002578906714916229, -0.00023420900106430054, -0.00021052733063697815, -0.00018684566020965576, -0.00016316398978233337, -0.00013948231935501099, -0.0001158006489276886, -9.211897850036621e-05, -6.843730807304382e-05, -4.4755637645721436e-05, -2.1073967218399048e-05, 2.60770320892334e-06, 2.6289373636245728e-05, 4.9971044063568115e-05, 7.36527144908905e-05, 9.733438491821289e-05, 0.00012101605534553528, 0.00014469772577285767, 0.00016837939620018005, 0.00019206106662750244, 0.00021574273705482483, 0.00023942440748214722, 0.0002631060779094696, 0.000286787748336792, 0.0003104694187641144, 0.00033415108919143677, 0.00035783275961875916, 0.00038151443004608154, 0.00040519610047340393, 0.0004288777709007263, 0.0004525594413280487, 0.0004762411117553711, 0.0004999227821826935, 0.0005236044526100159, 0.0005472861230373383, 0.0005709677934646606, 0.000594649463891983, 0.0006183311343193054, 0.0006420128047466278, 0.0006656944751739502, 0.0006893761456012726, 0.000713057816028595, 0.0007367394864559174, 0.0007604211568832397, 0.0007841028273105621, 0.0008077844977378845, 0.0008314661681652069, 0.0008551478385925293, 0.0008788295090198517, 0.0009025111794471741, 0.0009261928498744965, 0.0009498745203018188, 0.0009735561907291412, 0.0009972378611564636, 0.001020919531583786, 0.0010446012020111084, 0.0010682828724384308, 0.0010919645428657532, 0.0011156462132930756, 0.001139327883720398, 0.0011630095541477203, 0.0011866912245750427, 0.0012103728950023651, 0.0012340545654296875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 2.0, 11.0, 9.0, 16.0, 23.0, 39.0, 83.0, 159.0, 328.0, 794.0, 2304.0, 11165.0, 210017.0, 790817.0, 26684.0, 3969.0, 1235.0, 465.0, 184.0, 102.0, 51.0, 33.0, 21.0, 19.0, 11.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6171875, -2.5133056640625, -2.409423828125, -2.3055419921875, -2.20166015625, -2.0977783203125, -1.993896484375, -1.8900146484375, -1.7861328125, -1.6822509765625, -1.578369140625, -1.4744873046875, -1.37060546875, -1.2667236328125, -1.162841796875, -1.0589599609375, -0.955078125, -0.8511962890625, -0.747314453125, -0.6434326171875, -0.53955078125, -0.4356689453125, -0.331787109375, -0.2279052734375, -0.1240234375, -0.0201416015625, 0.083740234375, 0.1876220703125, 0.29150390625, 0.3953857421875, 0.499267578125, 0.6031494140625, 0.70703125, 0.8109130859375, 0.914794921875, 1.0186767578125, 1.12255859375, 1.2264404296875, 1.330322265625, 1.4342041015625, 1.5380859375, 1.6419677734375, 1.745849609375, 1.8497314453125, 1.95361328125, 2.0574951171875, 2.161376953125, 2.2652587890625, 2.369140625, 2.4730224609375, 2.576904296875, 2.6807861328125, 2.78466796875, 2.8885498046875, 2.992431640625, 3.0963134765625, 3.2001953125, 3.3040771484375, 3.407958984375, 3.5118408203125, 3.61572265625, 3.7196044921875, 3.823486328125, 3.9273681640625, 4.03125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 3.0, 5.0, 7.0, 12.0, 21.0, 33.0, 45.0, 45.0, 103.0, 144.0, 188.0, 142.0, 75.0, 59.0, 43.0, 22.0, 13.0, 11.0, 7.0, 4.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7470703125, -0.7165374755859375, -0.686004638671875, -0.6554718017578125, -0.62493896484375, -0.5944061279296875, -0.563873291015625, -0.5333404541015625, -0.5028076171875, -0.4722747802734375, -0.441741943359375, -0.4112091064453125, -0.38067626953125, -0.3501434326171875, -0.319610595703125, -0.2890777587890625, -0.258544921875, -0.2280120849609375, -0.197479248046875, -0.1669464111328125, -0.13641357421875, -0.1058807373046875, -0.075347900390625, -0.0448150634765625, -0.0142822265625, 0.0162506103515625, 0.046783447265625, 0.0773162841796875, 0.10784912109375, 0.1383819580078125, 0.168914794921875, 0.1994476318359375, 0.22998046875, 0.2605133056640625, 0.291046142578125, 0.3215789794921875, 0.35211181640625, 0.3826446533203125, 0.413177490234375, 0.4437103271484375, 0.4742431640625, 0.5047760009765625, 0.535308837890625, 0.5658416748046875, 0.59637451171875, 0.6269073486328125, 0.657440185546875, 0.6879730224609375, 0.718505859375, 0.7490386962890625, 0.779571533203125, 0.8101043701171875, 0.84063720703125, 0.8711700439453125, 0.901702880859375, 0.9322357177734375, 0.9627685546875, 0.9933013916015625, 1.023834228515625, 1.0543670654296875, 1.08489990234375, 1.1154327392578125, 1.145965576171875, 1.1764984130859375, 1.20703125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 22.0, 102.0, 320.0, 352.0, 169.0, 44.0, 5.0, 2.0], "bins": [-188.10671997070312, -184.927978515625, -181.74923706054688, -178.57049560546875, -175.39175415039062, -172.2130126953125, -169.03427124023438, -165.85552978515625, -162.67678833007812, -159.498046875, -156.31930541992188, -153.14056396484375, -149.96182250976562, -146.7830810546875, -143.60433959960938, -140.42559814453125, -137.24685668945312, -134.068115234375, -130.88937377929688, -127.71063232421875, -124.53189086914062, -121.3531494140625, -118.17440795898438, -114.99566650390625, -111.81694030761719, -108.63819885253906, -105.45945739746094, -102.28071594238281, -99.10197448730469, -95.92323303222656, -92.74449157714844, -89.56575012207031, -86.38700103759766, -83.20825958251953, -80.0295181274414, -76.85077667236328, -73.67203521728516, -70.49329376220703, -67.31455993652344, -64.13581848144531, -60.95707321166992, -57.7783317565918, -54.59959030151367, -51.42085266113281, -48.24211120605469, -45.06336975097656, -41.88462829589844, -38.70588684082031, -35.52714538574219, -32.34840393066406, -29.169662475585938, -25.990922927856445, -22.81218147277832, -19.633440017700195, -16.454700469970703, -13.275959014892578, -10.09721851348877, -6.918477535247803, -3.739736557006836, -0.5609960556030273, 2.6177453994750977, 5.796486854553223, 8.975226402282715, 12.15396785736084, 15.332709312438965]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 10.0, 12.0, 12.0, 7.0, 18.0, 20.0, 23.0, 29.0, 21.0, 32.0, 35.0, 34.0, 41.0, 40.0, 55.0, 47.0, 49.0, 39.0, 44.0, 30.0, 37.0, 41.0, 36.0, 45.0, 27.0, 26.0, 33.0, 23.0, 19.0, 23.0, 19.0, 18.0, 14.0, 11.0, 7.0, 1.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.14498901367188, -81.6260757446289, -79.10716247558594, -76.58824920654297, -74.0693359375, -71.55043029785156, -69.03150939941406, -66.51260375976562, -63.993690490722656, -61.47477722167969, -58.95586395263672, -56.43695068359375, -53.91804122924805, -51.39912796020508, -48.88021469116211, -46.361305236816406, -43.84238815307617, -41.3234748840332, -38.804561614990234, -36.28565216064453, -33.76673889160156, -31.247825622558594, -28.728912353515625, -26.21000099182129, -23.69108772277832, -21.17217445373535, -18.653263092041016, -16.134349822998047, -13.615437507629395, -11.096525192260742, -8.577611923217773, -6.0587005615234375, -3.5397872924804688, -1.0208747386932373, 1.4980378150939941, 4.016950607299805, 6.535862922668457, 9.05477523803711, 11.573688507080078, 14.092599868774414, 16.611513137817383, 19.13042640686035, 21.649337768554688, 24.168251037597656, 26.687164306640625, 29.20607566833496, 31.72498893737793, 34.243900299072266, 36.762813568115234, 39.2817268371582, 41.80064010620117, 44.319549560546875, 46.838462829589844, 49.35737609863281, 51.87628936767578, 54.39520263671875, 56.91411590576172, 59.43302917480469, 61.951942443847656, 64.47085571289062, 66.9897689819336, 69.50868225097656, 72.027587890625, 74.54650115966797, 77.06541442871094]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 11.0, 8.0, 7.0, 6.0, 11.0, 17.0, 24.0, 22.0, 32.0, 38.0, 59.0, 84.0, 182.0, 509.0, 2254.0, 13034.0, 160856.0, 2960734.0, 1003521.0, 45654.0, 5426.0, 1102.0, 283.0, 127.0, 63.0, 41.0, 33.0, 22.0, 22.0, 18.0, 20.0, 13.0, 12.0, 14.0, 10.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.546875, -26.77685546875, -26.0068359375, -25.23681640625, -24.466796875, -23.69677734375, -22.9267578125, -22.15673828125, -21.38671875, -20.61669921875, -19.8466796875, -19.07666015625, -18.306640625, -17.53662109375, -16.7666015625, -15.99658203125, -15.2265625, -14.45654296875, -13.6865234375, -12.91650390625, -12.146484375, -11.37646484375, -10.6064453125, -9.83642578125, -9.06640625, -8.29638671875, -7.5263671875, -6.75634765625, -5.986328125, -5.21630859375, -4.4462890625, -3.67626953125, -2.90625, -2.13623046875, -1.3662109375, -0.59619140625, 0.173828125, 0.94384765625, 1.7138671875, 2.48388671875, 3.25390625, 4.02392578125, 4.7939453125, 5.56396484375, 6.333984375, 7.10400390625, 7.8740234375, 8.64404296875, 9.4140625, 10.18408203125, 10.9541015625, 11.72412109375, 12.494140625, 13.26416015625, 14.0341796875, 14.80419921875, 15.57421875, 16.34423828125, 17.1142578125, 17.88427734375, 18.654296875, 19.42431640625, 20.1943359375, 20.96435546875, 21.734375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 5.0, 11.0, 5.0, 13.0, 22.0, 15.0, 25.0, 23.0, 35.0, 32.0, 35.0, 39.0, 46.0, 53.0, 53.0, 46.0, 32.0, 55.0, 47.0, 55.0, 44.0, 42.0, 36.0, 36.0, 36.0, 24.0, 21.0, 22.0, 23.0, 9.0, 12.0, 12.0, 6.0, 6.0, 4.0, 7.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3828125, -10.0447998046875, -9.706787109375, -9.3687744140625, -9.03076171875, -8.6927490234375, -8.354736328125, -8.0167236328125, -7.6787109375, -7.3406982421875, -7.002685546875, -6.6646728515625, -6.32666015625, -5.9886474609375, -5.650634765625, -5.3126220703125, -4.974609375, -4.6365966796875, -4.298583984375, -3.9605712890625, -3.62255859375, -3.2845458984375, -2.946533203125, -2.6085205078125, -2.2705078125, -1.9324951171875, -1.594482421875, -1.2564697265625, -0.91845703125, -0.5804443359375, -0.242431640625, 0.0955810546875, 0.43359375, 0.7716064453125, 1.109619140625, 1.4476318359375, 1.78564453125, 2.1236572265625, 2.461669921875, 2.7996826171875, 3.1376953125, 3.4757080078125, 3.813720703125, 4.1517333984375, 4.48974609375, 4.8277587890625, 5.165771484375, 5.5037841796875, 5.841796875, 6.1798095703125, 6.517822265625, 6.8558349609375, 7.19384765625, 7.5318603515625, 7.869873046875, 8.2078857421875, 8.5458984375, 8.8839111328125, 9.221923828125, 9.5599365234375, 9.89794921875, 10.2359619140625, 10.573974609375, 10.9119873046875, 11.25]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 1.0, 7.0, 12.0, 18.0, 54.0, 230.0, 4162233.0, 31401.0, 211.0, 54.0, 22.0, 15.0, 8.0, 8.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-495.5, -485.158203125, -474.81640625, -464.474609375, -454.1328125, -443.791015625, -433.44921875, -423.107421875, -412.765625, -402.423828125, -392.08203125, -381.740234375, -371.3984375, -361.056640625, -350.71484375, -340.373046875, -330.03125, -319.689453125, -309.34765625, -299.005859375, -288.6640625, -278.322265625, -267.98046875, -257.638671875, -247.296875, -236.955078125, -226.61328125, -216.271484375, -205.9296875, -195.587890625, -185.24609375, -174.904296875, -164.5625, -154.220703125, -143.87890625, -133.537109375, -123.1953125, -112.853515625, -102.51171875, -92.169921875, -81.828125, -71.486328125, -61.14453125, -50.802734375, -40.4609375, -30.119140625, -19.77734375, -9.435546875, 0.90625, 11.248046875, 21.58984375, 31.931640625, 42.2734375, 52.615234375, 62.95703125, 73.298828125, 83.640625, 93.982421875, 104.32421875, 114.666015625, 125.0078125, 135.349609375, 145.69140625, 156.033203125, 166.375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 12.0, 17.0, 14.0, 27.0, 20.0, 36.0, 52.0, 96.0, 119.0, 154.0, 252.0, 314.0, 450.0, 657.0, 501.0, 369.0, 281.0, 190.0, 135.0, 94.0, 71.0, 68.0, 38.0, 25.0, 13.0, 22.0, 8.0, 11.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.01171875, -3.89605712890625, -3.7803955078125, -3.66473388671875, -3.549072265625, -3.43341064453125, -3.3177490234375, -3.20208740234375, -3.08642578125, -2.97076416015625, -2.8551025390625, -2.73944091796875, -2.623779296875, -2.50811767578125, -2.3924560546875, -2.27679443359375, -2.1611328125, -2.04547119140625, -1.9298095703125, -1.81414794921875, -1.698486328125, -1.58282470703125, -1.4671630859375, -1.35150146484375, -1.23583984375, -1.12017822265625, -1.0045166015625, -0.88885498046875, -0.773193359375, -0.65753173828125, -0.5418701171875, -0.42620849609375, -0.310546875, -0.19488525390625, -0.0792236328125, 0.03643798828125, 0.152099609375, 0.26776123046875, 0.3834228515625, 0.49908447265625, 0.61474609375, 0.73040771484375, 0.8460693359375, 0.96173095703125, 1.077392578125, 1.19305419921875, 1.3087158203125, 1.42437744140625, 1.5400390625, 1.65570068359375, 1.7713623046875, 1.88702392578125, 2.002685546875, 2.11834716796875, 2.2340087890625, 2.34967041015625, 2.46533203125, 2.58099365234375, 2.6966552734375, 2.81231689453125, 2.927978515625, 3.04364013671875, 3.1593017578125, 3.27496337890625, 3.390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 10.0, 11.0, 11.0, 11.0, 16.0, 22.0, 34.0, 55.0, 61.0, 60.0, 78.0, 94.0, 66.0, 101.0, 83.0, 61.0, 53.0, 46.0, 39.0, 28.0, 16.0, 13.0, 10.0, 10.0, 4.0, 2.0, 8.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.826425552368164, -20.323572158813477, -19.82071876525879, -19.31786346435547, -18.81501007080078, -18.312156677246094, -17.809303283691406, -17.30644989013672, -16.8035945892334, -16.30074119567871, -15.797886848449707, -15.29503345489502, -14.792179107666016, -14.289325714111328, -13.78647232055664, -13.283617973327637, -12.78076457977295, -12.277911186218262, -11.775056838989258, -11.27220344543457, -10.769349098205566, -10.266495704650879, -9.763641357421875, -9.260787963867188, -8.7579345703125, -8.255081176757812, -7.752226829528809, -7.249373435974121, -6.746519088745117, -6.24366569519043, -5.740811824798584, -5.237957954406738, -4.735103607177734, -4.232249736785889, -3.729395866394043, -3.2265422344207764, -2.7236883640289307, -2.220834493637085, -1.7179808616638184, -1.2151269912719727, -0.712273120880127, -0.20941931009292603, 0.2934345006942749, 0.796288251876831, 1.2991421222686768, 1.8019959926605225, 2.304849624633789, 2.8077034950256348, 3.3105573654174805, 3.813411235809326, 4.316265106201172, 4.819118499755859, 5.321972846984863, 5.824826240539551, 6.3276801109313965, 6.830533981323242, 7.333387851715088, 7.836241722106934, 8.339095115661621, 8.841949462890625, 9.344802856445312, 9.847657203674316, 10.350510597229004, 10.853364944458008, 11.356218338012695]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 1.0, 5.0, 4.0, 16.0, 12.0, 12.0, 22.0, 18.0, 13.0, 26.0, 21.0, 28.0, 29.0, 37.0, 33.0, 39.0, 37.0, 59.0, 47.0, 51.0, 38.0, 42.0, 49.0, 39.0, 46.0, 35.0, 32.0, 31.0, 25.0, 23.0, 23.0, 17.0, 19.0, 11.0, 15.0, 12.0, 5.0, 7.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.021855354309082, -9.70553970336914, -9.389225006103516, -9.072909355163574, -8.75659465789795, -8.440279006958008, -8.123964309692383, -7.807648658752441, -7.491333484649658, -7.175018310546875, -6.858703136444092, -6.542387962341309, -6.226072311401367, -5.909757614135742, -5.593441963195801, -5.277126789093018, -4.960811614990234, -4.644496440887451, -4.328181266784668, -4.011866092681885, -3.6955506801605225, -3.3792355060577393, -3.062920093536377, -2.7466049194335938, -2.4302897453308105, -2.1139745712280273, -1.7976592779159546, -1.4813439846038818, -1.1650288105010986, -0.8487136363983154, -0.5323983430862427, -0.21608304977416992, 0.10023117065429688, 0.41654640436172485, 0.7328616380691528, 1.0491769313812256, 1.3654921054840088, 1.681807279586792, 1.9981225728988647, 2.3144378662109375, 2.6307530403137207, 2.947068214416504, 3.263383388519287, 3.5796988010406494, 3.8960139751434326, 4.212328910827637, 4.528644561767578, 4.844959735870361, 5.1612749099731445, 5.477590084075928, 5.793905258178711, 6.110220432281494, 6.426535606384277, 6.742851257324219, 7.059166431427002, 7.375481605529785, 7.691796779632568, 8.008111953735352, 8.324427604675293, 8.640742301940918, 8.95705795288086, 9.273372650146484, 9.589688301086426, 9.906003952026367, 10.222318649291992]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 8.0, 13.0, 15.0, 22.0, 34.0, 35.0, 65.0, 112.0, 183.0, 275.0, 426.0, 613.0, 958.0, 1564.0, 2484.0, 4356.0, 7634.0, 14858.0, 29853.0, 61864.0, 131716.0, 259073.0, 266066.0, 136998.0, 64096.0, 30419.0, 15253.0, 7989.0, 4512.0, 2677.0, 1564.0, 959.0, 668.0, 379.0, 286.0, 169.0, 112.0, 72.0, 57.0, 30.0, 25.0, 30.0, 13.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.7109375, -3.595062255859375, -3.47918701171875, -3.363311767578125, -3.2474365234375, -3.131561279296875, -3.01568603515625, -2.899810791015625, -2.783935546875, -2.668060302734375, -2.55218505859375, -2.436309814453125, -2.3204345703125, -2.204559326171875, -2.08868408203125, -1.972808837890625, -1.85693359375, -1.741058349609375, -1.62518310546875, -1.509307861328125, -1.3934326171875, -1.277557373046875, -1.16168212890625, -1.045806884765625, -0.929931640625, -0.814056396484375, -0.69818115234375, -0.582305908203125, -0.4664306640625, -0.350555419921875, -0.23468017578125, -0.118804931640625, -0.0029296875, 0.112945556640625, 0.22882080078125, 0.344696044921875, 0.4605712890625, 0.576446533203125, 0.69232177734375, 0.808197021484375, 0.924072265625, 1.039947509765625, 1.15582275390625, 1.271697998046875, 1.3875732421875, 1.503448486328125, 1.61932373046875, 1.735198974609375, 1.85107421875, 1.966949462890625, 2.08282470703125, 2.198699951171875, 2.3145751953125, 2.430450439453125, 2.54632568359375, 2.662200927734375, 2.778076171875, 2.893951416015625, 3.00982666015625, 3.125701904296875, 3.2415771484375, 3.357452392578125, 3.47332763671875, 3.589202880859375, 3.705078125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 0.0, 3.0, 7.0, 4.0, 8.0, 6.0, 8.0, 8.0, 12.0, 12.0, 17.0, 30.0, 35.0, 23.0, 28.0, 30.0, 42.0, 41.0, 32.0, 40.0, 49.0, 58.0, 58.0, 45.0, 51.0, 40.0, 49.0, 33.0, 35.0, 34.0, 23.0, 22.0, 19.0, 15.0, 19.0, 16.0, 10.0, 11.0, 7.0, 3.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.1953125, -6.9837646484375, -6.772216796875, -6.5606689453125, -6.34912109375, -6.1375732421875, -5.926025390625, -5.7144775390625, -5.5029296875, -5.2913818359375, -5.079833984375, -4.8682861328125, -4.65673828125, -4.4451904296875, -4.233642578125, -4.0220947265625, -3.810546875, -3.5989990234375, -3.387451171875, -3.1759033203125, -2.96435546875, -2.7528076171875, -2.541259765625, -2.3297119140625, -2.1181640625, -1.9066162109375, -1.695068359375, -1.4835205078125, -1.27197265625, -1.0604248046875, -0.848876953125, -0.6373291015625, -0.42578125, -0.2142333984375, -0.002685546875, 0.2088623046875, 0.42041015625, 0.6319580078125, 0.843505859375, 1.0550537109375, 1.2666015625, 1.4781494140625, 1.689697265625, 1.9012451171875, 2.11279296875, 2.3243408203125, 2.535888671875, 2.7474365234375, 2.958984375, 3.1705322265625, 3.382080078125, 3.5936279296875, 3.80517578125, 4.0167236328125, 4.228271484375, 4.4398193359375, 4.6513671875, 4.8629150390625, 5.074462890625, 5.2860107421875, 5.49755859375, 5.7091064453125, 5.920654296875, 6.1322021484375, 6.34375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 0.0, 5.0, 1.0, 6.0, 7.0, 5.0, 6.0, 19.0, 22.0, 34.0, 48.0, 67.0, 81.0, 158.0, 243.0, 441.0, 908.0, 2134.0, 5594.0, 18600.0, 73573.0, 325759.0, 464002.0, 115825.0, 27724.0, 8077.0, 2752.0, 1133.0, 545.0, 266.0, 178.0, 97.0, 68.0, 54.0, 33.0, 26.0, 9.0, 12.0, 13.0, 11.0, 9.0, 5.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.95703125, -5.75946044921875, -5.5618896484375, -5.36431884765625, -5.166748046875, -4.96917724609375, -4.7716064453125, -4.57403564453125, -4.37646484375, -4.17889404296875, -3.9813232421875, -3.78375244140625, -3.586181640625, -3.38861083984375, -3.1910400390625, -2.99346923828125, -2.7958984375, -2.59832763671875, -2.4007568359375, -2.20318603515625, -2.005615234375, -1.80804443359375, -1.6104736328125, -1.41290283203125, -1.21533203125, -1.01776123046875, -0.8201904296875, -0.62261962890625, -0.425048828125, -0.22747802734375, -0.0299072265625, 0.16766357421875, 0.365234375, 0.56280517578125, 0.7603759765625, 0.95794677734375, 1.155517578125, 1.35308837890625, 1.5506591796875, 1.74822998046875, 1.94580078125, 2.14337158203125, 2.3409423828125, 2.53851318359375, 2.736083984375, 2.93365478515625, 3.1312255859375, 3.32879638671875, 3.5263671875, 3.72393798828125, 3.9215087890625, 4.11907958984375, 4.316650390625, 4.51422119140625, 4.7117919921875, 4.90936279296875, 5.10693359375, 5.30450439453125, 5.5020751953125, 5.69964599609375, 5.897216796875, 6.09478759765625, 6.2923583984375, 6.48992919921875, 6.6875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 1.0, 7.0, 6.0, 12.0, 15.0, 21.0, 16.0, 23.0, 27.0, 39.0, 36.0, 48.0, 44.0, 53.0, 57.0, 60.0, 46.0, 49.0, 52.0, 49.0, 57.0, 56.0, 35.0, 43.0, 32.0, 24.0, 19.0, 12.0, 15.0, 12.0, 8.0, 8.0, 11.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.4609375, -14.978759765625, -14.49658203125, -14.014404296875, -13.5322265625, -13.050048828125, -12.56787109375, -12.085693359375, -11.603515625, -11.121337890625, -10.63916015625, -10.156982421875, -9.6748046875, -9.192626953125, -8.71044921875, -8.228271484375, -7.74609375, -7.263916015625, -6.78173828125, -6.299560546875, -5.8173828125, -5.335205078125, -4.85302734375, -4.370849609375, -3.888671875, -3.406494140625, -2.92431640625, -2.442138671875, -1.9599609375, -1.477783203125, -0.99560546875, -0.513427734375, -0.03125, 0.450927734375, 0.93310546875, 1.415283203125, 1.8974609375, 2.379638671875, 2.86181640625, 3.343994140625, 3.826171875, 4.308349609375, 4.79052734375, 5.272705078125, 5.7548828125, 6.237060546875, 6.71923828125, 7.201416015625, 7.68359375, 8.165771484375, 8.64794921875, 9.130126953125, 9.6123046875, 10.094482421875, 10.57666015625, 11.058837890625, 11.541015625, 12.023193359375, 12.50537109375, 12.987548828125, 13.4697265625, 13.951904296875, 14.43408203125, 14.916259765625, 15.3984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 9.0, 9.0, 11.0, 30.0, 35.0, 36.0, 33.0, 91.0, 145.0, 188.0, 318.0, 519.0, 997.0, 1919.0, 3835.0, 9309.0, 27229.0, 94863.0, 384620.0, 385062.0, 94960.0, 26776.0, 9421.0, 3883.0, 1862.0, 950.0, 523.0, 325.0, 175.0, 125.0, 83.0, 68.0, 38.0, 29.0, 25.0, 13.0, 11.0, 5.0, 6.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.8779296875, -1.817352294921875, -1.75677490234375, -1.696197509765625, -1.6356201171875, -1.575042724609375, -1.51446533203125, -1.453887939453125, -1.393310546875, -1.332733154296875, -1.27215576171875, -1.211578369140625, -1.1510009765625, -1.090423583984375, -1.02984619140625, -0.969268798828125, -0.90869140625, -0.848114013671875, -0.78753662109375, -0.726959228515625, -0.6663818359375, -0.605804443359375, -0.54522705078125, -0.484649658203125, -0.424072265625, -0.363494873046875, -0.30291748046875, -0.242340087890625, -0.1817626953125, -0.121185302734375, -0.06060791015625, -3.0517578125e-05, 0.060546875, 0.121124267578125, 0.18170166015625, 0.242279052734375, 0.3028564453125, 0.363433837890625, 0.42401123046875, 0.484588623046875, 0.545166015625, 0.605743408203125, 0.66632080078125, 0.726898193359375, 0.7874755859375, 0.848052978515625, 0.90863037109375, 0.969207763671875, 1.02978515625, 1.090362548828125, 1.15093994140625, 1.211517333984375, 1.2720947265625, 1.332672119140625, 1.39324951171875, 1.453826904296875, 1.514404296875, 1.574981689453125, 1.63555908203125, 1.696136474609375, 1.7567138671875, 1.817291259765625, 1.87786865234375, 1.938446044921875, 1.9990234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 3.0, 12.0, 6.0, 8.0, 7.0, 16.0, 18.0, 21.0, 26.0, 36.0, 45.0, 73.0, 83.0, 97.0, 95.0, 102.0, 71.0, 70.0, 47.0, 33.0, 29.0, 30.0, 22.0, 9.0, 13.0, 8.0, 10.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008492469787597656, -0.0008194372057914734, -0.0007896274328231812, -0.0007598176598548889, -0.0007300078868865967, -0.0007001981139183044, -0.0006703883409500122, -0.00064057856798172, -0.0006107687950134277, -0.0005809590220451355, -0.0005511492490768433, -0.000521339476108551, -0.0004915297031402588, -0.00046171993017196655, -0.0004319101572036743, -0.0004021003842353821, -0.00037229061126708984, -0.0003424808382987976, -0.00031267106533050537, -0.00028286129236221313, -0.0002530515193939209, -0.00022324174642562866, -0.00019343197345733643, -0.0001636222004890442, -0.00013381242752075195, -0.00010400265455245972, -7.419288158416748e-05, -4.4383108615875244e-05, -1.4573335647583008e-05, 1.5236437320709229e-05, 4.5046210289001465e-05, 7.48559832572937e-05, 0.00010466575622558594, 0.00013447552919387817, 0.0001642853021621704, 0.00019409507513046265, 0.00022390484809875488, 0.0002537146210670471, 0.00028352439403533936, 0.0003133341670036316, 0.00034314393997192383, 0.00037295371294021606, 0.0004027634859085083, 0.00043257325887680054, 0.0004623830318450928, 0.000492192804813385, 0.0005220025777816772, 0.0005518123507499695, 0.0005816221237182617, 0.000611431896686554, 0.0006412416696548462, 0.0006710514426231384, 0.0007008612155914307, 0.0007306709885597229, 0.0007604807615280151, 0.0007902905344963074, 0.0008201003074645996, 0.0008499100804328918, 0.0008797198534011841, 0.0009095296263694763, 0.0009393393993377686, 0.0009691491723060608, 0.000998958945274353, 0.0010287687182426453, 0.0010585784912109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 6.0, 6.0, 1.0, 5.0, 9.0, 9.0, 8.0, 21.0, 23.0, 36.0, 45.0, 97.0, 313.0, 7452.0, 976569.0, 62967.0, 694.0, 125.0, 58.0, 32.0, 23.0, 16.0, 7.0, 8.0, 8.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.890625, -11.5478515625, -11.205078125, -10.8623046875, -10.51953125, -10.1767578125, -9.833984375, -9.4912109375, -9.1484375, -8.8056640625, -8.462890625, -8.1201171875, -7.77734375, -7.4345703125, -7.091796875, -6.7490234375, -6.40625, -6.0634765625, -5.720703125, -5.3779296875, -5.03515625, -4.6923828125, -4.349609375, -4.0068359375, -3.6640625, -3.3212890625, -2.978515625, -2.6357421875, -2.29296875, -1.9501953125, -1.607421875, -1.2646484375, -0.921875, -0.5791015625, -0.236328125, 0.1064453125, 0.44921875, 0.7919921875, 1.134765625, 1.4775390625, 1.8203125, 2.1630859375, 2.505859375, 2.8486328125, 3.19140625, 3.5341796875, 3.876953125, 4.2197265625, 4.5625, 4.9052734375, 5.248046875, 5.5908203125, 5.93359375, 6.2763671875, 6.619140625, 6.9619140625, 7.3046875, 7.6474609375, 7.990234375, 8.3330078125, 8.67578125, 9.0185546875, 9.361328125, 9.7041015625, 10.046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 5.0, 3.0, 5.0, 7.0, 13.0, 8.0, 14.0, 16.0, 20.0, 17.0, 32.0, 34.0, 37.0, 51.0, 53.0, 60.0, 73.0, 71.0, 56.0, 69.0, 44.0, 59.0, 45.0, 38.0, 32.0, 36.0, 20.0, 25.0, 12.0, 7.0, 10.0, 5.0, 10.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57373046875, -0.5552444458007812, -0.5367584228515625, -0.5182723999023438, -0.499786376953125, -0.48130035400390625, -0.4628143310546875, -0.44432830810546875, -0.42584228515625, -0.40735626220703125, -0.3888702392578125, -0.37038421630859375, -0.351898193359375, -0.33341217041015625, -0.3149261474609375, -0.29644012451171875, -0.2779541015625, -0.25946807861328125, -0.2409820556640625, -0.22249603271484375, -0.204010009765625, -0.18552398681640625, -0.1670379638671875, -0.14855194091796875, -0.13006591796875, -0.11157989501953125, -0.0930938720703125, -0.07460784912109375, -0.056121826171875, -0.03763580322265625, -0.0191497802734375, -0.00066375732421875, 0.017822265625, 0.03630828857421875, 0.0547943115234375, 0.07328033447265625, 0.091766357421875, 0.11025238037109375, 0.1287384033203125, 0.14722442626953125, 0.16571044921875, 0.18419647216796875, 0.2026824951171875, 0.22116851806640625, 0.239654541015625, 0.25814056396484375, 0.2766265869140625, 0.29511260986328125, 0.3135986328125, 0.33208465576171875, 0.3505706787109375, 0.36905670166015625, 0.387542724609375, 0.40602874755859375, 0.4245147705078125, 0.44300079345703125, 0.46148681640625, 0.47997283935546875, 0.4984588623046875, 0.5169448852539062, 0.535430908203125, 0.5539169311523438, 0.5724029541015625, 0.5908889770507812, 0.609375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 13.0, 26.0, 29.0, 51.0, 82.0, 144.0, 167.0, 140.0, 110.0, 93.0, 62.0, 29.0, 26.0, 13.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.05207633972168, -21.527015686035156, -21.001955032348633, -20.476892471313477, -19.951831817626953, -19.42677116394043, -18.901710510253906, -18.37664794921875, -17.851587295532227, -17.326526641845703, -16.80146598815918, -16.276403427124023, -15.7513427734375, -15.226282119750977, -14.701221466064453, -14.176159858703613, -13.65109920501709, -13.126038551330566, -12.600976943969727, -12.075916290283203, -11.550854682922363, -11.02579402923584, -10.500732421875, -9.975671768188477, -9.450611114501953, -8.92555046081543, -8.40048885345459, -7.875428199768066, -7.350366592407227, -6.825305938720703, -6.3002448081970215, -5.77518367767334, -5.2501220703125, -4.725060939788818, -4.199999809265137, -3.674938917160034, -3.1498777866363525, -2.624816656112671, -2.0997557640075684, -1.5746946334838867, -1.049633502960205, -0.5245724320411682, 0.0004886388778686523, 0.5255496501922607, 1.0506107807159424, 1.575671911239624, 2.1007328033447266, 2.625793933868408, 3.15085506439209, 3.6759161949157715, 4.200977325439453, 4.726037979125977, 5.251099586486816, 5.77616024017334, 6.3012213706970215, 6.826282501220703, 7.351343631744385, 7.876404762268066, 8.40146541595459, 8.92652702331543, 9.451587677001953, 9.976649284362793, 10.501709938049316, 11.026771545410156, 11.55183219909668]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 0.0, 6.0, 0.0, 8.0, 8.0, 9.0, 9.0, 10.0, 7.0, 14.0, 17.0, 23.0, 17.0, 30.0, 26.0, 35.0, 37.0, 33.0, 36.0, 47.0, 40.0, 48.0, 59.0, 52.0, 35.0, 49.0, 38.0, 48.0, 30.0, 29.0, 25.0, 23.0, 24.0, 18.0, 25.0, 14.0, 13.0, 16.0, 12.0, 7.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.825225353240967, -5.630563259124756, -5.435900688171387, -5.241238594055176, -5.046576499938965, -4.851914405822754, -4.657252311706543, -4.462589740753174, -4.267927646636963, -4.073265552520752, -3.878603219985962, -3.683940887451172, -3.489278793334961, -3.29461669921875, -3.09995436668396, -2.90529203414917, -2.710629940032959, -2.515967845916748, -2.321305513381958, -2.126643180847168, -1.931981086730957, -1.7373188734054565, -1.542656660079956, -1.3479944467544556, -1.153332233428955, -0.9586700201034546, -0.7640078067779541, -0.5693455934524536, -0.3746833801269531, -0.18002116680145264, 0.014641046524047852, 0.20930325984954834, 0.40396595001220703, 0.5986281633377075, 0.793290376663208, 0.9879525899887085, 1.182614803314209, 1.3772770166397095, 1.57193922996521, 1.7666014432907104, 1.961263656616211, 2.155925750732422, 2.350588083267212, 2.545250415802002, 2.739912509918213, 2.934574604034424, 3.129236936569214, 3.323899269104004, 3.518561363220215, 3.713223457336426, 3.907885789871216, 4.102548122406006, 4.297210216522217, 4.491872310638428, 4.686534881591797, 4.881196975708008, 5.075859069824219, 5.27052116394043, 5.465183258056641, 5.65984582901001, 5.854507923126221, 6.049170017242432, 6.243832588195801, 6.438494682312012, 6.633156776428223]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 6.0, 3.0, 5.0, 15.0, 11.0, 15.0, 36.0, 24.0, 49.0, 61.0, 73.0, 131.0, 189.0, 322.0, 453.0, 823.0, 1495.0, 2640.0, 5209.0, 11074.0, 24462.0, 57652.0, 152290.0, 370313.0, 257420.0, 93286.0, 37608.0, 16462.0, 7692.0, 3782.0, 1999.0, 1113.0, 677.0, 378.0, 240.0, 178.0, 116.0, 77.0, 55.0, 34.0, 24.0, 23.0, 19.0, 8.0, 9.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.3671875, -4.24505615234375, -4.1229248046875, -4.00079345703125, -3.878662109375, -3.75653076171875, -3.6343994140625, -3.51226806640625, -3.39013671875, -3.26800537109375, -3.1458740234375, -3.02374267578125, -2.901611328125, -2.77947998046875, -2.6573486328125, -2.53521728515625, -2.4130859375, -2.29095458984375, -2.1688232421875, -2.04669189453125, -1.924560546875, -1.80242919921875, -1.6802978515625, -1.55816650390625, -1.43603515625, -1.31390380859375, -1.1917724609375, -1.06964111328125, -0.947509765625, -0.82537841796875, -0.7032470703125, -0.58111572265625, -0.458984375, -0.33685302734375, -0.2147216796875, -0.09259033203125, 0.029541015625, 0.15167236328125, 0.2738037109375, 0.39593505859375, 0.51806640625, 0.64019775390625, 0.7623291015625, 0.88446044921875, 1.006591796875, 1.12872314453125, 1.2508544921875, 1.37298583984375, 1.4951171875, 1.61724853515625, 1.7393798828125, 1.86151123046875, 1.983642578125, 2.10577392578125, 2.2279052734375, 2.35003662109375, 2.47216796875, 2.59429931640625, 2.7164306640625, 2.83856201171875, 2.960693359375, 3.08282470703125, 3.2049560546875, 3.32708740234375, 3.44921875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 7.0, 5.0, 9.0, 10.0, 6.0, 16.0, 12.0, 12.0, 22.0, 30.0, 28.0, 32.0, 31.0, 35.0, 46.0, 33.0, 53.0, 37.0, 56.0, 43.0, 44.0, 57.0, 42.0, 53.0, 32.0, 36.0, 24.0, 29.0, 26.0, 20.0, 19.0, 23.0, 16.0, 5.0, 12.0, 9.0, 6.0, 2.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.625, -19.95947265625, -19.2939453125, -18.62841796875, -17.962890625, -17.29736328125, -16.6318359375, -15.96630859375, -15.30078125, -14.63525390625, -13.9697265625, -13.30419921875, -12.638671875, -11.97314453125, -11.3076171875, -10.64208984375, -9.9765625, -9.31103515625, -8.6455078125, -7.97998046875, -7.314453125, -6.64892578125, -5.9833984375, -5.31787109375, -4.65234375, -3.98681640625, -3.3212890625, -2.65576171875, -1.990234375, -1.32470703125, -0.6591796875, 0.00634765625, 0.671875, 1.33740234375, 2.0029296875, 2.66845703125, 3.333984375, 3.99951171875, 4.6650390625, 5.33056640625, 5.99609375, 6.66162109375, 7.3271484375, 7.99267578125, 8.658203125, 9.32373046875, 9.9892578125, 10.65478515625, 11.3203125, 11.98583984375, 12.6513671875, 13.31689453125, 13.982421875, 14.64794921875, 15.3134765625, 15.97900390625, 16.64453125, 17.31005859375, 17.9755859375, 18.64111328125, 19.306640625, 19.97216796875, 20.6376953125, 21.30322265625, 21.96875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 11.0, 8.0, 10.0, 8.0, 17.0, 21.0, 23.0, 23.0, 32.0, 31.0, 37.0, 63.0, 42.0, 66.0, 135.0, 2808.0, 1044440.0, 307.0, 86.0, 59.0, 50.0, 36.0, 33.0, 32.0, 34.0, 24.0, 26.0, 17.0, 15.0, 13.0, 10.0, 7.0, 4.0, 4.0, 3.0, 1.0, 6.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0], "bins": [-101.0, -98.2138671875, -95.427734375, -92.6416015625, -89.85546875, -87.0693359375, -84.283203125, -81.4970703125, -78.7109375, -75.9248046875, -73.138671875, -70.3525390625, -67.56640625, -64.7802734375, -61.994140625, -59.2080078125, -56.421875, -53.6357421875, -50.849609375, -48.0634765625, -45.27734375, -42.4912109375, -39.705078125, -36.9189453125, -34.1328125, -31.3466796875, -28.560546875, -25.7744140625, -22.98828125, -20.2021484375, -17.416015625, -14.6298828125, -11.84375, -9.0576171875, -6.271484375, -3.4853515625, -0.69921875, 2.0869140625, 4.873046875, 7.6591796875, 10.4453125, 13.2314453125, 16.017578125, 18.8037109375, 21.58984375, 24.3759765625, 27.162109375, 29.9482421875, 32.734375, 35.5205078125, 38.306640625, 41.0927734375, 43.87890625, 46.6650390625, 49.451171875, 52.2373046875, 55.0234375, 57.8095703125, 60.595703125, 63.3818359375, 66.16796875, 68.9541015625, 71.740234375, 74.5263671875, 77.3125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 5.0, 10.0, 9.0, 10.0, 13.0, 14.0, 19.0, 22.0, 23.0, 31.0, 33.0, 40.0, 59.0, 43.0, 41.0, 47.0, 62.0, 56.0, 42.0, 54.0, 49.0, 39.0, 43.0, 31.0, 25.0, 39.0, 29.0, 26.0, 15.0, 15.0, 13.0, 11.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-33.40625, -32.48583984375, -31.5654296875, -30.64501953125, -29.724609375, -28.80419921875, -27.8837890625, -26.96337890625, -26.04296875, -25.12255859375, -24.2021484375, -23.28173828125, -22.361328125, -21.44091796875, -20.5205078125, -19.60009765625, -18.6796875, -17.75927734375, -16.8388671875, -15.91845703125, -14.998046875, -14.07763671875, -13.1572265625, -12.23681640625, -11.31640625, -10.39599609375, -9.4755859375, -8.55517578125, -7.634765625, -6.71435546875, -5.7939453125, -4.87353515625, -3.953125, -3.03271484375, -2.1123046875, -1.19189453125, -0.271484375, 0.64892578125, 1.5693359375, 2.48974609375, 3.41015625, 4.33056640625, 5.2509765625, 6.17138671875, 7.091796875, 8.01220703125, 8.9326171875, 9.85302734375, 10.7734375, 11.69384765625, 12.6142578125, 13.53466796875, 14.455078125, 15.37548828125, 16.2958984375, 17.21630859375, 18.13671875, 19.05712890625, 19.9775390625, 20.89794921875, 21.818359375, 22.73876953125, 23.6591796875, 24.57958984375, 25.5]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 3.0, 0.0, 5.0, 8.0, 4.0, 8.0, 12.0, 31.0, 37.0, 42.0, 139.0, 457.0, 2752.0, 58706.0, 964868.0, 19470.0, 1497.0, 273.0, 94.0, 49.0, 24.0, 13.0, 17.0, 8.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.9453125, -7.69976806640625, -7.4542236328125, -7.20867919921875, -6.963134765625, -6.71759033203125, -6.4720458984375, -6.22650146484375, -5.98095703125, -5.73541259765625, -5.4898681640625, -5.24432373046875, -4.998779296875, -4.75323486328125, -4.5076904296875, -4.26214599609375, -4.0166015625, -3.77105712890625, -3.5255126953125, -3.27996826171875, -3.034423828125, -2.78887939453125, -2.5433349609375, -2.29779052734375, -2.05224609375, -1.80670166015625, -1.5611572265625, -1.31561279296875, -1.070068359375, -0.82452392578125, -0.5789794921875, -0.33343505859375, -0.087890625, 0.15765380859375, 0.4031982421875, 0.64874267578125, 0.894287109375, 1.13983154296875, 1.3853759765625, 1.63092041015625, 1.87646484375, 2.12200927734375, 2.3675537109375, 2.61309814453125, 2.858642578125, 3.10418701171875, 3.3497314453125, 3.59527587890625, 3.8408203125, 4.08636474609375, 4.3319091796875, 4.57745361328125, 4.822998046875, 5.06854248046875, 5.3140869140625, 5.55963134765625, 5.80517578125, 6.05072021484375, 6.2962646484375, 6.54180908203125, 6.787353515625, 7.03289794921875, 7.2784423828125, 7.52398681640625, 7.76953125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 12.0, 5.0, 9.0, 14.0, 18.0, 25.0, 30.0, 37.0, 68.0, 79.0, 110.0, 173.0, 138.0, 75.0, 60.0, 36.0, 21.0, 28.0, 15.0, 13.0, 15.0, 9.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003542900085449219, -0.0003418922424316406, -0.0003294944763183594, -0.0003170967102050781, -0.0003046989440917969, -0.0002923011779785156, -0.0002799034118652344, -0.0002675056457519531, -0.0002551078796386719, -0.00024271011352539062, -0.00023031234741210938, -0.00021791458129882812, -0.00020551681518554688, -0.00019311904907226562, -0.00018072128295898438, -0.00016832351684570312, -0.00015592575073242188, -0.00014352798461914062, -0.00013113021850585938, -0.00011873245239257812, -0.00010633468627929688, -9.393692016601562e-05, -8.153915405273438e-05, -6.914138793945312e-05, -5.6743621826171875e-05, -4.4345855712890625e-05, -3.1948089599609375e-05, -1.9550323486328125e-05, -7.152557373046875e-06, 5.245208740234375e-06, 1.7642974853515625e-05, 3.0040740966796875e-05, 4.2438507080078125e-05, 5.4836273193359375e-05, 6.723403930664062e-05, 7.963180541992188e-05, 9.202957153320312e-05, 0.00010442733764648438, 0.00011682510375976562, 0.00012922286987304688, 0.00014162063598632812, 0.00015401840209960938, 0.00016641616821289062, 0.00017881393432617188, 0.00019121170043945312, 0.00020360946655273438, 0.00021600723266601562, 0.00022840499877929688, 0.00024080276489257812, 0.0002532005310058594, 0.0002655982971191406, 0.0002779960632324219, 0.0002903938293457031, 0.0003027915954589844, 0.0003151893615722656, 0.0003275871276855469, 0.0003399848937988281, 0.0003523826599121094, 0.0003647804260253906, 0.0003771781921386719, 0.0003895759582519531, 0.0004019737243652344, 0.0004143714904785156, 0.0004267692565917969, 0.0004391670227050781]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 10.0, 13.0, 10.0, 22.0, 23.0, 36.0, 85.0, 223.0, 873.0, 4644.0, 54946.0, 917692.0, 63496.0, 5124.0, 904.0, 229.0, 95.0, 40.0, 26.0, 19.0, 14.0, 9.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65234375, -4.4769287109375, -4.301513671875, -4.1260986328125, -3.95068359375, -3.7752685546875, -3.599853515625, -3.4244384765625, -3.2490234375, -3.0736083984375, -2.898193359375, -2.7227783203125, -2.54736328125, -2.3719482421875, -2.196533203125, -2.0211181640625, -1.845703125, -1.6702880859375, -1.494873046875, -1.3194580078125, -1.14404296875, -0.9686279296875, -0.793212890625, -0.6177978515625, -0.4423828125, -0.2669677734375, -0.091552734375, 0.0838623046875, 0.25927734375, 0.4346923828125, 0.610107421875, 0.7855224609375, 0.9609375, 1.1363525390625, 1.311767578125, 1.4871826171875, 1.66259765625, 1.8380126953125, 2.013427734375, 2.1888427734375, 2.3642578125, 2.5396728515625, 2.715087890625, 2.8905029296875, 3.06591796875, 3.2413330078125, 3.416748046875, 3.5921630859375, 3.767578125, 3.9429931640625, 4.118408203125, 4.2938232421875, 4.46923828125, 4.6446533203125, 4.820068359375, 4.9954833984375, 5.1708984375, 5.3463134765625, 5.521728515625, 5.6971435546875, 5.87255859375, 6.0479736328125, 6.223388671875, 6.3988037109375, 6.57421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 4.0, 15.0, 10.0, 17.0, 17.0, 22.0, 26.0, 54.0, 61.0, 102.0, 183.0, 188.0, 77.0, 65.0, 28.0, 24.0, 19.0, 16.0, 14.0, 6.0, 12.0, 14.0, 2.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2666015625, -1.2282867431640625, -1.189971923828125, -1.1516571044921875, -1.11334228515625, -1.0750274658203125, -1.036712646484375, -0.9983978271484375, -0.9600830078125, -0.9217681884765625, -0.883453369140625, -0.8451385498046875, -0.80682373046875, -0.7685089111328125, -0.730194091796875, -0.6918792724609375, -0.653564453125, -0.6152496337890625, -0.576934814453125, -0.5386199951171875, -0.50030517578125, -0.4619903564453125, -0.423675537109375, -0.3853607177734375, -0.3470458984375, -0.3087310791015625, -0.270416259765625, -0.2321014404296875, -0.19378662109375, -0.1554718017578125, -0.117156982421875, -0.0788421630859375, -0.04052734375, -0.0022125244140625, 0.036102294921875, 0.0744171142578125, 0.11273193359375, 0.1510467529296875, 0.189361572265625, 0.2276763916015625, 0.2659912109375, 0.3043060302734375, 0.342620849609375, 0.3809356689453125, 0.41925048828125, 0.4575653076171875, 0.495880126953125, 0.5341949462890625, 0.572509765625, 0.6108245849609375, 0.649139404296875, 0.6874542236328125, 0.72576904296875, 0.7640838623046875, 0.802398681640625, 0.8407135009765625, 0.8790283203125, 0.9173431396484375, 0.955657958984375, 0.9939727783203125, 1.03228759765625, 1.0706024169921875, 1.108917236328125, 1.1472320556640625, 1.185546875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 16.0, 64.0, 167.0, 390.0, 246.0, 90.0, 26.0, 10.0, 2.0, 3.0], "bins": [-143.51739501953125, -141.02890014648438, -138.54042053222656, -136.0519256591797, -133.5634307861328, -131.07493591308594, -128.58645629882812, -126.09796142578125, -123.60946655273438, -121.12097930908203, -118.63248443603516, -116.14399719238281, -113.65550231933594, -111.1670150756836, -108.67852020263672, -106.19003295898438, -103.70154571533203, -101.21305847167969, -98.72456359863281, -96.23607635498047, -93.7475814819336, -91.25909423828125, -88.77059936523438, -86.28211212158203, -83.79362487792969, -81.30513763427734, -78.81664276123047, -76.32815551757812, -73.83966064453125, -71.3511734008789, -68.86267852783203, -66.37419128417969, -63.88569259643555, -61.39720153808594, -58.90871047973633, -56.42021942138672, -53.931732177734375, -51.4432373046875, -48.954750061035156, -46.46625900268555, -43.97776794433594, -41.48927688598633, -39.00078582763672, -36.51229476928711, -34.0238037109375, -31.535314559936523, -29.046825408935547, -26.558334350585938, -24.069843292236328, -21.58135223388672, -19.09286117553711, -16.604372024536133, -14.115880966186523, -11.627389907836914, -9.138899803161621, -6.650409698486328, -4.161918640136719, -1.6734280586242676, 0.8150625228881836, 3.3035531044006348, 5.792043685913086, 8.280534744262695, 10.769024848937988, 13.257514953613281, 15.74600601196289]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 8.0, 6.0, 3.0, 7.0, 6.0, 13.0, 11.0, 11.0, 14.0, 14.0, 20.0, 26.0, 38.0, 25.0, 38.0, 35.0, 49.0, 32.0, 33.0, 36.0, 36.0, 40.0, 56.0, 42.0, 34.0, 42.0, 30.0, 38.0, 31.0, 30.0, 34.0, 22.0, 20.0, 19.0, 17.0, 18.0, 12.0, 14.0, 9.0, 9.0, 6.0, 5.0, 7.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.784635543823242, -28.812204360961914, -27.839773178100586, -26.867341995239258, -25.894912719726562, -24.922481536865234, -23.950050354003906, -22.977619171142578, -22.00518798828125, -21.032756805419922, -20.060325622558594, -19.087894439697266, -18.115463256835938, -17.14303207397461, -16.170602798461914, -15.198171615600586, -14.225740432739258, -13.25330924987793, -12.280878067016602, -11.30844783782959, -10.336016654968262, -9.363585472106934, -8.391155242919922, -7.418724060058594, -6.446292877197266, -5.4738616943359375, -4.501430988311768, -3.5290000438690186, -2.5565690994262695, -1.5841379165649414, -0.6117072105407715, 0.36072349548339844, 1.3331565856933594, 2.3055875301361084, 3.2780184745788574, 4.250449180603027, 5.2228803634643555, 6.195311546325684, 7.1677422523498535, 8.140172958374023, 9.112604141235352, 10.08503532409668, 11.057466506958008, 12.02989673614502, 13.002327919006348, 13.974759101867676, 14.947189331054688, 15.919620513916016, 16.892051696777344, 17.864482879638672, 18.8369140625, 19.809345245361328, 20.781776428222656, 21.754207611083984, 22.72663688659668, 23.699068069458008, 24.671499252319336, 25.643930435180664, 26.616361618041992, 27.58879280090332, 28.561222076416016, 29.533653259277344, 30.506084442138672, 31.478515625, 32.45094680786133]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 3.0, 6.0, 6.0, 14.0, 8.0, 12.0, 12.0, 18.0, 18.0, 30.0, 38.0, 67.0, 84.0, 166.0, 473.0, 1697.0, 8852.0, 90682.0, 2373960.0, 1645922.0, 62748.0, 7138.0, 1454.0, 407.0, 163.0, 87.0, 49.0, 37.0, 26.0, 26.0, 17.0, 12.0, 4.0, 9.0, 11.0, 6.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.265625, -23.550537109375, -22.83544921875, -22.120361328125, -21.4052734375, -20.690185546875, -19.97509765625, -19.260009765625, -18.544921875, -17.829833984375, -17.11474609375, -16.399658203125, -15.6845703125, -14.969482421875, -14.25439453125, -13.539306640625, -12.82421875, -12.109130859375, -11.39404296875, -10.678955078125, -9.9638671875, -9.248779296875, -8.53369140625, -7.818603515625, -7.103515625, -6.388427734375, -5.67333984375, -4.958251953125, -4.2431640625, -3.528076171875, -2.81298828125, -2.097900390625, -1.3828125, -0.667724609375, 0.04736328125, 0.762451171875, 1.4775390625, 2.192626953125, 2.90771484375, 3.622802734375, 4.337890625, 5.052978515625, 5.76806640625, 6.483154296875, 7.1982421875, 7.913330078125, 8.62841796875, 9.343505859375, 10.05859375, 10.773681640625, 11.48876953125, 12.203857421875, 12.9189453125, 13.634033203125, 14.34912109375, 15.064208984375, 15.779296875, 16.494384765625, 17.20947265625, 17.924560546875, 18.6396484375, 19.354736328125, 20.06982421875, 20.784912109375, 21.5]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 9.0, 10.0, 15.0, 16.0, 27.0, 22.0, 28.0, 30.0, 41.0, 38.0, 47.0, 55.0, 63.0, 69.0, 43.0, 47.0, 56.0, 55.0, 40.0, 44.0, 38.0, 32.0, 26.0, 25.0, 21.0, 19.0, 12.0, 10.0, 7.0, 10.0, 7.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3984375, -7.1390380859375, -6.879638671875, -6.6202392578125, -6.36083984375, -6.1014404296875, -5.842041015625, -5.5826416015625, -5.3232421875, -5.0638427734375, -4.804443359375, -4.5450439453125, -4.28564453125, -4.0262451171875, -3.766845703125, -3.5074462890625, -3.248046875, -2.9886474609375, -2.729248046875, -2.4698486328125, -2.21044921875, -1.9510498046875, -1.691650390625, -1.4322509765625, -1.1728515625, -0.9134521484375, -0.654052734375, -0.3946533203125, -0.13525390625, 0.1241455078125, 0.383544921875, 0.6429443359375, 0.90234375, 1.1617431640625, 1.421142578125, 1.6805419921875, 1.93994140625, 2.1993408203125, 2.458740234375, 2.7181396484375, 2.9775390625, 3.2369384765625, 3.496337890625, 3.7557373046875, 4.01513671875, 4.2745361328125, 4.533935546875, 4.7933349609375, 5.052734375, 5.3121337890625, 5.571533203125, 5.8309326171875, 6.09033203125, 6.3497314453125, 6.609130859375, 6.8685302734375, 7.1279296875, 7.3873291015625, 7.646728515625, 7.9061279296875, 8.16552734375, 8.4249267578125, 8.684326171875, 8.9437255859375, 9.203125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 5.0, 3.0, 7.0, 4.0, 16.0, 15.0, 29.0, 49.0, 109.0, 259.0, 953.0, 89561.0, 4099361.0, 3122.0, 434.0, 160.0, 66.0, 38.0, 16.0, 16.0, 9.0, 8.0, 10.0, 6.0, 5.0, 1.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-75.8125, -73.384765625, -70.95703125, -68.529296875, -66.1015625, -63.673828125, -61.24609375, -58.818359375, -56.390625, -53.962890625, -51.53515625, -49.107421875, -46.6796875, -44.251953125, -41.82421875, -39.396484375, -36.96875, -34.541015625, -32.11328125, -29.685546875, -27.2578125, -24.830078125, -22.40234375, -19.974609375, -17.546875, -15.119140625, -12.69140625, -10.263671875, -7.8359375, -5.408203125, -2.98046875, -0.552734375, 1.875, 4.302734375, 6.73046875, 9.158203125, 11.5859375, 14.013671875, 16.44140625, 18.869140625, 21.296875, 23.724609375, 26.15234375, 28.580078125, 31.0078125, 33.435546875, 35.86328125, 38.291015625, 40.71875, 43.146484375, 45.57421875, 48.001953125, 50.4296875, 52.857421875, 55.28515625, 57.712890625, 60.140625, 62.568359375, 64.99609375, 67.423828125, 69.8515625, 72.279296875, 74.70703125, 77.134765625, 79.5625]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 1.0, 7.0, 12.0, 12.0, 11.0, 24.0, 29.0, 30.0, 42.0, 57.0, 75.0, 115.0, 146.0, 197.0, 296.0, 451.0, 568.0, 516.0, 419.0, 315.0, 198.0, 149.0, 99.0, 89.0, 51.0, 52.0, 26.0, 30.0, 19.0, 7.0, 11.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.392578125, -3.282867431640625, -3.17315673828125, -3.063446044921875, -2.9537353515625, -2.844024658203125, -2.73431396484375, -2.624603271484375, -2.514892578125, -2.405181884765625, -2.29547119140625, -2.185760498046875, -2.0760498046875, -1.966339111328125, -1.85662841796875, -1.746917724609375, -1.63720703125, -1.527496337890625, -1.41778564453125, -1.308074951171875, -1.1983642578125, -1.088653564453125, -0.97894287109375, -0.869232177734375, -0.759521484375, -0.649810791015625, -0.54010009765625, -0.430389404296875, -0.3206787109375, -0.210968017578125, -0.10125732421875, 0.008453369140625, 0.1181640625, 0.227874755859375, 0.33758544921875, 0.447296142578125, 0.5570068359375, 0.666717529296875, 0.77642822265625, 0.886138916015625, 0.995849609375, 1.105560302734375, 1.21527099609375, 1.324981689453125, 1.4346923828125, 1.544403076171875, 1.65411376953125, 1.763824462890625, 1.87353515625, 1.983245849609375, 2.09295654296875, 2.202667236328125, 2.3123779296875, 2.422088623046875, 2.53179931640625, 2.641510009765625, 2.751220703125, 2.860931396484375, 2.97064208984375, 3.080352783203125, 3.1900634765625, 3.299774169921875, 3.40948486328125, 3.519195556640625, 3.62890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 1.0, 6.0, 8.0, 11.0, 14.0, 11.0, 10.0, 16.0, 36.0, 55.0, 60.0, 75.0, 84.0, 83.0, 97.0, 100.0, 69.0, 57.0, 49.0, 29.0, 34.0, 28.0, 18.0, 13.0, 4.0, 13.0, 6.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0], "bins": [-18.161945343017578, -17.72087287902832, -17.27979850769043, -16.838726043701172, -16.397653579711914, -15.95658016204834, -15.515506744384766, -15.074434280395508, -14.63336181640625, -14.192288398742676, -13.751215934753418, -13.310142517089844, -12.869070053100586, -12.427996635437012, -11.986923217773438, -11.54585075378418, -11.104777336120605, -10.663703918457031, -10.222631454467773, -9.7815580368042, -9.340485572814941, -8.899412155151367, -8.45833969116211, -8.017266273498535, -7.576193332672119, -7.135120391845703, -6.694047451019287, -6.252974510192871, -5.811901092529297, -5.370828628540039, -4.929755210876465, -4.488682270050049, -4.047609329223633, -3.606536388397217, -3.165463447570801, -2.7243902683258057, -2.2833173274993896, -1.8422443866729736, -1.4011712074279785, -0.9600982666015625, -0.5190253257751465, -0.0779523253440857, 0.3631206750869751, 0.8041937351226807, 1.2452666759490967, 1.6863396167755127, 2.127412796020508, 2.568485736846924, 3.00955867767334, 3.450631618499756, 3.891704559326172, 4.332777976989746, 4.773850440979004, 5.214923858642578, 5.655996799468994, 6.09706974029541, 6.538142681121826, 6.979215621948242, 7.420288562774658, 7.861361503601074, 8.302434921264648, 8.743507385253906, 9.18458080291748, 9.625654220581055, 10.066726684570312]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 10.0, 3.0, 11.0, 11.0, 8.0, 7.0, 15.0, 19.0, 18.0, 19.0, 24.0, 19.0, 33.0, 31.0, 26.0, 35.0, 32.0, 33.0, 27.0, 55.0, 45.0, 44.0, 36.0, 56.0, 32.0, 39.0, 32.0, 41.0, 32.0, 17.0, 24.0, 26.0, 18.0, 18.0, 21.0, 12.0, 11.0, 10.0, 6.0, 6.0, 10.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.4154462814331055, -7.183505058288574, -6.951563835144043, -6.719622611999512, -6.4876813888549805, -6.255740165710449, -6.023798942565918, -5.791857719421387, -5.5599164962768555, -5.327975273132324, -5.096034049987793, -4.864092826843262, -4.6321516036987305, -4.400210380554199, -4.168269157409668, -3.9363279342651367, -3.7043867111206055, -3.472445487976074, -3.240504264831543, -3.0085630416870117, -2.7766218185424805, -2.544680595397949, -2.312739372253418, -2.0807981491088867, -1.8488569259643555, -1.6169157028198242, -1.384974479675293, -1.1530332565307617, -0.9210920333862305, -0.6891508102416992, -0.45720958709716797, -0.22526836395263672, 0.006672382354736328, 0.23861360549926758, 0.47055482864379883, 0.7024960517883301, 0.9344372749328613, 1.1663784980773926, 1.3983197212219238, 1.630260944366455, 1.8622021675109863, 2.0941433906555176, 2.326084613800049, 2.55802583694458, 2.7899670600891113, 3.0219082832336426, 3.253849506378174, 3.485790729522705, 3.7177319526672363, 3.9496731758117676, 4.181614398956299, 4.41355562210083, 4.645496845245361, 4.877438068389893, 5.109379291534424, 5.341320514678955, 5.573261737823486, 5.805202960968018, 6.037144184112549, 6.26908540725708, 6.501026630401611, 6.732967853546143, 6.964909076690674, 7.196850299835205, 7.428791522979736]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 7.0, 7.0, 12.0, 23.0, 30.0, 79.0, 149.0, 376.0, 924.0, 2771.0, 9257.0, 35537.0, 168465.0, 503785.0, 254606.0, 53764.0, 13090.0, 3621.0, 1219.0, 419.0, 176.0, 102.0, 43.0, 40.0, 16.0, 6.0, 8.0, 5.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.0625, -6.87969970703125, -6.6968994140625, -6.51409912109375, -6.331298828125, -6.14849853515625, -5.9656982421875, -5.78289794921875, -5.60009765625, -5.41729736328125, -5.2344970703125, -5.05169677734375, -4.868896484375, -4.68609619140625, -4.5032958984375, -4.32049560546875, -4.1376953125, -3.95489501953125, -3.7720947265625, -3.58929443359375, -3.406494140625, -3.22369384765625, -3.0408935546875, -2.85809326171875, -2.67529296875, -2.49249267578125, -2.3096923828125, -2.12689208984375, -1.944091796875, -1.76129150390625, -1.5784912109375, -1.39569091796875, -1.212890625, -1.03009033203125, -0.8472900390625, -0.66448974609375, -0.481689453125, -0.29888916015625, -0.1160888671875, 0.06671142578125, 0.24951171875, 0.43231201171875, 0.6151123046875, 0.79791259765625, 0.980712890625, 1.16351318359375, 1.3463134765625, 1.52911376953125, 1.7119140625, 1.89471435546875, 2.0775146484375, 2.26031494140625, 2.443115234375, 2.62591552734375, 2.8087158203125, 2.99151611328125, 3.17431640625, 3.35711669921875, 3.5399169921875, 3.72271728515625, 3.905517578125, 4.08831787109375, 4.2711181640625, 4.45391845703125, 4.63671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 10.0, 5.0, 7.0, 11.0, 15.0, 11.0, 12.0, 16.0, 11.0, 21.0, 19.0, 30.0, 28.0, 38.0, 38.0, 35.0, 38.0, 37.0, 43.0, 48.0, 50.0, 52.0, 59.0, 40.0, 39.0, 33.0, 19.0, 32.0, 36.0, 27.0, 18.0, 21.0, 23.0, 7.0, 11.0, 10.0, 7.0, 8.0, 6.0, 5.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-5.13671875, -4.98577880859375, -4.8348388671875, -4.68389892578125, -4.532958984375, -4.38201904296875, -4.2310791015625, -4.08013916015625, -3.92919921875, -3.77825927734375, -3.6273193359375, -3.47637939453125, -3.325439453125, -3.17449951171875, -3.0235595703125, -2.87261962890625, -2.7216796875, -2.57073974609375, -2.4197998046875, -2.26885986328125, -2.117919921875, -1.96697998046875, -1.8160400390625, -1.66510009765625, -1.51416015625, -1.36322021484375, -1.2122802734375, -1.06134033203125, -0.910400390625, -0.75946044921875, -0.6085205078125, -0.45758056640625, -0.306640625, -0.15570068359375, -0.0047607421875, 0.14617919921875, 0.297119140625, 0.44805908203125, 0.5989990234375, 0.74993896484375, 0.90087890625, 1.05181884765625, 1.2027587890625, 1.35369873046875, 1.504638671875, 1.65557861328125, 1.8065185546875, 1.95745849609375, 2.1083984375, 2.25933837890625, 2.4102783203125, 2.56121826171875, 2.712158203125, 2.86309814453125, 3.0140380859375, 3.16497802734375, 3.31591796875, 3.46685791015625, 3.6177978515625, 3.76873779296875, 3.919677734375, 4.07061767578125, 4.2215576171875, 4.37249755859375, 4.5234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 6.0, 6.0, 5.0, 14.0, 23.0, 26.0, 26.0, 58.0, 79.0, 175.0, 273.0, 442.0, 901.0, 2129.0, 5477.0, 16541.0, 60008.0, 248277.0, 469081.0, 180530.0, 44044.0, 12571.0, 4346.0, 1723.0, 777.0, 383.0, 239.0, 133.0, 70.0, 50.0, 41.0, 21.0, 18.0, 15.0, 15.0, 10.0, 2.0, 3.0, 9.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4140625, -3.28466796875, -3.1552734375, -3.02587890625, -2.896484375, -2.76708984375, -2.6376953125, -2.50830078125, -2.37890625, -2.24951171875, -2.1201171875, -1.99072265625, -1.861328125, -1.73193359375, -1.6025390625, -1.47314453125, -1.34375, -1.21435546875, -1.0849609375, -0.95556640625, -0.826171875, -0.69677734375, -0.5673828125, -0.43798828125, -0.30859375, -0.17919921875, -0.0498046875, 0.07958984375, 0.208984375, 0.33837890625, 0.4677734375, 0.59716796875, 0.7265625, 0.85595703125, 0.9853515625, 1.11474609375, 1.244140625, 1.37353515625, 1.5029296875, 1.63232421875, 1.76171875, 1.89111328125, 2.0205078125, 2.14990234375, 2.279296875, 2.40869140625, 2.5380859375, 2.66748046875, 2.796875, 2.92626953125, 3.0556640625, 3.18505859375, 3.314453125, 3.44384765625, 3.5732421875, 3.70263671875, 3.83203125, 3.96142578125, 4.0908203125, 4.22021484375, 4.349609375, 4.47900390625, 4.6083984375, 4.73779296875, 4.8671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 1.0, 8.0, 6.0, 6.0, 11.0, 11.0, 13.0, 16.0, 20.0, 27.0, 36.0, 44.0, 47.0, 67.0, 59.0, 50.0, 51.0, 48.0, 43.0, 57.0, 57.0, 42.0, 37.0, 36.0, 34.0, 34.0, 27.0, 20.0, 21.0, 16.0, 11.0, 8.0, 18.0, 7.0, 5.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.875, -10.5452880859375, -10.215576171875, -9.8858642578125, -9.55615234375, -9.2264404296875, -8.896728515625, -8.5670166015625, -8.2373046875, -7.9075927734375, -7.577880859375, -7.2481689453125, -6.91845703125, -6.5887451171875, -6.259033203125, -5.9293212890625, -5.599609375, -5.2698974609375, -4.940185546875, -4.6104736328125, -4.28076171875, -3.9510498046875, -3.621337890625, -3.2916259765625, -2.9619140625, -2.6322021484375, -2.302490234375, -1.9727783203125, -1.64306640625, -1.3133544921875, -0.983642578125, -0.6539306640625, -0.32421875, 0.0054931640625, 0.335205078125, 0.6649169921875, 0.99462890625, 1.3243408203125, 1.654052734375, 1.9837646484375, 2.3134765625, 2.6431884765625, 2.972900390625, 3.3026123046875, 3.63232421875, 3.9620361328125, 4.291748046875, 4.6214599609375, 4.951171875, 5.2808837890625, 5.610595703125, 5.9403076171875, 6.27001953125, 6.5997314453125, 6.929443359375, 7.2591552734375, 7.5888671875, 7.9185791015625, 8.248291015625, 8.5780029296875, 8.90771484375, 9.2374267578125, 9.567138671875, 9.8968505859375, 10.2265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 8.0, 7.0, 14.0, 27.0, 43.0, 63.0, 116.0, 170.0, 382.0, 912.0, 2323.0, 8205.0, 62306.0, 713352.0, 235588.0, 18595.0, 3870.0, 1375.0, 570.0, 274.0, 123.0, 70.0, 58.0, 29.0, 20.0, 11.0, 10.0, 9.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.22265625, -3.1177978515625, -3.012939453125, -2.9080810546875, -2.80322265625, -2.6983642578125, -2.593505859375, -2.4886474609375, -2.3837890625, -2.2789306640625, -2.174072265625, -2.0692138671875, -1.96435546875, -1.8594970703125, -1.754638671875, -1.6497802734375, -1.544921875, -1.4400634765625, -1.335205078125, -1.2303466796875, -1.12548828125, -1.0206298828125, -0.915771484375, -0.8109130859375, -0.7060546875, -0.6011962890625, -0.496337890625, -0.3914794921875, -0.28662109375, -0.1817626953125, -0.076904296875, 0.0279541015625, 0.1328125, 0.2376708984375, 0.342529296875, 0.4473876953125, 0.55224609375, 0.6571044921875, 0.761962890625, 0.8668212890625, 0.9716796875, 1.0765380859375, 1.181396484375, 1.2862548828125, 1.39111328125, 1.4959716796875, 1.600830078125, 1.7056884765625, 1.810546875, 1.9154052734375, 2.020263671875, 2.1251220703125, 2.22998046875, 2.3348388671875, 2.439697265625, 2.5445556640625, 2.6494140625, 2.7542724609375, 2.859130859375, 2.9639892578125, 3.06884765625, 3.1737060546875, 3.278564453125, 3.3834228515625, 3.48828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 6.0, 5.0, 5.0, 7.0, 11.0, 12.0, 23.0, 43.0, 53.0, 92.0, 116.0, 130.0, 129.0, 127.0, 75.0, 65.0, 31.0, 24.0, 16.0, 9.0, 4.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0011396408081054688, -0.0011003464460372925, -0.0010610520839691162, -0.00102175772190094, -0.0009824633598327637, -0.0009431689977645874, -0.0009038746356964111, -0.0008645802736282349, -0.0008252859115600586, -0.0007859915494918823, -0.0007466971874237061, -0.0007074028253555298, -0.0006681084632873535, -0.0006288141012191772, -0.000589519739151001, -0.0005502253770828247, -0.0005109310150146484, -0.00047163665294647217, -0.0004323422908782959, -0.00039304792881011963, -0.00035375356674194336, -0.0003144592046737671, -0.0002751648426055908, -0.00023587048053741455, -0.00019657611846923828, -0.000157281756401062, -0.00011798739433288574, -7.869303226470947e-05, -3.93986701965332e-05, -1.043081283569336e-07, 3.9190053939819336e-05, 7.84844160079956e-05, 0.00011777877807617188, 0.00015707314014434814, 0.00019636750221252441, 0.00023566186428070068, 0.00027495622634887695, 0.0003142505884170532, 0.0003535449504852295, 0.00039283931255340576, 0.00043213367462158203, 0.0004714280366897583, 0.0005107223987579346, 0.0005500167608261108, 0.0005893111228942871, 0.0006286054849624634, 0.0006678998470306396, 0.0007071942090988159, 0.0007464885711669922, 0.0007857829332351685, 0.0008250772953033447, 0.000864371657371521, 0.0009036660194396973, 0.0009429603815078735, 0.0009822547435760498, 0.001021549105644226, 0.0010608434677124023, 0.0011001378297805786, 0.0011394321918487549, 0.0011787265539169312, 0.0012180209159851074, 0.0012573152780532837, 0.00129660964012146, 0.0013359040021896362, 0.0013751983642578125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 8.0, 10.0, 5.0, 14.0, 13.0, 27.0, 44.0, 47.0, 81.0, 131.0, 209.0, 353.0, 645.0, 1261.0, 2829.0, 7339.0, 26327.0, 143718.0, 570404.0, 238391.0, 39777.0, 10030.0, 3492.0, 1551.0, 776.0, 412.0, 236.0, 140.0, 96.0, 60.0, 31.0, 25.0, 16.0, 16.0, 9.0, 7.0, 11.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.068359375, -1.998565673828125, -1.92877197265625, -1.858978271484375, -1.7891845703125, -1.719390869140625, -1.64959716796875, -1.579803466796875, -1.510009765625, -1.440216064453125, -1.37042236328125, -1.300628662109375, -1.2308349609375, -1.161041259765625, -1.09124755859375, -1.021453857421875, -0.95166015625, -0.881866455078125, -0.81207275390625, -0.742279052734375, -0.6724853515625, -0.602691650390625, -0.53289794921875, -0.463104248046875, -0.393310546875, -0.323516845703125, -0.25372314453125, -0.183929443359375, -0.1141357421875, -0.044342041015625, 0.02545166015625, 0.095245361328125, 0.1650390625, 0.234832763671875, 0.30462646484375, 0.374420166015625, 0.4442138671875, 0.514007568359375, 0.58380126953125, 0.653594970703125, 0.723388671875, 0.793182373046875, 0.86297607421875, 0.932769775390625, 1.0025634765625, 1.072357177734375, 1.14215087890625, 1.211944580078125, 1.28173828125, 1.351531982421875, 1.42132568359375, 1.491119384765625, 1.5609130859375, 1.630706787109375, 1.70050048828125, 1.770294189453125, 1.840087890625, 1.909881591796875, 1.97967529296875, 2.049468994140625, 2.1192626953125, 2.189056396484375, 2.25885009765625, 2.328643798828125, 2.3984375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 7.0, 9.0, 13.0, 10.0, 32.0, 38.0, 53.0, 60.0, 76.0, 97.0, 95.0, 103.0, 103.0, 83.0, 64.0, 32.0, 35.0, 27.0, 16.0, 13.0, 8.0, 5.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50537109375, -0.4886016845703125, -0.471832275390625, -0.4550628662109375, -0.43829345703125, -0.4215240478515625, -0.404754638671875, -0.3879852294921875, -0.3712158203125, -0.3544464111328125, -0.337677001953125, -0.3209075927734375, -0.30413818359375, -0.2873687744140625, -0.270599365234375, -0.2538299560546875, -0.237060546875, -0.2202911376953125, -0.203521728515625, -0.1867523193359375, -0.16998291015625, -0.1532135009765625, -0.136444091796875, -0.1196746826171875, -0.1029052734375, -0.0861358642578125, -0.069366455078125, -0.0525970458984375, -0.03582763671875, -0.0190582275390625, -0.002288818359375, 0.0144805908203125, 0.03125, 0.0480194091796875, 0.064788818359375, 0.0815582275390625, 0.09832763671875, 0.1150970458984375, 0.131866455078125, 0.1486358642578125, 0.1654052734375, 0.1821746826171875, 0.198944091796875, 0.2157135009765625, 0.23248291015625, 0.2492523193359375, 0.266021728515625, 0.2827911376953125, 0.299560546875, 0.3163299560546875, 0.333099365234375, 0.3498687744140625, 0.36663818359375, 0.3834075927734375, 0.400177001953125, 0.4169464111328125, 0.4337158203125, 0.4504852294921875, 0.467254638671875, 0.4840240478515625, 0.50079345703125, 0.5175628662109375, 0.534332275390625, 0.5511016845703125, 0.56787109375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 5.0, 10.0, 16.0, 12.0, 27.0, 55.0, 66.0, 86.0, 145.0, 141.0, 108.0, 112.0, 58.0, 48.0, 30.0, 21.0, 15.0, 7.0, 8.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.878320693969727, -13.53606128692627, -13.193801879882812, -12.851542472839355, -12.509283065795898, -12.167024612426758, -11.8247652053833, -11.482505798339844, -11.140246391296387, -10.79798698425293, -10.455727577209473, -10.113468170166016, -9.771209716796875, -9.428950309753418, -9.086690902709961, -8.744431495666504, -8.402172088623047, -8.05991268157959, -7.717653274536133, -7.375394344329834, -7.033134937286377, -6.69087553024292, -6.348616600036621, -6.006357192993164, -5.664097785949707, -5.32183837890625, -4.979578971862793, -4.637320041656494, -4.295060634613037, -3.95280122756958, -3.610542058944702, -3.268282890319824, -2.9260244369506836, -2.5837650299072266, -2.2415058612823486, -1.8992465734481812, -1.5569872856140137, -1.2147279977798462, -0.8724687099456787, -0.5302095413208008, -0.18795013427734375, 0.15430915355682373, 0.4965684413909912, 0.8388277292251587, 1.1810870170593262, 1.5233463048934937, 1.8656055927276611, 2.207864761352539, 2.550124168395996, 2.892383575439453, 3.234642744064331, 3.576901912689209, 3.919161319732666, 4.261420726776123, 4.603679656982422, 4.945939064025879, 5.288198471069336, 5.630457878112793, 5.97271728515625, 6.314976215362549, 6.657235622406006, 6.999495029449463, 7.341753959655762, 7.684013366699219, 8.026272773742676]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 11.0, 8.0, 11.0, 5.0, 9.0, 14.0, 22.0, 16.0, 20.0, 30.0, 22.0, 25.0, 30.0, 30.0, 33.0, 48.0, 34.0, 33.0, 39.0, 64.0, 49.0, 44.0, 39.0, 47.0, 43.0, 29.0, 34.0, 28.0, 31.0, 19.0, 16.0, 15.0, 24.0, 17.0, 7.0, 7.0, 11.0, 7.0, 3.0, 5.0, 6.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-5.043096542358398, -4.896683216094971, -4.750269889831543, -4.603856563568115, -4.4574432373046875, -4.31102991104126, -4.164616584777832, -4.018202781677246, -3.8717896938323975, -3.7253763675689697, -3.578963041305542, -3.4325497150421143, -3.2861361503601074, -3.1397228240966797, -2.993309497833252, -2.846896171569824, -2.7004828453063965, -2.5540695190429688, -2.407656192779541, -2.2612428665161133, -2.1148295402526855, -1.9684160947799683, -1.822002649307251, -1.6755893230438232, -1.5291759967803955, -1.3827626705169678, -1.23634934425354, -1.0899358987808228, -0.943522572517395, -0.7971092462539673, -0.6506958603858948, -0.5042824745178223, -0.35786962509155273, -0.2114562690258026, -0.06504291296005249, 0.08137044310569763, 0.22778379917144775, 0.3741971254348755, 0.520610511302948, 0.6670238971710205, 0.8134372234344482, 0.959850549697876, 1.1062638759613037, 1.252677321434021, 1.3990906476974487, 1.5455039739608765, 1.6919174194335938, 1.8383307456970215, 1.9847440719604492, 2.131157398223877, 2.2775707244873047, 2.4239840507507324, 2.57039737701416, 2.716810703277588, 2.8632242679595947, 3.0096375942230225, 3.15605092048645, 3.302464246749878, 3.4488775730133057, 3.5952908992767334, 3.7417044639587402, 3.888117790222168, 4.034531116485596, 4.180944442749023, 4.327357769012451]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 6.0, 16.0, 13.0, 24.0, 31.0, 41.0, 63.0, 108.0, 193.0, 285.0, 501.0, 927.0, 1844.0, 3813.0, 8564.0, 21260.0, 59661.0, 196359.0, 465008.0, 193828.0, 58797.0, 20966.0, 8550.0, 3758.0, 1825.0, 872.0, 483.0, 268.0, 170.0, 109.0, 58.0, 51.0, 36.0, 18.0, 11.0, 5.0, 12.0, 10.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.00390625, -3.8582763671875, -3.712646484375, -3.5670166015625, -3.42138671875, -3.2757568359375, -3.130126953125, -2.9844970703125, -2.8388671875, -2.6932373046875, -2.547607421875, -2.4019775390625, -2.25634765625, -2.1107177734375, -1.965087890625, -1.8194580078125, -1.673828125, -1.5281982421875, -1.382568359375, -1.2369384765625, -1.09130859375, -0.9456787109375, -0.800048828125, -0.6544189453125, -0.5087890625, -0.3631591796875, -0.217529296875, -0.0718994140625, 0.07373046875, 0.2193603515625, 0.364990234375, 0.5106201171875, 0.65625, 0.8018798828125, 0.947509765625, 1.0931396484375, 1.23876953125, 1.3843994140625, 1.530029296875, 1.6756591796875, 1.8212890625, 1.9669189453125, 2.112548828125, 2.2581787109375, 2.40380859375, 2.5494384765625, 2.695068359375, 2.8406982421875, 2.986328125, 3.1319580078125, 3.277587890625, 3.4232177734375, 3.56884765625, 3.7144775390625, 3.860107421875, 4.0057373046875, 4.1513671875, 4.2969970703125, 4.442626953125, 4.5882568359375, 4.73388671875, 4.8795166015625, 5.025146484375, 5.1707763671875, 5.31640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 9.0, 8.0, 7.0, 10.0, 13.0, 8.0, 13.0, 20.0, 12.0, 19.0, 29.0, 23.0, 43.0, 28.0, 40.0, 45.0, 49.0, 45.0, 40.0, 48.0, 50.0, 56.0, 39.0, 30.0, 48.0, 38.0, 38.0, 35.0, 21.0, 19.0, 17.0, 17.0, 16.0, 10.0, 11.0, 10.0, 10.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.0625, -11.7025146484375, -11.342529296875, -10.9825439453125, -10.62255859375, -10.2625732421875, -9.902587890625, -9.5426025390625, -9.1826171875, -8.8226318359375, -8.462646484375, -8.1026611328125, -7.74267578125, -7.3826904296875, -7.022705078125, -6.6627197265625, -6.302734375, -5.9427490234375, -5.582763671875, -5.2227783203125, -4.86279296875, -4.5028076171875, -4.142822265625, -3.7828369140625, -3.4228515625, -3.0628662109375, -2.702880859375, -2.3428955078125, -1.98291015625, -1.6229248046875, -1.262939453125, -0.9029541015625, -0.54296875, -0.1829833984375, 0.177001953125, 0.5369873046875, 0.89697265625, 1.2569580078125, 1.616943359375, 1.9769287109375, 2.3369140625, 2.6968994140625, 3.056884765625, 3.4168701171875, 3.77685546875, 4.1368408203125, 4.496826171875, 4.8568115234375, 5.216796875, 5.5767822265625, 5.936767578125, 6.2967529296875, 6.65673828125, 7.0167236328125, 7.376708984375, 7.7366943359375, 8.0966796875, 8.4566650390625, 8.816650390625, 9.1766357421875, 9.53662109375, 9.8966064453125, 10.256591796875, 10.6165771484375, 10.9765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 9.0, 6.0, 7.0, 5.0, 7.0, 14.0, 8.0, 12.0, 16.0, 14.0, 19.0, 30.0, 26.0, 21.0, 28.0, 21.0, 38.0, 31.0, 43.0, 38.0, 107.0, 1079.0, 906100.0, 139940.0, 466.0, 73.0, 33.0, 49.0, 40.0, 25.0, 29.0, 25.0, 34.0, 30.0, 21.0, 15.0, 16.0, 23.0, 7.0, 11.0, 8.0, 8.0, 3.0, 6.0, 6.0, 6.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-34.84375, -33.63720703125, -32.4306640625, -31.22412109375, -30.017578125, -28.81103515625, -27.6044921875, -26.39794921875, -25.19140625, -23.98486328125, -22.7783203125, -21.57177734375, -20.365234375, -19.15869140625, -17.9521484375, -16.74560546875, -15.5390625, -14.33251953125, -13.1259765625, -11.91943359375, -10.712890625, -9.50634765625, -8.2998046875, -7.09326171875, -5.88671875, -4.68017578125, -3.4736328125, -2.26708984375, -1.060546875, 0.14599609375, 1.3525390625, 2.55908203125, 3.765625, 4.97216796875, 6.1787109375, 7.38525390625, 8.591796875, 9.79833984375, 11.0048828125, 12.21142578125, 13.41796875, 14.62451171875, 15.8310546875, 17.03759765625, 18.244140625, 19.45068359375, 20.6572265625, 21.86376953125, 23.0703125, 24.27685546875, 25.4833984375, 26.68994140625, 27.896484375, 29.10302734375, 30.3095703125, 31.51611328125, 32.72265625, 33.92919921875, 35.1357421875, 36.34228515625, 37.548828125, 38.75537109375, 39.9619140625, 41.16845703125, 42.375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 10.0, 5.0, 9.0, 9.0, 7.0, 15.0, 5.0, 20.0, 9.0, 26.0, 31.0, 22.0, 24.0, 19.0, 28.0, 37.0, 36.0, 30.0, 37.0, 30.0, 31.0, 45.0, 50.0, 40.0, 29.0, 33.0, 43.0, 33.0, 43.0, 26.0, 26.0, 25.0, 28.0, 15.0, 23.0, 19.0, 14.0, 16.0, 12.0, 11.0, 5.0, 7.0, 5.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.7734375, -9.4359130859375, -9.098388671875, -8.7608642578125, -8.42333984375, -8.0858154296875, -7.748291015625, -7.4107666015625, -7.0732421875, -6.7357177734375, -6.398193359375, -6.0606689453125, -5.72314453125, -5.3856201171875, -5.048095703125, -4.7105712890625, -4.373046875, -4.0355224609375, -3.697998046875, -3.3604736328125, -3.02294921875, -2.6854248046875, -2.347900390625, -2.0103759765625, -1.6728515625, -1.3353271484375, -0.997802734375, -0.6602783203125, -0.32275390625, 0.0147705078125, 0.352294921875, 0.6898193359375, 1.02734375, 1.3648681640625, 1.702392578125, 2.0399169921875, 2.37744140625, 2.7149658203125, 3.052490234375, 3.3900146484375, 3.7275390625, 4.0650634765625, 4.402587890625, 4.7401123046875, 5.07763671875, 5.4151611328125, 5.752685546875, 6.0902099609375, 6.427734375, 6.7652587890625, 7.102783203125, 7.4403076171875, 7.77783203125, 8.1153564453125, 8.452880859375, 8.7904052734375, 9.1279296875, 9.4654541015625, 9.802978515625, 10.1405029296875, 10.47802734375, 10.8155517578125, 11.153076171875, 11.4906005859375, 11.828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 4.0, 9.0, 14.0, 19.0, 32.0, 28.0, 36.0, 107.0, 165.0, 214.0, 500.0, 959.0, 2313.0, 7303.0, 46212.0, 668461.0, 291314.0, 22738.0, 4855.0, 1620.0, 765.0, 389.0, 202.0, 117.0, 64.0, 41.0, 11.0, 21.0, 10.0, 5.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.53125, -3.41290283203125, -3.2945556640625, -3.17620849609375, -3.057861328125, -2.93951416015625, -2.8211669921875, -2.70281982421875, -2.58447265625, -2.46612548828125, -2.3477783203125, -2.22943115234375, -2.111083984375, -1.99273681640625, -1.8743896484375, -1.75604248046875, -1.6376953125, -1.51934814453125, -1.4010009765625, -1.28265380859375, -1.164306640625, -1.04595947265625, -0.9276123046875, -0.80926513671875, -0.69091796875, -0.57257080078125, -0.4542236328125, -0.33587646484375, -0.217529296875, -0.09918212890625, 0.0191650390625, 0.13751220703125, 0.255859375, 0.37420654296875, 0.4925537109375, 0.61090087890625, 0.729248046875, 0.84759521484375, 0.9659423828125, 1.08428955078125, 1.20263671875, 1.32098388671875, 1.4393310546875, 1.55767822265625, 1.676025390625, 1.79437255859375, 1.9127197265625, 2.03106689453125, 2.1494140625, 2.26776123046875, 2.3861083984375, 2.50445556640625, 2.622802734375, 2.74114990234375, 2.8594970703125, 2.97784423828125, 3.09619140625, 3.21453857421875, 3.3328857421875, 3.45123291015625, 3.569580078125, 3.68792724609375, 3.8062744140625, 3.92462158203125, 4.04296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 3.0, 3.0, 13.0, 8.0, 18.0, 16.0, 34.0, 40.0, 36.0, 78.0, 95.0, 146.0, 129.0, 106.0, 69.0, 68.0, 42.0, 28.0, 17.0, 14.0, 7.0, 13.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002453327178955078, -0.00023241713643074036, -0.0002195015549659729, -0.00020658597350120544, -0.000193670392036438, -0.00018075481057167053, -0.00016783922910690308, -0.00015492364764213562, -0.00014200806617736816, -0.0001290924847126007, -0.00011617690324783325, -0.0001032613217830658, -9.034574031829834e-05, -7.743015885353088e-05, -6.451457738876343e-05, -5.159899592399597e-05, -3.8683414459228516e-05, -2.576783299446106e-05, -1.2852251529693604e-05, 6.332993507385254e-08, 1.2978911399841309e-05, 2.5894492864608765e-05, 3.881007432937622e-05, 5.172565579414368e-05, 6.464123725891113e-05, 7.755681872367859e-05, 9.047240018844604e-05, 0.0001033879816532135, 0.00011630356311798096, 0.0001292191445827484, 0.00014213472604751587, 0.00015505030751228333, 0.00016796588897705078, 0.00018088147044181824, 0.0001937970519065857, 0.00020671263337135315, 0.0002196282148361206, 0.00023254379630088806, 0.0002454593777656555, 0.000258374959230423, 0.00027129054069519043, 0.0002842061221599579, 0.00029712170362472534, 0.0003100372850894928, 0.00032295286655426025, 0.0003358684480190277, 0.00034878402948379517, 0.0003616996109485626, 0.0003746151924133301, 0.00038753077387809753, 0.000400446355342865, 0.00041336193680763245, 0.0004262775182723999, 0.00043919309973716736, 0.0004521086812019348, 0.00046502426266670227, 0.0004779398441314697, 0.0004908554255962372, 0.0005037710070610046, 0.0005166865885257721, 0.0005296021699905396, 0.000542517751455307, 0.0005554333329200745, 0.0005683489143848419, 0.0005812644958496094]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 6.0, 5.0, 14.0, 22.0, 28.0, 41.0, 53.0, 103.0, 156.0, 280.0, 478.0, 777.0, 1481.0, 3004.0, 7575.0, 22951.0, 94478.0, 523127.0, 309568.0, 58098.0, 15730.0, 5541.0, 2285.0, 1154.0, 593.0, 392.0, 208.0, 124.0, 77.0, 62.0, 43.0, 32.0, 30.0, 16.0, 8.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.08203125, -2.0145263671875, -1.947021484375, -1.8795166015625, -1.81201171875, -1.7445068359375, -1.677001953125, -1.6094970703125, -1.5419921875, -1.4744873046875, -1.406982421875, -1.3394775390625, -1.27197265625, -1.2044677734375, -1.136962890625, -1.0694580078125, -1.001953125, -0.9344482421875, -0.866943359375, -0.7994384765625, -0.73193359375, -0.6644287109375, -0.596923828125, -0.5294189453125, -0.4619140625, -0.3944091796875, -0.326904296875, -0.2593994140625, -0.19189453125, -0.1243896484375, -0.056884765625, 0.0106201171875, 0.078125, 0.1456298828125, 0.213134765625, 0.2806396484375, 0.34814453125, 0.4156494140625, 0.483154296875, 0.5506591796875, 0.6181640625, 0.6856689453125, 0.753173828125, 0.8206787109375, 0.88818359375, 0.9556884765625, 1.023193359375, 1.0906982421875, 1.158203125, 1.2257080078125, 1.293212890625, 1.3607177734375, 1.42822265625, 1.4957275390625, 1.563232421875, 1.6307373046875, 1.6982421875, 1.7657470703125, 1.833251953125, 1.9007568359375, 1.96826171875, 2.0357666015625, 2.103271484375, 2.1707763671875, 2.23828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 7.0, 8.0, 11.0, 17.0, 8.0, 14.0, 16.0, 33.0, 36.0, 36.0, 41.0, 90.0, 85.0, 136.0, 126.0, 86.0, 58.0, 45.0, 28.0, 27.0, 20.0, 21.0, 16.0, 7.0, 8.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.177734375, -1.1446304321289062, -1.1115264892578125, -1.0784225463867188, -1.045318603515625, -1.0122146606445312, -0.9791107177734375, -0.9460067749023438, -0.91290283203125, -0.8797988891601562, -0.8466949462890625, -0.8135910034179688, -0.780487060546875, -0.7473831176757812, -0.7142791748046875, -0.6811752319335938, -0.6480712890625, -0.6149673461914062, -0.5818634033203125, -0.5487594604492188, -0.515655517578125, -0.48255157470703125, -0.4494476318359375, -0.41634368896484375, -0.38323974609375, -0.35013580322265625, -0.3170318603515625, -0.28392791748046875, -0.250823974609375, -0.21772003173828125, -0.1846160888671875, -0.15151214599609375, -0.118408203125, -0.08530426025390625, -0.0522003173828125, -0.01909637451171875, 0.014007568359375, 0.04711151123046875, 0.0802154541015625, 0.11331939697265625, 0.14642333984375, 0.17952728271484375, 0.2126312255859375, 0.24573516845703125, 0.278839111328125, 0.31194305419921875, 0.3450469970703125, 0.37815093994140625, 0.4112548828125, 0.44435882568359375, 0.4774627685546875, 0.5105667114257812, 0.543670654296875, 0.5767745971679688, 0.6098785400390625, 0.6429824829101562, 0.67608642578125, 0.7091903686523438, 0.7422943115234375, 0.7753982543945312, 0.808502197265625, 0.8416061401367188, 0.8747100830078125, 0.9078140258789062, 0.94091796875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 7.0, 5.0, 6.0, 4.0, 8.0, 7.0, 15.0, 13.0, 34.0, 48.0, 80.0, 94.0, 122.0, 126.0, 127.0, 116.0, 69.0, 34.0, 28.0, 23.0, 11.0, 7.0, 9.0, 8.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.67986488342285, -24.00391387939453, -23.32796287536621, -22.65201187133789, -21.976062774658203, -21.300111770629883, -20.624160766601562, -19.948209762573242, -19.272258758544922, -18.5963077545166, -17.92035675048828, -17.244407653808594, -16.568456649780273, -15.892505645751953, -15.216554641723633, -14.540603637695312, -13.864654541015625, -13.188703536987305, -12.5127534866333, -11.83680248260498, -11.160852432250977, -10.484901428222656, -9.808950424194336, -9.132999420166016, -8.457049369812012, -7.78109884262085, -7.1051483154296875, -6.429197311401367, -5.753246784210205, -5.077296257019043, -4.401345252990723, -3.7253947257995605, -3.0494461059570312, -2.373495578765869, -1.697544813156128, -1.0215940475463867, -0.3456435203552246, 0.3303070068359375, 1.0062580108642578, 1.68220853805542, 2.358159065246582, 3.034109592437744, 3.7100603580474854, 4.386011123657227, 5.061961650848389, 5.737912178039551, 6.413863182067871, 7.089813709259033, 7.765764236450195, 8.441715240478516, 9.11766529083252, 9.79361629486084, 10.469566345214844, 11.145517349243164, 11.821468353271484, 12.497419357299805, 13.173369407653809, 13.849320411682129, 14.525270462036133, 15.201221466064453, 15.877172470092773, 16.553123474121094, 17.22907257080078, 17.9050235748291, 18.580974578857422]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 2.0, 15.0, 9.0, 5.0, 15.0, 13.0, 15.0, 15.0, 29.0, 25.0, 29.0, 33.0, 39.0, 37.0, 30.0, 37.0, 37.0, 48.0, 36.0, 40.0, 46.0, 50.0, 46.0, 37.0, 33.0, 19.0, 39.0, 32.0, 21.0, 19.0, 28.0, 17.0, 15.0, 12.0, 15.0, 9.0, 5.0, 10.0, 3.0, 11.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-16.421985626220703, -15.898605346679688, -15.375225067138672, -14.851845741271973, -14.328465461730957, -13.805085182189941, -13.281705856323242, -12.758325576782227, -12.234945297241211, -11.711565017700195, -11.18818473815918, -10.66480541229248, -10.141425132751465, -9.61804485321045, -9.09466552734375, -8.571285247802734, -8.047904968261719, -7.524524688720703, -7.001144886016846, -6.477765083312988, -5.954384803771973, -5.431004524230957, -4.9076247215271, -4.384244918823242, -3.8608646392822266, -3.33748459815979, -2.8141045570373535, -2.290724515914917, -1.7673444747924805, -1.243964433670044, -0.7205843925476074, -0.1972043514251709, 0.3261756896972656, 0.8495557308197021, 1.3729357719421387, 1.8963158130645752, 2.4196958541870117, 2.9430758953094482, 3.4664559364318848, 3.9898359775543213, 4.513216018676758, 5.036596298217773, 5.559976100921631, 6.083355903625488, 6.606736183166504, 7.1301164627075195, 7.653496265411377, 8.176876068115234, 8.70025634765625, 9.223636627197266, 9.747016906738281, 10.27039623260498, 10.793776512145996, 11.317156791687012, 11.840536117553711, 12.363916397094727, 12.887296676635742, 13.410676956176758, 13.934057235717773, 14.457436561584473, 14.980816841125488, 15.504197120666504, 16.027576446533203, 16.55095672607422, 17.074337005615234]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 15.0, 5.0, 15.0, 13.0, 21.0, 16.0, 38.0, 61.0, 78.0, 126.0, 197.0, 460.0, 967.0, 2415.0, 7991.0, 37120.0, 322440.0, 2640507.0, 1053708.0, 103448.0, 17278.0, 4467.0, 1563.0, 625.0, 285.0, 140.0, 61.0, 50.0, 36.0, 33.0, 25.0, 11.0, 15.0, 6.0, 5.0, 8.0, 3.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.9375, -12.4874267578125, -12.037353515625, -11.5872802734375, -11.13720703125, -10.6871337890625, -10.237060546875, -9.7869873046875, -9.3369140625, -8.8868408203125, -8.436767578125, -7.9866943359375, -7.53662109375, -7.0865478515625, -6.636474609375, -6.1864013671875, -5.736328125, -5.2862548828125, -4.836181640625, -4.3861083984375, -3.93603515625, -3.4859619140625, -3.035888671875, -2.5858154296875, -2.1357421875, -1.6856689453125, -1.235595703125, -0.7855224609375, -0.33544921875, 0.1146240234375, 0.564697265625, 1.0147705078125, 1.46484375, 1.9149169921875, 2.364990234375, 2.8150634765625, 3.26513671875, 3.7152099609375, 4.165283203125, 4.6153564453125, 5.0654296875, 5.5155029296875, 5.965576171875, 6.4156494140625, 6.86572265625, 7.3157958984375, 7.765869140625, 8.2159423828125, 8.666015625, 9.1160888671875, 9.566162109375, 10.0162353515625, 10.46630859375, 10.9163818359375, 11.366455078125, 11.8165283203125, 12.2666015625, 12.7166748046875, 13.166748046875, 13.6168212890625, 14.06689453125, 14.5169677734375, 14.967041015625, 15.4171142578125, 15.8671875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 5.0, 4.0, 7.0, 8.0, 10.0, 12.0, 17.0, 20.0, 24.0, 17.0, 31.0, 25.0, 35.0, 34.0, 40.0, 34.0, 50.0, 51.0, 44.0, 53.0, 51.0, 57.0, 42.0, 48.0, 37.0, 28.0, 35.0, 25.0, 25.0, 18.0, 24.0, 8.0, 13.0, 19.0, 8.0, 9.0, 11.0, 4.0, 4.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1015625, -7.87066650390625, -7.6397705078125, -7.40887451171875, -7.177978515625, -6.94708251953125, -6.7161865234375, -6.48529052734375, -6.25439453125, -6.02349853515625, -5.7926025390625, -5.56170654296875, -5.330810546875, -5.09991455078125, -4.8690185546875, -4.63812255859375, -4.4072265625, -4.17633056640625, -3.9454345703125, -3.71453857421875, -3.483642578125, -3.25274658203125, -3.0218505859375, -2.79095458984375, -2.56005859375, -2.32916259765625, -2.0982666015625, -1.86737060546875, -1.636474609375, -1.40557861328125, -1.1746826171875, -0.94378662109375, -0.712890625, -0.48199462890625, -0.2510986328125, -0.02020263671875, 0.210693359375, 0.44158935546875, 0.6724853515625, 0.90338134765625, 1.13427734375, 1.36517333984375, 1.5960693359375, 1.82696533203125, 2.057861328125, 2.28875732421875, 2.5196533203125, 2.75054931640625, 2.9814453125, 3.21234130859375, 3.4432373046875, 3.67413330078125, 3.905029296875, 4.13592529296875, 4.3668212890625, 4.59771728515625, 4.82861328125, 5.05950927734375, 5.2904052734375, 5.52130126953125, 5.752197265625, 5.98309326171875, 6.2139892578125, 6.44488525390625, 6.67578125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 11.0, 16.0, 25.0, 59.0, 106.0, 266.0, 1229.0, 40226.0, 4110339.0, 40239.0, 1268.0, 269.0, 100.0, 49.0, 26.0, 14.0, 14.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.625, -51.2216796875, -49.818359375, -48.4150390625, -47.01171875, -45.6083984375, -44.205078125, -42.8017578125, -41.3984375, -39.9951171875, -38.591796875, -37.1884765625, -35.78515625, -34.3818359375, -32.978515625, -31.5751953125, -30.171875, -28.7685546875, -27.365234375, -25.9619140625, -24.55859375, -23.1552734375, -21.751953125, -20.3486328125, -18.9453125, -17.5419921875, -16.138671875, -14.7353515625, -13.33203125, -11.9287109375, -10.525390625, -9.1220703125, -7.71875, -6.3154296875, -4.912109375, -3.5087890625, -2.10546875, -0.7021484375, 0.701171875, 2.1044921875, 3.5078125, 4.9111328125, 6.314453125, 7.7177734375, 9.12109375, 10.5244140625, 11.927734375, 13.3310546875, 14.734375, 16.1376953125, 17.541015625, 18.9443359375, 20.34765625, 21.7509765625, 23.154296875, 24.5576171875, 25.9609375, 27.3642578125, 28.767578125, 30.1708984375, 31.57421875, 32.9775390625, 34.380859375, 35.7841796875, 37.1875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 5.0, 2.0, 4.0, 14.0, 13.0, 19.0, 32.0, 42.0, 55.0, 88.0, 102.0, 163.0, 220.0, 363.0, 530.0, 620.0, 548.0, 385.0, 243.0, 185.0, 117.0, 89.0, 54.0, 41.0, 40.0, 18.0, 23.0, 16.0, 9.0, 4.0, 4.0, 6.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.568359375, -3.4622802734375, -3.356201171875, -3.2501220703125, -3.14404296875, -3.0379638671875, -2.931884765625, -2.8258056640625, -2.7197265625, -2.6136474609375, -2.507568359375, -2.4014892578125, -2.29541015625, -2.1893310546875, -2.083251953125, -1.9771728515625, -1.87109375, -1.7650146484375, -1.658935546875, -1.5528564453125, -1.44677734375, -1.3406982421875, -1.234619140625, -1.1285400390625, -1.0224609375, -0.9163818359375, -0.810302734375, -0.7042236328125, -0.59814453125, -0.4920654296875, -0.385986328125, -0.2799072265625, -0.173828125, -0.0677490234375, 0.038330078125, 0.1444091796875, 0.25048828125, 0.3565673828125, 0.462646484375, 0.5687255859375, 0.6748046875, 0.7808837890625, 0.886962890625, 0.9930419921875, 1.09912109375, 1.2052001953125, 1.311279296875, 1.4173583984375, 1.5234375, 1.6295166015625, 1.735595703125, 1.8416748046875, 1.94775390625, 2.0538330078125, 2.159912109375, 2.2659912109375, 2.3720703125, 2.4781494140625, 2.584228515625, 2.6903076171875, 2.79638671875, 2.9024658203125, 3.008544921875, 3.1146240234375, 3.220703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 6.0, 6.0, 3.0, 6.0, 7.0, 10.0, 13.0, 28.0, 31.0, 46.0, 50.0, 73.0, 73.0, 81.0, 91.0, 84.0, 91.0, 74.0, 57.0, 50.0, 26.0, 28.0, 14.0, 16.0, 11.0, 7.0, 4.0, 4.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.074129104614258, -14.662347793579102, -14.250567436218262, -13.838786125183105, -13.42700481414795, -13.01522445678711, -12.603443145751953, -12.191661834716797, -11.77988052368164, -11.368099212646484, -10.956318855285645, -10.544537544250488, -10.132756233215332, -9.720975875854492, -9.309194564819336, -8.89741325378418, -8.48563289642334, -8.073851585388184, -7.6620707511901855, -7.2502899169921875, -6.838508605957031, -6.426727771759033, -6.014946937561035, -5.603165626525879, -5.191384792327881, -4.779603958129883, -4.367822647094727, -3.9560418128967285, -3.5442607402801514, -3.132479667663574, -2.720698833465576, -2.308917760848999, -1.8971376419067383, -1.4853565692901611, -1.0735756158828735, -0.6617946624755859, -0.2500135898590088, 0.16176748275756836, 0.5735483169555664, 0.9853293895721436, 1.3971104621887207, 1.8088915348052979, 2.220672607421875, 2.632453441619873, 3.04423451423645, 3.4560155868530273, 3.8677964210510254, 4.279577255249023, 4.69135856628418, 5.103139400482178, 5.514920711517334, 5.926701545715332, 6.338482856750488, 6.750263690948486, 7.162044525146484, 7.573825836181641, 7.985606670379639, 8.397387504577637, 8.809168815612793, 9.220949172973633, 9.632730484008789, 10.044511795043945, 10.456293106079102, 10.868073463439941, 11.279854774475098]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 9.0, 9.0, 5.0, 6.0, 14.0, 13.0, 17.0, 17.0, 11.0, 19.0, 20.0, 31.0, 27.0, 31.0, 39.0, 31.0, 30.0, 53.0, 53.0, 61.0, 42.0, 48.0, 42.0, 46.0, 32.0, 44.0, 26.0, 25.0, 33.0, 25.0, 24.0, 22.0, 22.0, 11.0, 12.0, 12.0, 11.0, 7.0, 4.0, 6.0, 5.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.329716682434082, -8.089249610900879, -7.848782062530518, -7.6083149909973145, -7.367847442626953, -7.12738037109375, -6.886913299560547, -6.6464457511901855, -6.405978202819824, -6.165511131286621, -5.92504358291626, -5.684576511383057, -5.444108963012695, -5.203641891479492, -4.963174819946289, -4.722707271575928, -4.482240200042725, -4.2417731285095215, -4.00130558013916, -3.760838508605957, -3.5203709602355957, -3.2799038887023926, -3.0394365787506104, -2.798969268798828, -2.558501958847046, -2.3180346488952637, -2.0775673389434814, -1.8371001482009888, -1.5966328382492065, -1.3561655282974243, -1.1156983375549316, -0.8752310276031494, -0.6347637176513672, -0.39429643750190735, -0.1538291573524475, 0.08663809299468994, 0.32710540294647217, 0.5675727128982544, 0.8080399036407471, 1.0485072135925293, 1.2889745235443115, 1.5294418334960938, 1.769909143447876, 2.010376453399658, 2.2508435249328613, 2.4913110733032227, 2.731778144836426, 2.972245454788208, 3.2127127647399902, 3.4531800746917725, 3.6936473846435547, 3.934114456176758, 4.174582004547119, 4.415049076080322, 4.655516624450684, 4.895983695983887, 5.13645076751709, 5.376917839050293, 5.617385387420654, 5.857852458953857, 6.098320007324219, 6.338787078857422, 6.579254150390625, 6.819721698760986, 7.060189247131348]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 1.0, 4.0, 7.0, 14.0, 14.0, 20.0, 27.0, 46.0, 71.0, 111.0, 159.0, 396.0, 791.0, 1854.0, 4904.0, 14943.0, 53713.0, 242598.0, 538254.0, 140198.0, 34243.0, 10030.0, 3456.0, 1371.0, 609.0, 317.0, 155.0, 86.0, 51.0, 34.0, 19.0, 12.0, 18.0, 7.0, 8.0, 5.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.45703125, -4.32330322265625, -4.1895751953125, -4.05584716796875, -3.922119140625, -3.78839111328125, -3.6546630859375, -3.52093505859375, -3.38720703125, -3.25347900390625, -3.1197509765625, -2.98602294921875, -2.852294921875, -2.71856689453125, -2.5848388671875, -2.45111083984375, -2.3173828125, -2.18365478515625, -2.0499267578125, -1.91619873046875, -1.782470703125, -1.64874267578125, -1.5150146484375, -1.38128662109375, -1.24755859375, -1.11383056640625, -0.9801025390625, -0.84637451171875, -0.712646484375, -0.57891845703125, -0.4451904296875, -0.31146240234375, -0.177734375, -0.04400634765625, 0.0897216796875, 0.22344970703125, 0.357177734375, 0.49090576171875, 0.6246337890625, 0.75836181640625, 0.89208984375, 1.02581787109375, 1.1595458984375, 1.29327392578125, 1.427001953125, 1.56072998046875, 1.6944580078125, 1.82818603515625, 1.9619140625, 2.09564208984375, 2.2293701171875, 2.36309814453125, 2.496826171875, 2.63055419921875, 2.7642822265625, 2.89801025390625, 3.03173828125, 3.16546630859375, 3.2991943359375, 3.43292236328125, 3.566650390625, 3.70037841796875, 3.8341064453125, 3.96783447265625, 4.1015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 11.0, 8.0, 5.0, 13.0, 8.0, 17.0, 20.0, 18.0, 18.0, 39.0, 33.0, 33.0, 35.0, 35.0, 39.0, 44.0, 63.0, 47.0, 63.0, 46.0, 51.0, 42.0, 40.0, 38.0, 29.0, 24.0, 27.0, 29.0, 22.0, 19.0, 19.0, 15.0, 7.0, 7.0, 11.0, 1.0, 5.0, 1.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-5.02734375, -4.87530517578125, -4.7232666015625, -4.57122802734375, -4.419189453125, -4.26715087890625, -4.1151123046875, -3.96307373046875, -3.81103515625, -3.65899658203125, -3.5069580078125, -3.35491943359375, -3.202880859375, -3.05084228515625, -2.8988037109375, -2.74676513671875, -2.5947265625, -2.44268798828125, -2.2906494140625, -2.13861083984375, -1.986572265625, -1.83453369140625, -1.6824951171875, -1.53045654296875, -1.37841796875, -1.22637939453125, -1.0743408203125, -0.92230224609375, -0.770263671875, -0.61822509765625, -0.4661865234375, -0.31414794921875, -0.162109375, -0.01007080078125, 0.1419677734375, 0.29400634765625, 0.446044921875, 0.59808349609375, 0.7501220703125, 0.90216064453125, 1.05419921875, 1.20623779296875, 1.3582763671875, 1.51031494140625, 1.662353515625, 1.81439208984375, 1.9664306640625, 2.11846923828125, 2.2705078125, 2.42254638671875, 2.5745849609375, 2.72662353515625, 2.878662109375, 3.03070068359375, 3.1827392578125, 3.33477783203125, 3.48681640625, 3.63885498046875, 3.7908935546875, 3.94293212890625, 4.094970703125, 4.24700927734375, 4.3990478515625, 4.55108642578125, 4.703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 9.0, 7.0, 12.0, 23.0, 15.0, 35.0, 40.0, 58.0, 58.0, 85.0, 132.0, 185.0, 273.0, 485.0, 810.0, 1564.0, 3384.0, 8182.0, 23210.0, 73193.0, 274043.0, 455605.0, 141968.0, 41023.0, 13630.0, 5328.0, 2320.0, 1119.0, 584.0, 346.0, 251.0, 175.0, 114.0, 73.0, 59.0, 45.0, 36.0, 23.0, 15.0, 12.0, 8.0, 3.0, 2.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.9375, -2.846435546875, -2.75537109375, -2.664306640625, -2.5732421875, -2.482177734375, -2.39111328125, -2.300048828125, -2.208984375, -2.117919921875, -2.02685546875, -1.935791015625, -1.8447265625, -1.753662109375, -1.66259765625, -1.571533203125, -1.48046875, -1.389404296875, -1.29833984375, -1.207275390625, -1.1162109375, -1.025146484375, -0.93408203125, -0.843017578125, -0.751953125, -0.660888671875, -0.56982421875, -0.478759765625, -0.3876953125, -0.296630859375, -0.20556640625, -0.114501953125, -0.0234375, 0.067626953125, 0.15869140625, 0.249755859375, 0.3408203125, 0.431884765625, 0.52294921875, 0.614013671875, 0.705078125, 0.796142578125, 0.88720703125, 0.978271484375, 1.0693359375, 1.160400390625, 1.25146484375, 1.342529296875, 1.43359375, 1.524658203125, 1.61572265625, 1.706787109375, 1.7978515625, 1.888916015625, 1.97998046875, 2.071044921875, 2.162109375, 2.253173828125, 2.34423828125, 2.435302734375, 2.5263671875, 2.617431640625, 2.70849609375, 2.799560546875, 2.890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 8.0, 8.0, 18.0, 10.0, 21.0, 26.0, 27.0, 34.0, 33.0, 41.0, 44.0, 49.0, 32.0, 48.0, 44.0, 56.0, 38.0, 40.0, 59.0, 45.0, 44.0, 48.0, 41.0, 33.0, 29.0, 19.0, 25.0, 18.0, 12.0, 20.0, 10.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.3564453125, -10.048828125, -9.7412109375, -9.43359375, -9.1259765625, -8.818359375, -8.5107421875, -8.203125, -7.8955078125, -7.587890625, -7.2802734375, -6.97265625, -6.6650390625, -6.357421875, -6.0498046875, -5.7421875, -5.4345703125, -5.126953125, -4.8193359375, -4.51171875, -4.2041015625, -3.896484375, -3.5888671875, -3.28125, -2.9736328125, -2.666015625, -2.3583984375, -2.05078125, -1.7431640625, -1.435546875, -1.1279296875, -0.8203125, -0.5126953125, -0.205078125, 0.1025390625, 0.41015625, 0.7177734375, 1.025390625, 1.3330078125, 1.640625, 1.9482421875, 2.255859375, 2.5634765625, 2.87109375, 3.1787109375, 3.486328125, 3.7939453125, 4.1015625, 4.4091796875, 4.716796875, 5.0244140625, 5.33203125, 5.6396484375, 5.947265625, 6.2548828125, 6.5625, 6.8701171875, 7.177734375, 7.4853515625, 7.79296875, 8.1005859375, 8.408203125, 8.7158203125, 9.0234375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 8.0, 10.0, 3.0, 9.0, 20.0, 12.0, 18.0, 30.0, 40.0, 61.0, 103.0, 143.0, 237.0, 339.0, 534.0, 1010.0, 1610.0, 3150.0, 7455.0, 24783.0, 146710.0, 625168.0, 189925.0, 30670.0, 8603.0, 3421.0, 1780.0, 965.0, 607.0, 384.0, 246.0, 169.0, 101.0, 63.0, 56.0, 40.0, 23.0, 24.0, 8.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0], "bins": [-1.96875, -1.91339111328125, -1.8580322265625, -1.80267333984375, -1.747314453125, -1.69195556640625, -1.6365966796875, -1.58123779296875, -1.52587890625, -1.47052001953125, -1.4151611328125, -1.35980224609375, -1.304443359375, -1.24908447265625, -1.1937255859375, -1.13836669921875, -1.0830078125, -1.02764892578125, -0.9722900390625, -0.91693115234375, -0.861572265625, -0.80621337890625, -0.7508544921875, -0.69549560546875, -0.64013671875, -0.58477783203125, -0.5294189453125, -0.47406005859375, -0.418701171875, -0.36334228515625, -0.3079833984375, -0.25262451171875, -0.197265625, -0.14190673828125, -0.0865478515625, -0.03118896484375, 0.024169921875, 0.07952880859375, 0.1348876953125, 0.19024658203125, 0.24560546875, 0.30096435546875, 0.3563232421875, 0.41168212890625, 0.467041015625, 0.52239990234375, 0.5777587890625, 0.63311767578125, 0.6884765625, 0.74383544921875, 0.7991943359375, 0.85455322265625, 0.909912109375, 0.96527099609375, 1.0206298828125, 1.07598876953125, 1.13134765625, 1.18670654296875, 1.2420654296875, 1.29742431640625, 1.352783203125, 1.40814208984375, 1.4635009765625, 1.51885986328125, 1.57421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 9.0, 8.0, 26.0, 58.0, 152.0, 283.0, 252.0, 114.0, 54.0, 20.0, 8.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00223541259765625, -0.0021763741970062256, -0.002117335796356201, -0.0020582973957061768, -0.0019992589950561523, -0.001940220594406128, -0.0018811821937561035, -0.001822143793106079, -0.0017631053924560547, -0.0017040669918060303, -0.0016450285911560059, -0.0015859901905059814, -0.001526951789855957, -0.0014679133892059326, -0.0014088749885559082, -0.0013498365879058838, -0.0012907981872558594, -0.001231759786605835, -0.0011727213859558105, -0.0011136829853057861, -0.0010546445846557617, -0.0009956061840057373, -0.0009365677833557129, -0.0008775293827056885, -0.0008184909820556641, -0.0007594525814056396, -0.0007004141807556152, -0.0006413757801055908, -0.0005823373794555664, -0.000523298978805542, -0.0004642605781555176, -0.00040522217750549316, -0.00034618377685546875, -0.00028714537620544434, -0.00022810697555541992, -0.0001690685749053955, -0.0001100301742553711, -5.099177360534668e-05, 8.046627044677734e-06, 6.708502769470215e-05, 0.00012612342834472656, 0.00018516182899475098, 0.0002442002296447754, 0.0003032386302947998, 0.0003622770309448242, 0.00042131543159484863, 0.00048035383224487305, 0.0005393922328948975, 0.0005984306335449219, 0.0006574690341949463, 0.0007165074348449707, 0.0007755458354949951, 0.0008345842361450195, 0.0008936226367950439, 0.0009526610374450684, 0.0010116994380950928, 0.0010707378387451172, 0.0011297762393951416, 0.001188814640045166, 0.0012478530406951904, 0.0013068914413452148, 0.0013659298419952393, 0.0014249682426452637, 0.001484006643295288, 0.0015430450439453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 8.0, 8.0, 16.0, 12.0, 19.0, 33.0, 39.0, 66.0, 100.0, 153.0, 289.0, 434.0, 760.0, 1548.0, 3275.0, 8835.0, 34571.0, 206352.0, 597110.0, 154334.0, 27045.0, 7423.0, 2932.0, 1371.0, 729.0, 381.0, 267.0, 143.0, 113.0, 53.0, 40.0, 35.0, 24.0, 11.0, 10.0, 4.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.771484375, -1.7132568359375, -1.655029296875, -1.5968017578125, -1.53857421875, -1.4803466796875, -1.422119140625, -1.3638916015625, -1.3056640625, -1.2474365234375, -1.189208984375, -1.1309814453125, -1.07275390625, -1.0145263671875, -0.956298828125, -0.8980712890625, -0.83984375, -0.7816162109375, -0.723388671875, -0.6651611328125, -0.60693359375, -0.5487060546875, -0.490478515625, -0.4322509765625, -0.3740234375, -0.3157958984375, -0.257568359375, -0.1993408203125, -0.14111328125, -0.0828857421875, -0.024658203125, 0.0335693359375, 0.091796875, 0.1500244140625, 0.208251953125, 0.2664794921875, 0.32470703125, 0.3829345703125, 0.441162109375, 0.4993896484375, 0.5576171875, 0.6158447265625, 0.674072265625, 0.7322998046875, 0.79052734375, 0.8487548828125, 0.906982421875, 0.9652099609375, 1.0234375, 1.0816650390625, 1.139892578125, 1.1981201171875, 1.25634765625, 1.3145751953125, 1.372802734375, 1.4310302734375, 1.4892578125, 1.5474853515625, 1.605712890625, 1.6639404296875, 1.72216796875, 1.7803955078125, 1.838623046875, 1.8968505859375, 1.955078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 7.0, 6.0, 7.0, 8.0, 10.0, 10.0, 18.0, 31.0, 46.0, 65.0, 85.0, 103.0, 94.0, 120.0, 98.0, 76.0, 51.0, 59.0, 34.0, 24.0, 16.0, 15.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.55517578125, -0.5402107238769531, -0.5252456665039062, -0.5102806091308594, -0.4953155517578125, -0.4803504943847656, -0.46538543701171875, -0.4504203796386719, -0.435455322265625, -0.4204902648925781, -0.40552520751953125, -0.3905601501464844, -0.3755950927734375, -0.3606300354003906, -0.34566497802734375, -0.3306999206542969, -0.31573486328125, -0.3007698059082031, -0.28580474853515625, -0.2708396911621094, -0.2558746337890625, -0.24090957641601562, -0.22594451904296875, -0.21097946166992188, -0.196014404296875, -0.18104934692382812, -0.16608428955078125, -0.15111923217773438, -0.1361541748046875, -0.12118911743164062, -0.10622406005859375, -0.09125900268554688, -0.0762939453125, -0.061328887939453125, -0.04636383056640625, -0.031398773193359375, -0.0164337158203125, -0.001468658447265625, 0.01349639892578125, 0.028461456298828125, 0.043426513671875, 0.058391571044921875, 0.07335662841796875, 0.08832168579101562, 0.1032867431640625, 0.11825180053710938, 0.13321685791015625, 0.14818191528320312, 0.16314697265625, 0.17811203002929688, 0.19307708740234375, 0.20804214477539062, 0.2230072021484375, 0.23797225952148438, 0.25293731689453125, 0.2679023742675781, 0.282867431640625, 0.2978324890136719, 0.31279754638671875, 0.3277626037597656, 0.3427276611328125, 0.3576927185058594, 0.37265777587890625, 0.3876228332519531, 0.402587890625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 3.0, 7.0, 12.0, 21.0, 36.0, 56.0, 89.0, 106.0, 112.0, 120.0, 128.0, 93.0, 64.0, 45.0, 30.0, 17.0, 14.0, 16.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.848424911499023, -11.530074119567871, -11.211723327636719, -10.893373489379883, -10.57502269744873, -10.256671905517578, -9.938321113586426, -9.619970321655273, -9.301619529724121, -8.983268737792969, -8.664917945861816, -8.346567153930664, -8.028217315673828, -7.709866523742676, -7.391515731811523, -7.073164939880371, -6.754814624786377, -6.436463832855225, -6.1181135177612305, -5.799762725830078, -5.481411933898926, -5.163061141967773, -4.844710826873779, -4.526360034942627, -4.208009719848633, -3.8896591663360596, -3.5713083744049072, -3.252957820892334, -2.9346070289611816, -2.6162564754486084, -2.297905921936035, -1.9795551300048828, -1.6612043380737305, -1.3428536653518677, -1.0245029926300049, -0.7061524391174316, -0.38780176639556885, -0.06945109367370605, 0.2488994598388672, 0.5672502517700195, 0.8856008052825928, 1.2039514780044556, 1.5223021507263184, 1.8406527042388916, 2.159003257751465, 2.477354049682617, 2.7957046031951904, 3.1140553951263428, 3.432405948638916, 3.7507565021514893, 4.0691070556640625, 4.387457847595215, 4.705808639526367, 5.0241594314575195, 5.342509746551514, 5.660860538482666, 5.97921085357666, 6.2975616455078125, 6.615911960601807, 6.934262752532959, 7.252613544464111, 7.5709638595581055, 7.889314651489258, 8.20766544342041, 8.526016235351562]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 7.0, 5.0, 10.0, 9.0, 11.0, 11.0, 14.0, 11.0, 15.0, 28.0, 24.0, 33.0, 33.0, 34.0, 40.0, 43.0, 53.0, 58.0, 62.0, 65.0, 55.0, 49.0, 46.0, 38.0, 26.0, 37.0, 34.0, 26.0, 29.0, 22.0, 13.0, 12.0, 16.0, 13.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.244753360748291, -5.084238052368164, -4.923722743988037, -4.76320743560791, -4.602692127227783, -4.442176818847656, -4.281661510467529, -4.121146202087402, -3.9606311321258545, -3.8001158237457275, -3.6396005153656006, -3.4790852069854736, -3.318570137023926, -3.158054828643799, -2.997539520263672, -2.837024211883545, -2.676508903503418, -2.515993595123291, -2.355478286743164, -2.194962978363037, -2.03444766998291, -1.8739324808120728, -1.7134172916412354, -1.5529019832611084, -1.3923866748809814, -1.2318713665008545, -1.0713560581207275, -0.9108408689498901, -0.7503255605697632, -0.5898102521896362, -0.42929500341415405, -0.2687797546386719, -0.10826444625854492, 0.052250832319259644, 0.2127661108970642, 0.3732813894748688, 0.5337966680526733, 0.6943119764328003, 0.8548272252082825, 1.0153424739837646, 1.1758577823638916, 1.3363730907440186, 1.4968883991241455, 1.657403588294983, 1.8179188966751099, 1.9784342050552368, 2.138949394226074, 2.299464702606201, 2.459980010986328, 2.620495319366455, 2.781010627746582, 2.941525936126709, 3.102041244506836, 3.262556552886963, 3.4230716228485107, 3.5835869312286377, 3.7441022396087646, 3.9046175479888916, 4.0651326179504395, 4.225647926330566, 4.386163234710693, 4.54667854309082, 4.707193851470947, 4.867709159851074, 5.028224468231201]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 11.0, 16.0, 23.0, 21.0, 37.0, 63.0, 89.0, 118.0, 182.0, 299.0, 462.0, 811.0, 1340.0, 2302.0, 4240.0, 8412.0, 18331.0, 43241.0, 124776.0, 370566.0, 308109.0, 97974.0, 35769.0, 15079.0, 7331.0, 3770.0, 2102.0, 1167.0, 686.0, 439.0, 266.0, 172.0, 119.0, 64.0, 51.0, 23.0, 28.0, 25.0, 13.0, 6.0, 5.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.06640625, -4.91693115234375, -4.7674560546875, -4.61798095703125, -4.468505859375, -4.31903076171875, -4.1695556640625, -4.02008056640625, -3.87060546875, -3.72113037109375, -3.5716552734375, -3.42218017578125, -3.272705078125, -3.12322998046875, -2.9737548828125, -2.82427978515625, -2.6748046875, -2.52532958984375, -2.3758544921875, -2.22637939453125, -2.076904296875, -1.92742919921875, -1.7779541015625, -1.62847900390625, -1.47900390625, -1.32952880859375, -1.1800537109375, -1.03057861328125, -0.881103515625, -0.73162841796875, -0.5821533203125, -0.43267822265625, -0.283203125, -0.13372802734375, 0.0157470703125, 0.16522216796875, 0.314697265625, 0.46417236328125, 0.6136474609375, 0.76312255859375, 0.91259765625, 1.06207275390625, 1.2115478515625, 1.36102294921875, 1.510498046875, 1.65997314453125, 1.8094482421875, 1.95892333984375, 2.1083984375, 2.25787353515625, 2.4073486328125, 2.55682373046875, 2.706298828125, 2.85577392578125, 3.0052490234375, 3.15472412109375, 3.30419921875, 3.45367431640625, 3.6031494140625, 3.75262451171875, 3.902099609375, 4.05157470703125, 4.2010498046875, 4.35052490234375, 4.5]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 4.0, 4.0, 6.0, 3.0, 7.0, 7.0, 15.0, 18.0, 16.0, 21.0, 27.0, 22.0, 20.0, 27.0, 40.0, 40.0, 53.0, 49.0, 51.0, 60.0, 54.0, 51.0, 45.0, 48.0, 39.0, 43.0, 39.0, 35.0, 31.0, 26.0, 23.0, 15.0, 15.0, 12.0, 10.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9921875, -10.636474609375, -10.28076171875, -9.925048828125, -9.5693359375, -9.213623046875, -8.85791015625, -8.502197265625, -8.146484375, -7.790771484375, -7.43505859375, -7.079345703125, -6.7236328125, -6.367919921875, -6.01220703125, -5.656494140625, -5.30078125, -4.945068359375, -4.58935546875, -4.233642578125, -3.8779296875, -3.522216796875, -3.16650390625, -2.810791015625, -2.455078125, -2.099365234375, -1.74365234375, -1.387939453125, -1.0322265625, -0.676513671875, -0.32080078125, 0.034912109375, 0.390625, 0.746337890625, 1.10205078125, 1.457763671875, 1.8134765625, 2.169189453125, 2.52490234375, 2.880615234375, 3.236328125, 3.592041015625, 3.94775390625, 4.303466796875, 4.6591796875, 5.014892578125, 5.37060546875, 5.726318359375, 6.08203125, 6.437744140625, 6.79345703125, 7.149169921875, 7.5048828125, 7.860595703125, 8.21630859375, 8.572021484375, 8.927734375, 9.283447265625, 9.63916015625, 9.994873046875, 10.3505859375, 10.706298828125, 11.06201171875, 11.417724609375, 11.7734375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 8.0, 4.0, 7.0, 9.0, 14.0, 9.0, 11.0, 11.0, 15.0, 21.0, 26.0, 24.0, 22.0, 21.0, 33.0, 37.0, 30.0, 40.0, 53.0, 74.0, 314.0, 6961.0, 953521.0, 85726.0, 990.0, 146.0, 61.0, 42.0, 35.0, 27.0, 42.0, 34.0, 25.0, 18.0, 17.0, 18.0, 21.0, 16.0, 15.0, 15.0, 6.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-27.734375, -26.88720703125, -26.0400390625, -25.19287109375, -24.345703125, -23.49853515625, -22.6513671875, -21.80419921875, -20.95703125, -20.10986328125, -19.2626953125, -18.41552734375, -17.568359375, -16.72119140625, -15.8740234375, -15.02685546875, -14.1796875, -13.33251953125, -12.4853515625, -11.63818359375, -10.791015625, -9.94384765625, -9.0966796875, -8.24951171875, -7.40234375, -6.55517578125, -5.7080078125, -4.86083984375, -4.013671875, -3.16650390625, -2.3193359375, -1.47216796875, -0.625, 0.22216796875, 1.0693359375, 1.91650390625, 2.763671875, 3.61083984375, 4.4580078125, 5.30517578125, 6.15234375, 6.99951171875, 7.8466796875, 8.69384765625, 9.541015625, 10.38818359375, 11.2353515625, 12.08251953125, 12.9296875, 13.77685546875, 14.6240234375, 15.47119140625, 16.318359375, 17.16552734375, 18.0126953125, 18.85986328125, 19.70703125, 20.55419921875, 21.4013671875, 22.24853515625, 23.095703125, 23.94287109375, 24.7900390625, 25.63720703125, 26.484375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 10.0, 7.0, 11.0, 14.0, 9.0, 8.0, 17.0, 18.0, 21.0, 34.0, 28.0, 22.0, 23.0, 29.0, 37.0, 29.0, 40.0, 40.0, 33.0, 35.0, 40.0, 30.0, 37.0, 37.0, 35.0, 31.0, 35.0, 42.0, 33.0, 23.0, 20.0, 25.0, 26.0, 21.0, 16.0, 13.0, 10.0, 13.0, 7.0, 9.0, 6.0, 5.0, 3.0, 2.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.0078125, -8.7230224609375, -8.438232421875, -8.1534423828125, -7.86865234375, -7.5838623046875, -7.299072265625, -7.0142822265625, -6.7294921875, -6.4447021484375, -6.159912109375, -5.8751220703125, -5.59033203125, -5.3055419921875, -5.020751953125, -4.7359619140625, -4.451171875, -4.1663818359375, -3.881591796875, -3.5968017578125, -3.31201171875, -3.0272216796875, -2.742431640625, -2.4576416015625, -2.1728515625, -1.8880615234375, -1.603271484375, -1.3184814453125, -1.03369140625, -0.7489013671875, -0.464111328125, -0.1793212890625, 0.10546875, 0.3902587890625, 0.675048828125, 0.9598388671875, 1.24462890625, 1.5294189453125, 1.814208984375, 2.0989990234375, 2.3837890625, 2.6685791015625, 2.953369140625, 3.2381591796875, 3.52294921875, 3.8077392578125, 4.092529296875, 4.3773193359375, 4.662109375, 4.9468994140625, 5.231689453125, 5.5164794921875, 5.80126953125, 6.0860595703125, 6.370849609375, 6.6556396484375, 6.9404296875, 7.2252197265625, 7.510009765625, 7.7947998046875, 8.07958984375, 8.3643798828125, 8.649169921875, 8.9339599609375, 9.21875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 8.0, 4.0, 9.0, 14.0, 25.0, 31.0, 34.0, 90.0, 164.0, 302.0, 889.0, 2899.0, 12564.0, 110320.0, 791619.0, 112135.0, 12959.0, 2897.0, 888.0, 330.0, 141.0, 82.0, 45.0, 30.0, 22.0, 12.0, 7.0, 4.0, 8.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.25390625, -3.14361572265625, -3.0333251953125, -2.92303466796875, -2.812744140625, -2.70245361328125, -2.5921630859375, -2.48187255859375, -2.37158203125, -2.26129150390625, -2.1510009765625, -2.04071044921875, -1.930419921875, -1.82012939453125, -1.7098388671875, -1.59954833984375, -1.4892578125, -1.37896728515625, -1.2686767578125, -1.15838623046875, -1.048095703125, -0.93780517578125, -0.8275146484375, -0.71722412109375, -0.60693359375, -0.49664306640625, -0.3863525390625, -0.27606201171875, -0.165771484375, -0.05548095703125, 0.0548095703125, 0.16510009765625, 0.275390625, 0.38568115234375, 0.4959716796875, 0.60626220703125, 0.716552734375, 0.82684326171875, 0.9371337890625, 1.04742431640625, 1.15771484375, 1.26800537109375, 1.3782958984375, 1.48858642578125, 1.598876953125, 1.70916748046875, 1.8194580078125, 1.92974853515625, 2.0400390625, 2.15032958984375, 2.2606201171875, 2.37091064453125, 2.481201171875, 2.59149169921875, 2.7017822265625, 2.81207275390625, 2.92236328125, 3.03265380859375, 3.1429443359375, 3.25323486328125, 3.363525390625, 3.47381591796875, 3.5841064453125, 3.69439697265625, 3.8046875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 8.0, 6.0, 6.0, 18.0, 15.0, 21.0, 21.0, 32.0, 63.0, 81.0, 105.0, 100.0, 131.0, 91.0, 81.0, 43.0, 44.0, 39.0, 20.0, 23.0, 9.0, 10.0, 7.0, 7.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002199411392211914, -0.000209001824259758, -0.00019806250929832458, -0.00018712319433689117, -0.00017618387937545776, -0.00016524456441402435, -0.00015430524945259094, -0.00014336593449115753, -0.00013242661952972412, -0.00012148730456829071, -0.0001105479896068573, -9.960867464542389e-05, -8.866935968399048e-05, -7.773004472255707e-05, -6.679072976112366e-05, -5.5851414799690247e-05, -4.4912099838256836e-05, -3.3972784876823425e-05, -2.3033469915390015e-05, -1.2094154953956604e-05, -1.1548399925231934e-06, 9.784474968910217e-06, 2.0723789930343628e-05, 3.166310489177704e-05, 4.260241985321045e-05, 5.354173481464386e-05, 6.448104977607727e-05, 7.542036473751068e-05, 8.635967969894409e-05, 9.72989946603775e-05, 0.00010823830962181091, 0.00011917762458324432, 0.00013011693954467773, 0.00014105625450611115, 0.00015199556946754456, 0.00016293488442897797, 0.00017387419939041138, 0.0001848135143518448, 0.0001957528293132782, 0.0002066921442747116, 0.00021763145923614502, 0.00022857077419757843, 0.00023951008915901184, 0.00025044940412044525, 0.00026138871908187866, 0.00027232803404331207, 0.0002832673490047455, 0.0002942066639661789, 0.0003051459789276123, 0.0003160852938890457, 0.0003270246088504791, 0.00033796392381191254, 0.00034890323877334595, 0.00035984255373477936, 0.00037078186869621277, 0.0003817211836576462, 0.0003926604986190796, 0.000403599813580513, 0.0004145391285419464, 0.0004254784435033798, 0.00043641775846481323, 0.00044735707342624664, 0.00045829638838768005, 0.00046923570334911346, 0.0004801750183105469]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 13.0, 27.0, 50.0, 88.0, 167.0, 368.0, 919.0, 2480.0, 8211.0, 35393.0, 301253.0, 609537.0, 70820.0, 13336.0, 3686.0, 1285.0, 447.0, 208.0, 111.0, 59.0, 37.0, 19.0, 9.0, 4.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.873046875, -2.783782958984375, -2.69451904296875, -2.605255126953125, -2.5159912109375, -2.426727294921875, -2.33746337890625, -2.248199462890625, -2.158935546875, -2.069671630859375, -1.98040771484375, -1.891143798828125, -1.8018798828125, -1.712615966796875, -1.62335205078125, -1.534088134765625, -1.44482421875, -1.355560302734375, -1.26629638671875, -1.177032470703125, -1.0877685546875, -0.998504638671875, -0.90924072265625, -0.819976806640625, -0.730712890625, -0.641448974609375, -0.55218505859375, -0.462921142578125, -0.3736572265625, -0.284393310546875, -0.19512939453125, -0.105865478515625, -0.0166015625, 0.072662353515625, 0.16192626953125, 0.251190185546875, 0.3404541015625, 0.429718017578125, 0.51898193359375, 0.608245849609375, 0.697509765625, 0.786773681640625, 0.87603759765625, 0.965301513671875, 1.0545654296875, 1.143829345703125, 1.23309326171875, 1.322357177734375, 1.41162109375, 1.500885009765625, 1.59014892578125, 1.679412841796875, 1.7686767578125, 1.857940673828125, 1.94720458984375, 2.036468505859375, 2.125732421875, 2.214996337890625, 2.30426025390625, 2.393524169921875, 2.4827880859375, 2.572052001953125, 2.66131591796875, 2.750579833984375, 2.83984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 7.0, 6.0, 5.0, 12.0, 14.0, 11.0, 12.0, 19.0, 28.0, 35.0, 54.0, 68.0, 85.0, 83.0, 96.0, 84.0, 84.0, 71.0, 52.0, 36.0, 32.0, 24.0, 16.0, 17.0, 12.0, 6.0, 3.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.99169921875, -0.9621124267578125, -0.932525634765625, -0.9029388427734375, -0.87335205078125, -0.8437652587890625, -0.814178466796875, -0.7845916748046875, -0.7550048828125, -0.7254180908203125, -0.695831298828125, -0.6662445068359375, -0.63665771484375, -0.6070709228515625, -0.577484130859375, -0.5478973388671875, -0.518310546875, -0.4887237548828125, -0.459136962890625, -0.4295501708984375, -0.39996337890625, -0.3703765869140625, -0.340789794921875, -0.3112030029296875, -0.2816162109375, -0.2520294189453125, -0.222442626953125, -0.1928558349609375, -0.16326904296875, -0.1336822509765625, -0.104095458984375, -0.0745086669921875, -0.044921875, -0.0153350830078125, 0.014251708984375, 0.0438385009765625, 0.07342529296875, 0.1030120849609375, 0.132598876953125, 0.1621856689453125, 0.1917724609375, 0.2213592529296875, 0.250946044921875, 0.2805328369140625, 0.31011962890625, 0.3397064208984375, 0.369293212890625, 0.3988800048828125, 0.428466796875, 0.4580535888671875, 0.487640380859375, 0.5172271728515625, 0.54681396484375, 0.5764007568359375, 0.605987548828125, 0.6355743408203125, 0.6651611328125, 0.6947479248046875, 0.724334716796875, 0.7539215087890625, 0.78350830078125, 0.8130950927734375, 0.842681884765625, 0.8722686767578125, 0.90185546875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 15.0, 8.0, 44.0, 108.0, 183.0, 249.0, 206.0, 110.0, 42.0, 19.0, 9.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.586244583129883, -20.27833366394043, -18.970420837402344, -17.66250991821289, -16.354598999023438, -15.046687126159668, -13.738775253295898, -12.430864334106445, -11.122952461242676, -9.815040588378906, -8.507129669189453, -7.199217796325684, -5.891306400299072, -4.583395004272461, -3.2754831314086914, -1.9675722122192383, -0.6596603393554688, 0.6482511758804321, 1.956162691116333, 3.2640743255615234, 4.571985721588135, 5.879897117614746, 7.187808990478516, 8.495719909667969, 9.803631782531738, 11.111543655395508, 12.419454574584961, 13.72736644744873, 15.0352783203125, 16.343189239501953, 17.651100158691406, 18.95901107788086, 20.266925811767578, 21.57483673095703, 22.882749557495117, 24.19066047668457, 25.498571395874023, 26.80648422241211, 28.114395141601562, 29.422306060791016, 30.73021697998047, 32.03812789916992, 33.346038818359375, 34.653953552246094, 35.96186447143555, 37.269775390625, 38.57768630981445, 39.885597229003906, 41.193511962890625, 42.50142288208008, 43.80933380126953, 45.11724853515625, 46.4251594543457, 47.733070373535156, 49.04098129272461, 50.34889221191406, 51.656803131103516, 52.96471405029297, 54.27262496948242, 55.580535888671875, 56.888450622558594, 58.19636154174805, 59.5042724609375, 60.81218338012695, 62.120094299316406]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 12.0, 7.0, 7.0, 11.0, 10.0, 8.0, 21.0, 17.0, 18.0, 39.0, 26.0, 31.0, 39.0, 30.0, 29.0, 35.0, 48.0, 50.0, 41.0, 40.0, 36.0, 52.0, 50.0, 30.0, 40.0, 25.0, 38.0, 26.0, 22.0, 30.0, 23.0, 16.0, 16.0, 14.0, 11.0, 9.0, 7.0, 6.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.845316886901855, -15.3207426071167, -14.796168327331543, -14.271594047546387, -13.747020721435547, -13.22244644165039, -12.697872161865234, -12.173297882080078, -11.648723602294922, -11.124149322509766, -10.59957504272461, -10.075000762939453, -9.550426483154297, -9.02585220336914, -8.5012788772583, -7.9767045974731445, -7.452130317687988, -6.927556037902832, -6.402981758117676, -5.878407955169678, -5.3538336753845215, -4.829259395599365, -4.304685592651367, -3.780111312866211, -3.2555370330810547, -2.7309627532958984, -2.2063887119293213, -1.6818145513534546, -1.157240390777588, -0.6326661109924316, -0.10809206962585449, 0.41648197174072266, 0.9410552978515625, 1.4656294584274292, 1.990203619003296, 2.514777660369873, 3.0393519401550293, 3.5639262199401855, 4.088500022888184, 4.61307430267334, 5.137648582458496, 5.662222862243652, 6.186797142028809, 6.711370944976807, 7.235945224761963, 7.760519504547119, 8.285093307495117, 8.809667587280273, 9.33424186706543, 9.858816146850586, 10.383390426635742, 10.907964706420898, 11.432538986206055, 11.957113265991211, 12.48168659210205, 13.006260871887207, 13.530835151672363, 14.05540943145752, 14.579983711242676, 15.104557991027832, 15.629131317138672, 16.153705596923828, 16.678279876708984, 17.20285415649414, 17.727428436279297]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 7.0, 14.0, 13.0, 21.0, 26.0, 43.0, 65.0, 104.0, 166.0, 287.0, 505.0, 1014.0, 1949.0, 4971.0, 17147.0, 97244.0, 1080939.0, 2637377.0, 297597.0, 39780.0, 9244.0, 3088.0, 1309.0, 608.0, 325.0, 165.0, 109.0, 49.0, 43.0, 24.0, 13.0, 11.0, 4.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.046875, -14.642822265625, -14.23876953125, -13.834716796875, -13.4306640625, -13.026611328125, -12.62255859375, -12.218505859375, -11.814453125, -11.410400390625, -11.00634765625, -10.602294921875, -10.1982421875, -9.794189453125, -9.39013671875, -8.986083984375, -8.58203125, -8.177978515625, -7.77392578125, -7.369873046875, -6.9658203125, -6.561767578125, -6.15771484375, -5.753662109375, -5.349609375, -4.945556640625, -4.54150390625, -4.137451171875, -3.7333984375, -3.329345703125, -2.92529296875, -2.521240234375, -2.1171875, -1.713134765625, -1.30908203125, -0.905029296875, -0.5009765625, -0.096923828125, 0.30712890625, 0.711181640625, 1.115234375, 1.519287109375, 1.92333984375, 2.327392578125, 2.7314453125, 3.135498046875, 3.53955078125, 3.943603515625, 4.34765625, 4.751708984375, 5.15576171875, 5.559814453125, 5.9638671875, 6.367919921875, 6.77197265625, 7.176025390625, 7.580078125, 7.984130859375, 8.38818359375, 8.792236328125, 9.1962890625, 9.600341796875, 10.00439453125, 10.408447265625, 10.8125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 6.0, 7.0, 4.0, 8.0, 7.0, 14.0, 11.0, 9.0, 17.0, 16.0, 19.0, 30.0, 25.0, 34.0, 34.0, 48.0, 64.0, 44.0, 53.0, 52.0, 57.0, 62.0, 43.0, 51.0, 42.0, 47.0, 30.0, 30.0, 27.0, 16.0, 17.0, 15.0, 13.0, 12.0, 8.0, 7.0, 6.0, 8.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1875, -6.9613037109375, -6.735107421875, -6.5089111328125, -6.28271484375, -6.0565185546875, -5.830322265625, -5.6041259765625, -5.3779296875, -5.1517333984375, -4.925537109375, -4.6993408203125, -4.47314453125, -4.2469482421875, -4.020751953125, -3.7945556640625, -3.568359375, -3.3421630859375, -3.115966796875, -2.8897705078125, -2.66357421875, -2.4373779296875, -2.211181640625, -1.9849853515625, -1.7587890625, -1.5325927734375, -1.306396484375, -1.0802001953125, -0.85400390625, -0.6278076171875, -0.401611328125, -0.1754150390625, 0.05078125, 0.2769775390625, 0.503173828125, 0.7293701171875, 0.95556640625, 1.1817626953125, 1.407958984375, 1.6341552734375, 1.8603515625, 2.0865478515625, 2.312744140625, 2.5389404296875, 2.76513671875, 2.9913330078125, 3.217529296875, 3.4437255859375, 3.669921875, 3.8961181640625, 4.122314453125, 4.3485107421875, 4.57470703125, 4.8009033203125, 5.027099609375, 5.2532958984375, 5.4794921875, 5.7056884765625, 5.931884765625, 6.1580810546875, 6.38427734375, 6.6104736328125, 6.836669921875, 7.0628662109375, 7.2890625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 8.0, 10.0, 17.0, 24.0, 31.0, 48.0, 74.0, 122.0, 190.0, 398.0, 1083.0, 4781.0, 44502.0, 2676838.0, 1428713.0, 31847.0, 3811.0, 932.0, 350.0, 163.0, 99.0, 74.0, 43.0, 34.0, 19.0, 17.0, 12.0, 5.0, 4.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.78125, -19.1806640625, -18.580078125, -17.9794921875, -17.37890625, -16.7783203125, -16.177734375, -15.5771484375, -14.9765625, -14.3759765625, -13.775390625, -13.1748046875, -12.57421875, -11.9736328125, -11.373046875, -10.7724609375, -10.171875, -9.5712890625, -8.970703125, -8.3701171875, -7.76953125, -7.1689453125, -6.568359375, -5.9677734375, -5.3671875, -4.7666015625, -4.166015625, -3.5654296875, -2.96484375, -2.3642578125, -1.763671875, -1.1630859375, -0.5625, 0.0380859375, 0.638671875, 1.2392578125, 1.83984375, 2.4404296875, 3.041015625, 3.6416015625, 4.2421875, 4.8427734375, 5.443359375, 6.0439453125, 6.64453125, 7.2451171875, 7.845703125, 8.4462890625, 9.046875, 9.6474609375, 10.248046875, 10.8486328125, 11.44921875, 12.0498046875, 12.650390625, 13.2509765625, 13.8515625, 14.4521484375, 15.052734375, 15.6533203125, 16.25390625, 16.8544921875, 17.455078125, 18.0556640625, 18.65625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 5.0, 2.0, 6.0, 7.0, 4.0, 8.0, 8.0, 17.0, 11.0, 23.0, 28.0, 37.0, 48.0, 61.0, 92.0, 131.0, 182.0, 246.0, 298.0, 438.0, 536.0, 496.0, 387.0, 262.0, 209.0, 137.0, 91.0, 76.0, 47.0, 50.0, 29.0, 24.0, 21.0, 19.0, 9.0, 10.0, 7.0, 5.0, 3.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.10650634765625, -2.0274658203125, -1.94842529296875, -1.869384765625, -1.79034423828125, -1.7113037109375, -1.63226318359375, -1.55322265625, -1.47418212890625, -1.3951416015625, -1.31610107421875, -1.237060546875, -1.15802001953125, -1.0789794921875, -0.99993896484375, -0.9208984375, -0.84185791015625, -0.7628173828125, -0.68377685546875, -0.604736328125, -0.52569580078125, -0.4466552734375, -0.36761474609375, -0.28857421875, -0.20953369140625, -0.1304931640625, -0.05145263671875, 0.027587890625, 0.10662841796875, 0.1856689453125, 0.26470947265625, 0.34375, 0.42279052734375, 0.5018310546875, 0.58087158203125, 0.659912109375, 0.73895263671875, 0.8179931640625, 0.89703369140625, 0.97607421875, 1.05511474609375, 1.1341552734375, 1.21319580078125, 1.292236328125, 1.37127685546875, 1.4503173828125, 1.52935791015625, 1.6083984375, 1.68743896484375, 1.7664794921875, 1.84552001953125, 1.924560546875, 2.00360107421875, 2.0826416015625, 2.16168212890625, 2.24072265625, 2.31976318359375, 2.3988037109375, 2.47784423828125, 2.556884765625, 2.63592529296875, 2.7149658203125, 2.79400634765625, 2.873046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 5.0, 7.0, 7.0, 12.0, 13.0, 13.0, 20.0, 40.0, 39.0, 61.0, 65.0, 72.0, 95.0, 79.0, 94.0, 79.0, 61.0, 62.0, 44.0, 32.0, 21.0, 17.0, 12.0, 15.0, 6.0, 5.0, 5.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.28006649017334, -10.921660423278809, -10.563253402709961, -10.20484733581543, -9.846440315246582, -9.48803424835205, -9.129627227783203, -8.771221160888672, -8.41281509399414, -8.05440902709961, -7.696002006530762, -7.3375959396362305, -6.979189395904541, -6.620782852172852, -6.262376308441162, -5.903969764709473, -5.545563220977783, -5.187156677246094, -4.828750133514404, -4.470343589782715, -4.111937522888184, -3.753530979156494, -3.3951244354248047, -3.0367181301116943, -2.678311586380005, -2.3199050426483154, -1.961498737335205, -1.6030921936035156, -1.2446857690811157, -0.8862793445587158, -0.5278728008270264, -0.16946649551391602, 0.18894004821777344, 0.5473464727401733, 0.905752956867218, 1.2641594409942627, 1.6225658655166626, 1.9809722900390625, 2.339378833770752, 2.6977851390838623, 3.0561916828155518, 3.414598226547241, 3.7730045318603516, 4.131411075592041, 4.4898176193237305, 4.848223686218262, 5.206630706787109, 5.565036773681641, 5.92344331741333, 6.2818498611450195, 6.640256404876709, 6.998662948608398, 7.35706901550293, 7.715475559234619, 8.073882102966309, 8.43228816986084, 8.790695190429688, 9.149101257324219, 9.507508277893066, 9.865914344787598, 10.224321365356445, 10.582727432250977, 10.941133499145508, 11.299540519714355, 11.657946586608887]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 8.0, 7.0, 10.0, 13.0, 11.0, 16.0, 12.0, 21.0, 19.0, 26.0, 39.0, 34.0, 43.0, 56.0, 47.0, 44.0, 42.0, 52.0, 68.0, 35.0, 61.0, 39.0, 38.0, 38.0, 28.0, 31.0, 35.0, 27.0, 22.0, 17.0, 11.0, 7.0, 9.0, 11.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0408430099487305, -6.789460182189941, -6.538077354431152, -6.286694526672363, -6.035311698913574, -5.783928871154785, -5.532546043395996, -5.281163215637207, -5.029780387878418, -4.778397560119629, -4.52701473236084, -4.275631904602051, -4.024249076843262, -3.7728662490844727, -3.5214836597442627, -3.2701008319854736, -3.0187182426452637, -2.7673354148864746, -2.5159525871276855, -2.2645697593688965, -2.0131869316101074, -1.761804223060608, -1.5104215145111084, -1.2590386867523193, -1.0076558589935303, -0.7562730312347412, -0.5048902630805969, -0.25350749492645264, -0.0021246671676635742, 0.2492581605911255, 0.500640869140625, 0.7520236968994141, 1.0034065246582031, 1.2547893524169922, 1.5061721801757812, 1.7575548887252808, 2.0089378356933594, 2.2603206634521484, 2.5117032527923584, 2.7630860805511475, 3.0144689083099365, 3.2658517360687256, 3.5172345638275146, 3.7686171531677246, 4.019999980926514, 4.271382808685303, 4.522765636444092, 4.774148464202881, 5.02553129196167, 5.276914119720459, 5.528296947479248, 5.779679775238037, 6.031062602996826, 6.282445430755615, 6.533827781677246, 6.785210609436035, 7.036593437194824, 7.287976264953613, 7.539359092712402, 7.790741920471191, 8.04212474822998, 8.29350757598877, 8.544890403747559, 8.796273231506348, 9.047656059265137]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 7.0, 9.0, 16.0, 20.0, 39.0, 59.0, 100.0, 231.0, 575.0, 1933.0, 7134.0, 31281.0, 185635.0, 639816.0, 147506.0, 25513.0, 5945.0, 1732.0, 533.0, 206.0, 127.0, 49.0, 25.0, 19.0, 10.0, 6.0, 4.0, 7.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.546875, -4.4185791015625, -4.290283203125, -4.1619873046875, -4.03369140625, -3.9053955078125, -3.777099609375, -3.6488037109375, -3.5205078125, -3.3922119140625, -3.263916015625, -3.1356201171875, -3.00732421875, -2.8790283203125, -2.750732421875, -2.6224365234375, -2.494140625, -2.3658447265625, -2.237548828125, -2.1092529296875, -1.98095703125, -1.8526611328125, -1.724365234375, -1.5960693359375, -1.4677734375, -1.3394775390625, -1.211181640625, -1.0828857421875, -0.95458984375, -0.8262939453125, -0.697998046875, -0.5697021484375, -0.44140625, -0.3131103515625, -0.184814453125, -0.0565185546875, 0.07177734375, 0.2000732421875, 0.328369140625, 0.4566650390625, 0.5849609375, 0.7132568359375, 0.841552734375, 0.9698486328125, 1.09814453125, 1.2264404296875, 1.354736328125, 1.4830322265625, 1.611328125, 1.7396240234375, 1.867919921875, 1.9962158203125, 2.12451171875, 2.2528076171875, 2.381103515625, 2.5093994140625, 2.6376953125, 2.7659912109375, 2.894287109375, 3.0225830078125, 3.15087890625, 3.2791748046875, 3.407470703125, 3.5357666015625, 3.6640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 2.0, 8.0, 3.0, 5.0, 11.0, 12.0, 13.0, 11.0, 20.0, 28.0, 22.0, 37.0, 48.0, 49.0, 52.0, 71.0, 58.0, 68.0, 53.0, 65.0, 75.0, 51.0, 47.0, 33.0, 25.0, 30.0, 19.0, 23.0, 16.0, 11.0, 13.0, 8.0, 8.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3671875, -5.1732177734375, -4.979248046875, -4.7852783203125, -4.59130859375, -4.3973388671875, -4.203369140625, -4.0093994140625, -3.8154296875, -3.6214599609375, -3.427490234375, -3.2335205078125, -3.03955078125, -2.8455810546875, -2.651611328125, -2.4576416015625, -2.263671875, -2.0697021484375, -1.875732421875, -1.6817626953125, -1.48779296875, -1.2938232421875, -1.099853515625, -0.9058837890625, -0.7119140625, -0.5179443359375, -0.323974609375, -0.1300048828125, 0.06396484375, 0.2579345703125, 0.451904296875, 0.6458740234375, 0.83984375, 1.0338134765625, 1.227783203125, 1.4217529296875, 1.61572265625, 1.8096923828125, 2.003662109375, 2.1976318359375, 2.3916015625, 2.5855712890625, 2.779541015625, 2.9735107421875, 3.16748046875, 3.3614501953125, 3.555419921875, 3.7493896484375, 3.943359375, 4.1373291015625, 4.331298828125, 4.5252685546875, 4.71923828125, 4.9132080078125, 5.107177734375, 5.3011474609375, 5.4951171875, 5.6890869140625, 5.883056640625, 6.0770263671875, 6.27099609375, 6.4649658203125, 6.658935546875, 6.8529052734375, 7.046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 7.0, 9.0, 12.0, 28.0, 27.0, 57.0, 88.0, 167.0, 349.0, 719.0, 2100.0, 7392.0, 37985.0, 276879.0, 596521.0, 103766.0, 16492.0, 3770.0, 1150.0, 473.0, 238.0, 131.0, 72.0, 47.0, 24.0, 16.0, 10.0, 9.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.19140625, -4.07891845703125, -3.9664306640625, -3.85394287109375, -3.741455078125, -3.62896728515625, -3.5164794921875, -3.40399169921875, -3.29150390625, -3.17901611328125, -3.0665283203125, -2.95404052734375, -2.841552734375, -2.72906494140625, -2.6165771484375, -2.50408935546875, -2.3916015625, -2.27911376953125, -2.1666259765625, -2.05413818359375, -1.941650390625, -1.82916259765625, -1.7166748046875, -1.60418701171875, -1.49169921875, -1.37921142578125, -1.2667236328125, -1.15423583984375, -1.041748046875, -0.92926025390625, -0.8167724609375, -0.70428466796875, -0.591796875, -0.47930908203125, -0.3668212890625, -0.25433349609375, -0.141845703125, -0.02935791015625, 0.0831298828125, 0.19561767578125, 0.30810546875, 0.42059326171875, 0.5330810546875, 0.64556884765625, 0.758056640625, 0.87054443359375, 0.9830322265625, 1.09552001953125, 1.2080078125, 1.32049560546875, 1.4329833984375, 1.54547119140625, 1.657958984375, 1.77044677734375, 1.8829345703125, 1.99542236328125, 2.10791015625, 2.22039794921875, 2.3328857421875, 2.44537353515625, 2.557861328125, 2.67034912109375, 2.7828369140625, 2.89532470703125, 3.0078125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 1.0, 6.0, 5.0, 6.0, 8.0, 11.0, 10.0, 16.0, 13.0, 16.0, 32.0, 26.0, 30.0, 31.0, 37.0, 41.0, 55.0, 47.0, 40.0, 47.0, 56.0, 44.0, 51.0, 39.0, 49.0, 37.0, 32.0, 42.0, 36.0, 29.0, 18.0, 16.0, 8.0, 19.0, 12.0, 7.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.2486572265625, -7.958251953125, -7.6678466796875, -7.37744140625, -7.0870361328125, -6.796630859375, -6.5062255859375, -6.2158203125, -5.9254150390625, -5.635009765625, -5.3446044921875, -5.05419921875, -4.7637939453125, -4.473388671875, -4.1829833984375, -3.892578125, -3.6021728515625, -3.311767578125, -3.0213623046875, -2.73095703125, -2.4405517578125, -2.150146484375, -1.8597412109375, -1.5693359375, -1.2789306640625, -0.988525390625, -0.6981201171875, -0.40771484375, -0.1173095703125, 0.173095703125, 0.4635009765625, 0.75390625, 1.0443115234375, 1.334716796875, 1.6251220703125, 1.91552734375, 2.2059326171875, 2.496337890625, 2.7867431640625, 3.0771484375, 3.3675537109375, 3.657958984375, 3.9483642578125, 4.23876953125, 4.5291748046875, 4.819580078125, 5.1099853515625, 5.400390625, 5.6907958984375, 5.981201171875, 6.2716064453125, 6.56201171875, 6.8524169921875, 7.142822265625, 7.4332275390625, 7.7236328125, 8.0140380859375, 8.304443359375, 8.5948486328125, 8.88525390625, 9.1756591796875, 9.466064453125, 9.7564697265625, 10.046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 10.0, 13.0, 12.0, 16.0, 32.0, 35.0, 54.0, 88.0, 157.0, 266.0, 434.0, 850.0, 1577.0, 3382.0, 8183.0, 22813.0, 79542.0, 300283.0, 430834.0, 140587.0, 37715.0, 12259.0, 4790.0, 2165.0, 1050.0, 570.0, 327.0, 169.0, 130.0, 73.0, 43.0, 32.0, 18.0, 15.0, 10.0, 7.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81982421875, -0.7907638549804688, -0.7617034912109375, -0.7326431274414062, -0.703582763671875, -0.6745223999023438, -0.6454620361328125, -0.6164016723632812, -0.58734130859375, -0.5582809448242188, -0.5292205810546875, -0.5001602172851562, -0.471099853515625, -0.44203948974609375, -0.4129791259765625, -0.38391876220703125, -0.3548583984375, -0.32579803466796875, -0.2967376708984375, -0.26767730712890625, -0.238616943359375, -0.20955657958984375, -0.1804962158203125, -0.15143585205078125, -0.12237548828125, -0.09331512451171875, -0.0642547607421875, -0.03519439697265625, -0.006134033203125, 0.02292633056640625, 0.0519866943359375, 0.08104705810546875, 0.110107421875, 0.13916778564453125, 0.1682281494140625, 0.19728851318359375, 0.226348876953125, 0.25540924072265625, 0.2844696044921875, 0.31352996826171875, 0.34259033203125, 0.37165069580078125, 0.4007110595703125, 0.42977142333984375, 0.458831787109375, 0.48789215087890625, 0.5169525146484375, 0.5460128784179688, 0.5750732421875, 0.6041336059570312, 0.6331939697265625, 0.6622543334960938, 0.691314697265625, 0.7203750610351562, 0.7494354248046875, 0.7784957885742188, 0.80755615234375, 0.8366165161132812, 0.8656768798828125, 0.8947372436523438, 0.923797607421875, 0.9528579711914062, 0.9819183349609375, 1.0109786987304688, 1.0400390625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 16.0, 14.0, 18.0, 32.0, 43.0, 44.0, 63.0, 71.0, 87.0, 85.0, 102.0, 86.0, 103.0, 71.0, 53.0, 30.0, 24.0, 17.0, 12.0, 9.0, 9.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006046295166015625, -0.0005869641900062561, -0.0005692988634109497, -0.0005516335368156433, -0.0005339682102203369, -0.0005163028836250305, -0.0004986375570297241, -0.0004809722304344177, -0.00046330690383911133, -0.00044564157724380493, -0.00042797625064849854, -0.00041031092405319214, -0.00039264559745788574, -0.00037498027086257935, -0.00035731494426727295, -0.00033964961767196655, -0.00032198429107666016, -0.00030431896448135376, -0.00028665363788604736, -0.00026898831129074097, -0.00025132298469543457, -0.00023365765810012817, -0.00021599233150482178, -0.00019832700490951538, -0.00018066167831420898, -0.0001629963517189026, -0.0001453310251235962, -0.0001276656985282898, -0.0001100003719329834, -9.2335045337677e-05, -7.46697187423706e-05, -5.700439214706421e-05, -3.933906555175781e-05, -2.1673738956451416e-05, -4.0084123611450195e-06, 1.3656914234161377e-05, 3.1322240829467773e-05, 4.898756742477417e-05, 6.665289402008057e-05, 8.431822061538696e-05, 0.00010198354721069336, 0.00011964887380599976, 0.00013731420040130615, 0.00015497952699661255, 0.00017264485359191895, 0.00019031018018722534, 0.00020797550678253174, 0.00022564083337783813, 0.00024330615997314453, 0.00026097148656845093, 0.0002786368131637573, 0.0002963021397590637, 0.0003139674663543701, 0.0003316327929496765, 0.0003492981195449829, 0.0003669634461402893, 0.0003846287727355957, 0.0004022940993309021, 0.0004199594259262085, 0.0004376247525215149, 0.0004552900791168213, 0.0004729554057121277, 0.0004906207323074341, 0.0005082860589027405, 0.0005259513854980469]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 9.0, 8.0, 8.0, 24.0, 22.0, 34.0, 39.0, 57.0, 126.0, 198.0, 378.0, 760.0, 1771.0, 4661.0, 14324.0, 49855.0, 192224.0, 460345.0, 235836.0, 61242.0, 17101.0, 5581.0, 2045.0, 844.0, 449.0, 238.0, 130.0, 78.0, 48.0, 31.0, 24.0, 14.0, 13.0, 7.0, 9.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0], "bins": [-1.0439453125, -1.0137557983398438, -0.9835662841796875, -0.9533767700195312, -0.923187255859375, -0.8929977416992188, -0.8628082275390625, -0.8326187133789062, -0.80242919921875, -0.7722396850585938, -0.7420501708984375, -0.7118606567382812, -0.681671142578125, -0.6514816284179688, -0.6212921142578125, -0.5911026000976562, -0.5609130859375, -0.5307235717773438, -0.5005340576171875, -0.47034454345703125, -0.440155029296875, -0.40996551513671875, -0.3797760009765625, -0.34958648681640625, -0.31939697265625, -0.28920745849609375, -0.2590179443359375, -0.22882843017578125, -0.198638916015625, -0.16844940185546875, -0.1382598876953125, -0.10807037353515625, -0.077880859375, -0.04769134521484375, -0.0175018310546875, 0.01268768310546875, 0.042877197265625, 0.07306671142578125, 0.1032562255859375, 0.13344573974609375, 0.16363525390625, 0.19382476806640625, 0.2240142822265625, 0.25420379638671875, 0.284393310546875, 0.31458282470703125, 0.3447723388671875, 0.37496185302734375, 0.4051513671875, 0.43534088134765625, 0.4655303955078125, 0.49571990966796875, 0.525909423828125, 0.5560989379882812, 0.5862884521484375, 0.6164779663085938, 0.64666748046875, 0.6768569946289062, 0.7070465087890625, 0.7372360229492188, 0.767425537109375, 0.7976150512695312, 0.8278045654296875, 0.8579940795898438, 0.88818359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0, 7.0, 5.0, 19.0, 20.0, 12.0, 26.0, 30.0, 38.0, 35.0, 40.0, 55.0, 59.0, 62.0, 42.0, 65.0, 60.0, 63.0, 50.0, 49.0, 47.0, 39.0, 35.0, 28.0, 23.0, 23.0, 12.0, 13.0, 11.0, 5.0, 4.0, 7.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2161865234375, -0.20978927612304688, -0.20339202880859375, -0.19699478149414062, -0.1905975341796875, -0.18420028686523438, -0.17780303955078125, -0.17140579223632812, -0.165008544921875, -0.15861129760742188, -0.15221405029296875, -0.14581680297851562, -0.1394195556640625, -0.13302230834960938, -0.12662506103515625, -0.12022781372070312, -0.11383056640625, -0.10743331909179688, -0.10103607177734375, -0.09463882446289062, -0.0882415771484375, -0.08184432983398438, -0.07544708251953125, -0.06904983520507812, -0.062652587890625, -0.056255340576171875, -0.04985809326171875, -0.043460845947265625, -0.0370635986328125, -0.030666351318359375, -0.02426910400390625, -0.017871856689453125, -0.011474609375, -0.005077362060546875, 0.00131988525390625, 0.007717132568359375, 0.0141143798828125, 0.020511627197265625, 0.02690887451171875, 0.033306121826171875, 0.039703369140625, 0.046100616455078125, 0.05249786376953125, 0.058895111083984375, 0.0652923583984375, 0.07168960571289062, 0.07808685302734375, 0.08448410034179688, 0.09088134765625, 0.09727859497070312, 0.10367584228515625, 0.11007308959960938, 0.1164703369140625, 0.12286758422851562, 0.12926483154296875, 0.13566207885742188, 0.142059326171875, 0.14845657348632812, 0.15485382080078125, 0.16125106811523438, 0.1676483154296875, 0.17404556274414062, 0.18044281005859375, 0.18684005737304688, 0.1932373046875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 10.0, 5.0, 20.0, 27.0, 22.0, 51.0, 68.0, 104.0, 123.0, 123.0, 116.0, 98.0, 76.0, 37.0, 40.0, 20.0, 19.0, 8.0, 7.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.672966003417969, -10.371932983398438, -10.07089900970459, -9.769865989685059, -9.468832969665527, -9.167799949645996, -8.866765975952148, -8.565732955932617, -8.264699935913086, -7.9636664390563965, -7.662633419036865, -7.361599922180176, -7.0605669021606445, -6.759533405303955, -6.458499908447266, -6.157466888427734, -5.856433391571045, -5.5553998947143555, -5.254366874694824, -4.953333377838135, -4.6523003578186035, -4.351266860961914, -4.050233840942383, -3.7492003440856934, -3.448167085647583, -3.1471338272094727, -2.8461005687713623, -2.545067310333252, -2.2440338134765625, -1.9430006742477417, -1.6419672966003418, -1.3409340381622314, -1.039900779724121, -0.7388675212860107, -0.4378342032432556, -0.1368008852005005, 0.16423237323760986, 0.4652656316757202, 0.7662990093231201, 1.0673322677612305, 1.3683655261993408, 1.6693987846374512, 1.9704320430755615, 2.271465301513672, 2.5724987983703613, 2.8735318183898926, 3.174565315246582, 3.4755985736846924, 3.7766318321228027, 4.077665328979492, 4.378698348999023, 4.679731845855713, 4.980764865875244, 5.281798362731934, 5.582831382751465, 5.883864879608154, 6.184898376464844, 6.485931873321533, 6.7869648933410645, 7.087998390197754, 7.389031410217285, 7.690064907073975, 7.991098403930664, 8.292131423950195, 8.593164443969727]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 5.0, 4.0, 14.0, 7.0, 11.0, 12.0, 9.0, 22.0, 19.0, 25.0, 28.0, 43.0, 39.0, 58.0, 53.0, 41.0, 64.0, 65.0, 64.0, 57.0, 54.0, 37.0, 44.0, 38.0, 35.0, 31.0, 27.0, 15.0, 18.0, 12.0, 9.0, 12.0, 12.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.793221473693848, -4.625319480895996, -4.4574174880981445, -4.289515495300293, -4.121613502502441, -3.95371150970459, -3.785809278488159, -3.6179072856903076, -3.450005292892456, -3.2821033000946045, -3.114201307296753, -2.9462990760803223, -2.7783970832824707, -2.610495090484619, -2.4425930976867676, -2.274691104888916, -2.1067891120910645, -1.938887119293213, -1.7709851264953613, -1.6030830144882202, -1.4351810216903687, -1.267279028892517, -1.099376916885376, -0.9314749240875244, -0.7635729312896729, -0.5956709384918213, -0.42776888608932495, -0.2598668336868286, -0.09196484088897705, 0.07593715190887451, 0.24383926391601562, 0.4117412567138672, 0.579643726348877, 0.7475457191467285, 0.9154477715492249, 1.0833498239517212, 1.2512518167495728, 1.4191538095474243, 1.5870559215545654, 1.754957914352417, 1.9228599071502686, 2.09076189994812, 2.2586638927459717, 2.4265661239624023, 2.594468116760254, 2.7623701095581055, 2.930272102355957, 3.0981740951538086, 3.26607608795166, 3.4339780807495117, 3.6018800735473633, 3.769782066345215, 3.9376840591430664, 4.105586051940918, 4.2734880447387695, 4.441390037536621, 4.609292030334473, 4.777194023132324, 4.945096015930176, 5.112998008728027, 5.280900001525879, 5.4488019943237305, 5.616703987121582, 5.784605979919434, 5.952508449554443]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 5.0, 2.0, 10.0, 4.0, 7.0, 9.0, 8.0, 12.0, 23.0, 40.0, 68.0, 249.0, 1532.0, 23366.0, 948430.0, 71121.0, 3020.0, 379.0, 123.0, 41.0, 22.0, 17.0, 13.0, 5.0, 9.0, 6.0, 4.0, 4.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.984375, -21.18896484375, -20.3935546875, -19.59814453125, -18.802734375, -18.00732421875, -17.2119140625, -16.41650390625, -15.62109375, -14.82568359375, -14.0302734375, -13.23486328125, -12.439453125, -11.64404296875, -10.8486328125, -10.05322265625, -9.2578125, -8.46240234375, -7.6669921875, -6.87158203125, -6.076171875, -5.28076171875, -4.4853515625, -3.68994140625, -2.89453125, -2.09912109375, -1.3037109375, -0.50830078125, 0.287109375, 1.08251953125, 1.8779296875, 2.67333984375, 3.46875, 4.26416015625, 5.0595703125, 5.85498046875, 6.650390625, 7.44580078125, 8.2412109375, 9.03662109375, 9.83203125, 10.62744140625, 11.4228515625, 12.21826171875, 13.013671875, 13.80908203125, 14.6044921875, 15.39990234375, 16.1953125, 16.99072265625, 17.7861328125, 18.58154296875, 19.376953125, 20.17236328125, 20.9677734375, 21.76318359375, 22.55859375, 23.35400390625, 24.1494140625, 24.94482421875, 25.740234375, 26.53564453125, 27.3310546875, 28.12646484375, 28.921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 5.0, 6.0, 10.0, 9.0, 5.0, 9.0, 10.0, 13.0, 19.0, 12.0, 30.0, 28.0, 39.0, 40.0, 40.0, 49.0, 69.0, 79.0, 60.0, 66.0, 64.0, 54.0, 34.0, 41.0, 35.0, 35.0, 28.0, 24.0, 16.0, 17.0, 17.0, 12.0, 8.0, 4.0, 9.0, 7.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.453125, -10.100341796875, -9.74755859375, -9.394775390625, -9.0419921875, -8.689208984375, -8.33642578125, -7.983642578125, -7.630859375, -7.278076171875, -6.92529296875, -6.572509765625, -6.2197265625, -5.866943359375, -5.51416015625, -5.161376953125, -4.80859375, -4.455810546875, -4.10302734375, -3.750244140625, -3.3974609375, -3.044677734375, -2.69189453125, -2.339111328125, -1.986328125, -1.633544921875, -1.28076171875, -0.927978515625, -0.5751953125, -0.222412109375, 0.13037109375, 0.483154296875, 0.8359375, 1.188720703125, 1.54150390625, 1.894287109375, 2.2470703125, 2.599853515625, 2.95263671875, 3.305419921875, 3.658203125, 4.010986328125, 4.36376953125, 4.716552734375, 5.0693359375, 5.422119140625, 5.77490234375, 6.127685546875, 6.48046875, 6.833251953125, 7.18603515625, 7.538818359375, 7.8916015625, 8.244384765625, 8.59716796875, 8.949951171875, 9.302734375, 9.655517578125, 10.00830078125, 10.361083984375, 10.7138671875, 11.066650390625, 11.41943359375, 11.772216796875, 12.125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 6.0, 3.0, 8.0, 6.0, 9.0, 4.0, 13.0, 17.0, 26.0, 25.0, 33.0, 31.0, 55.0, 68.0, 86.0, 107.0, 157.0, 273.0, 893.0, 4540.0, 46040.0, 754061.0, 225521.0, 13366.0, 1947.0, 506.0, 207.0, 132.0, 80.0, 62.0, 55.0, 39.0, 40.0, 25.0, 27.0, 21.0, 12.0, 12.0, 7.0, 17.0, 8.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.171875, -11.80029296875, -11.4287109375, -11.05712890625, -10.685546875, -10.31396484375, -9.9423828125, -9.57080078125, -9.19921875, -8.82763671875, -8.4560546875, -8.08447265625, -7.712890625, -7.34130859375, -6.9697265625, -6.59814453125, -6.2265625, -5.85498046875, -5.4833984375, -5.11181640625, -4.740234375, -4.36865234375, -3.9970703125, -3.62548828125, -3.25390625, -2.88232421875, -2.5107421875, -2.13916015625, -1.767578125, -1.39599609375, -1.0244140625, -0.65283203125, -0.28125, 0.09033203125, 0.4619140625, 0.83349609375, 1.205078125, 1.57666015625, 1.9482421875, 2.31982421875, 2.69140625, 3.06298828125, 3.4345703125, 3.80615234375, 4.177734375, 4.54931640625, 4.9208984375, 5.29248046875, 5.6640625, 6.03564453125, 6.4072265625, 6.77880859375, 7.150390625, 7.52197265625, 7.8935546875, 8.26513671875, 8.63671875, 9.00830078125, 9.3798828125, 9.75146484375, 10.123046875, 10.49462890625, 10.8662109375, 11.23779296875, 11.609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 7.0, 3.0, 3.0, 11.0, 6.0, 8.0, 15.0, 15.0, 13.0, 11.0, 28.0, 25.0, 30.0, 28.0, 39.0, 42.0, 39.0, 37.0, 34.0, 40.0, 53.0, 46.0, 39.0, 44.0, 48.0, 40.0, 35.0, 30.0, 28.0, 24.0, 29.0, 24.0, 20.0, 16.0, 14.0, 7.0, 10.0, 13.0, 12.0, 9.0, 6.0, 3.0, 2.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0], "bins": [-9.53125, -9.25848388671875, -8.9857177734375, -8.71295166015625, -8.440185546875, -8.16741943359375, -7.8946533203125, -7.62188720703125, -7.34912109375, -7.07635498046875, -6.8035888671875, -6.53082275390625, -6.258056640625, -5.98529052734375, -5.7125244140625, -5.43975830078125, -5.1669921875, -4.89422607421875, -4.6214599609375, -4.34869384765625, -4.075927734375, -3.80316162109375, -3.5303955078125, -3.25762939453125, -2.98486328125, -2.71209716796875, -2.4393310546875, -2.16656494140625, -1.893798828125, -1.62103271484375, -1.3482666015625, -1.07550048828125, -0.802734375, -0.52996826171875, -0.2572021484375, 0.01556396484375, 0.288330078125, 0.56109619140625, 0.8338623046875, 1.10662841796875, 1.37939453125, 1.65216064453125, 1.9249267578125, 2.19769287109375, 2.470458984375, 2.74322509765625, 3.0159912109375, 3.28875732421875, 3.5615234375, 3.83428955078125, 4.1070556640625, 4.37982177734375, 4.652587890625, 4.92535400390625, 5.1981201171875, 5.47088623046875, 5.74365234375, 6.01641845703125, 6.2891845703125, 6.56195068359375, 6.834716796875, 7.10748291015625, 7.3802490234375, 7.65301513671875, 7.92578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 6.0, 13.0, 16.0, 22.0, 26.0, 25.0, 49.0, 81.0, 132.0, 254.0, 462.0, 894.0, 1917.0, 4546.0, 12531.0, 45634.0, 214483.0, 542037.0, 170582.0, 36836.0, 10733.0, 3847.0, 1600.0, 788.0, 402.0, 227.0, 146.0, 66.0, 67.0, 33.0, 26.0, 14.0, 22.0, 8.0, 6.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6982421875, -1.6474456787109375, -1.596649169921875, -1.5458526611328125, -1.49505615234375, -1.4442596435546875, -1.393463134765625, -1.3426666259765625, -1.2918701171875, -1.2410736083984375, -1.190277099609375, -1.1394805908203125, -1.08868408203125, -1.0378875732421875, -0.987091064453125, -0.9362945556640625, -0.885498046875, -0.8347015380859375, -0.783905029296875, -0.7331085205078125, -0.68231201171875, -0.6315155029296875, -0.580718994140625, -0.5299224853515625, -0.4791259765625, -0.4283294677734375, -0.377532958984375, -0.3267364501953125, -0.27593994140625, -0.2251434326171875, -0.174346923828125, -0.1235504150390625, -0.07275390625, -0.0219573974609375, 0.028839111328125, 0.0796356201171875, 0.13043212890625, 0.1812286376953125, 0.232025146484375, 0.2828216552734375, 0.3336181640625, 0.3844146728515625, 0.435211181640625, 0.4860076904296875, 0.53680419921875, 0.5876007080078125, 0.638397216796875, 0.6891937255859375, 0.739990234375, 0.7907867431640625, 0.841583251953125, 0.8923797607421875, 0.94317626953125, 0.9939727783203125, 1.044769287109375, 1.0955657958984375, 1.1463623046875, 1.1971588134765625, 1.247955322265625, 1.2987518310546875, 1.34954833984375, 1.4003448486328125, 1.451141357421875, 1.5019378662109375, 1.552734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 4.0, 6.0, 8.0, 4.0, 12.0, 14.0, 15.0, 30.0, 26.0, 42.0, 46.0, 76.0, 97.0, 91.0, 84.0, 96.0, 97.0, 75.0, 37.0, 33.0, 23.0, 19.0, 19.0, 12.0, 12.0, 11.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003116130828857422, -0.00030332058668136597, -0.00029502809047698975, -0.0002867355942726135, -0.0002784430980682373, -0.0002701506018638611, -0.00026185810565948486, -0.00025356560945510864, -0.0002452731132507324, -0.0002369806170463562, -0.00022868812084197998, -0.00022039562463760376, -0.00021210312843322754, -0.00020381063222885132, -0.0001955181360244751, -0.00018722563982009888, -0.00017893314361572266, -0.00017064064741134644, -0.00016234815120697021, -0.000154055655002594, -0.00014576315879821777, -0.00013747066259384155, -0.00012917816638946533, -0.00012088567018508911, -0.00011259317398071289, -0.00010430067777633667, -9.600818157196045e-05, -8.771568536758423e-05, -7.942318916320801e-05, -7.113069295883179e-05, -6.283819675445557e-05, -5.4545700550079346e-05, -4.6253204345703125e-05, -3.7960708141326904e-05, -2.9668211936950684e-05, -2.1375715732574463e-05, -1.3083219528198242e-05, -4.7907233238220215e-06, 3.5017728805541992e-06, 1.179426908493042e-05, 2.008676528930664e-05, 2.837926149368286e-05, 3.667175769805908e-05, 4.49642539024353e-05, 5.3256750106811523e-05, 6.154924631118774e-05, 6.984174251556396e-05, 7.813423871994019e-05, 8.64267349243164e-05, 9.471923112869263e-05, 0.00010301172733306885, 0.00011130422353744507, 0.00011959671974182129, 0.0001278892159461975, 0.00013618171215057373, 0.00014447420835494995, 0.00015276670455932617, 0.0001610592007637024, 0.0001693516969680786, 0.00017764419317245483, 0.00018593668937683105, 0.00019422918558120728, 0.0002025216817855835, 0.00021081417798995972, 0.00021910667419433594]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 0.0, 8.0, 5.0, 8.0, 10.0, 10.0, 23.0, 34.0, 42.0, 77.0, 87.0, 148.0, 280.0, 535.0, 978.0, 2078.0, 5157.0, 16063.0, 62831.0, 308547.0, 491907.0, 119244.0, 26868.0, 7847.0, 2883.0, 1286.0, 651.0, 329.0, 230.0, 147.0, 80.0, 57.0, 38.0, 16.0, 16.0, 5.0, 11.0, 4.0, 4.0, 6.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5595703125, -1.5079345703125, -1.456298828125, -1.4046630859375, -1.35302734375, -1.3013916015625, -1.249755859375, -1.1981201171875, -1.146484375, -1.0948486328125, -1.043212890625, -0.9915771484375, -0.93994140625, -0.8883056640625, -0.836669921875, -0.7850341796875, -0.7333984375, -0.6817626953125, -0.630126953125, -0.5784912109375, -0.52685546875, -0.4752197265625, -0.423583984375, -0.3719482421875, -0.3203125, -0.2686767578125, -0.217041015625, -0.1654052734375, -0.11376953125, -0.0621337890625, -0.010498046875, 0.0411376953125, 0.0927734375, 0.1444091796875, 0.196044921875, 0.2476806640625, 0.29931640625, 0.3509521484375, 0.402587890625, 0.4542236328125, 0.505859375, 0.5574951171875, 0.609130859375, 0.6607666015625, 0.71240234375, 0.7640380859375, 0.815673828125, 0.8673095703125, 0.9189453125, 0.9705810546875, 1.022216796875, 1.0738525390625, 1.12548828125, 1.1771240234375, 1.228759765625, 1.2803955078125, 1.33203125, 1.3836669921875, 1.435302734375, 1.4869384765625, 1.53857421875, 1.5902099609375, 1.641845703125, 1.6934814453125, 1.7451171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 3.0, 9.0, 8.0, 8.0, 19.0, 17.0, 27.0, 39.0, 51.0, 62.0, 76.0, 68.0, 90.0, 106.0, 73.0, 88.0, 58.0, 54.0, 34.0, 31.0, 26.0, 5.0, 10.0, 6.0, 5.0, 5.0, 9.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86083984375, -0.833984375, -0.80712890625, -0.7802734375, -0.75341796875, -0.7265625, -0.69970703125, -0.6728515625, -0.64599609375, -0.619140625, -0.59228515625, -0.5654296875, -0.53857421875, -0.51171875, -0.48486328125, -0.4580078125, -0.43115234375, -0.404296875, -0.37744140625, -0.3505859375, -0.32373046875, -0.296875, -0.27001953125, -0.2431640625, -0.21630859375, -0.189453125, -0.16259765625, -0.1357421875, -0.10888671875, -0.08203125, -0.05517578125, -0.0283203125, -0.00146484375, 0.025390625, 0.05224609375, 0.0791015625, 0.10595703125, 0.1328125, 0.15966796875, 0.1865234375, 0.21337890625, 0.240234375, 0.26708984375, 0.2939453125, 0.32080078125, 0.34765625, 0.37451171875, 0.4013671875, 0.42822265625, 0.455078125, 0.48193359375, 0.5087890625, 0.53564453125, 0.5625, 0.58935546875, 0.6162109375, 0.64306640625, 0.669921875, 0.69677734375, 0.7236328125, 0.75048828125, 0.77734375, 0.80419921875, 0.8310546875, 0.85791015625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 8.0, 3.0, 2.0, 14.0, 12.0, 23.0, 39.0, 58.0, 88.0, 108.0, 141.0, 137.0, 121.0, 83.0, 52.0, 38.0, 30.0, 10.0, 12.0, 6.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0128755569458, -14.361383438110352, -13.709890365600586, -13.058398246765137, -12.406906127929688, -11.755414009094238, -11.103921890258789, -10.452428817749023, -9.800936698913574, -9.149444580078125, -8.49795150756836, -7.84645938873291, -7.194967269897461, -6.543475151062012, -5.891982555389404, -5.240489959716797, -4.588997840881348, -3.9375054836273193, -3.286013126373291, -2.6345207691192627, -1.9830284118652344, -1.331536054611206, -0.6800436973571777, -0.028551101684570312, 0.6229410171508789, 1.2744333744049072, 1.9259257316589355, 2.577418088912964, 3.228910446166992, 3.8804028034210205, 4.531895160675049, 5.183387756347656, 5.834880828857422, 6.486372947692871, 7.1378655433654785, 7.789358139038086, 8.440850257873535, 9.092342376708984, 9.74383544921875, 10.3953275680542, 11.046819686889648, 11.698311805725098, 12.349803924560547, 13.001296997070312, 13.652789115905762, 14.304281234741211, 14.955774307250977, 15.607266426086426, 16.258758544921875, 16.91025161743164, 17.561742782592773, 18.21323585510254, 18.864727020263672, 19.516220092773438, 20.167713165283203, 20.81920623779297, 21.4706974029541, 22.122190475463867, 22.773681640625, 23.425174713134766, 24.07666778564453, 24.728158950805664, 25.37965202331543, 26.031143188476562, 26.682636260986328]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 5.0, 4.0, 7.0, 2.0, 9.0, 11.0, 16.0, 20.0, 21.0, 20.0, 21.0, 25.0, 33.0, 25.0, 34.0, 41.0, 38.0, 44.0, 48.0, 49.0, 50.0, 45.0, 60.0, 46.0, 48.0, 40.0, 30.0, 43.0, 27.0, 34.0, 16.0, 22.0, 10.0, 14.0, 11.0, 7.0, 6.0, 9.0, 3.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.328516006469727, -15.770965576171875, -15.213414192199707, -14.655863761901855, -14.098312377929688, -13.540761947631836, -12.983211517333984, -12.425661087036133, -11.868109703063965, -11.310559272766113, -10.753007888793945, -10.195457458496094, -9.637907028198242, -9.080355644226074, -8.522805213928223, -7.965254306793213, -7.407703399658203, -6.850152492523193, -6.292601585388184, -5.735051155090332, -5.177500247955322, -4.6199493408203125, -4.062398910522461, -3.504848003387451, -2.9472970962524414, -2.3897461891174316, -1.832195520401001, -1.2746447324752808, -0.7170939445495605, -0.15954303741455078, 0.3980076313018799, 0.9555583000183105, 1.5131092071533203, 2.07066011428833, 2.6282107830047607, 3.1857614517211914, 3.743312358856201, 4.300863265991211, 4.8584136962890625, 5.415964603424072, 5.973515510559082, 6.531066417694092, 7.088617324829102, 7.646167755126953, 8.203718185424805, 8.761269569396973, 9.318819999694824, 9.876371383666992, 10.433921813964844, 10.991472244262695, 11.549023628234863, 12.106574058532715, 12.664125442504883, 13.221675872802734, 13.779226303100586, 14.336776733398438, 14.894328117370605, 15.451878547668457, 16.009429931640625, 16.566980361938477, 17.124530792236328, 17.682083129882812, 18.239633560180664, 18.797183990478516, 19.354734420776367]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 7.0, 7.0, 8.0, 11.0, 14.0, 24.0, 39.0, 38.0, 62.0, 78.0, 157.0, 203.0, 264.0, 450.0, 645.0, 1094.0, 1993.0, 3784.0, 8293.0, 20354.0, 64566.0, 290508.0, 1636812.0, 1729117.0, 321898.0, 74537.0, 22173.0, 8395.0, 3816.0, 1921.0, 1073.0, 695.0, 439.0, 276.0, 160.0, 110.0, 62.0, 53.0, 46.0, 27.0, 22.0, 15.0, 11.0, 9.0, 1.0, 7.0, 4.0, 2.0, 1.0, 1.0], "bins": [-8.5078125, -8.27801513671875, -8.0482177734375, -7.81842041015625, -7.588623046875, -7.35882568359375, -7.1290283203125, -6.89923095703125, -6.66943359375, -6.43963623046875, -6.2098388671875, -5.98004150390625, -5.750244140625, -5.52044677734375, -5.2906494140625, -5.06085205078125, -4.8310546875, -4.60125732421875, -4.3714599609375, -4.14166259765625, -3.911865234375, -3.68206787109375, -3.4522705078125, -3.22247314453125, -2.99267578125, -2.76287841796875, -2.5330810546875, -2.30328369140625, -2.073486328125, -1.84368896484375, -1.6138916015625, -1.38409423828125, -1.154296875, -0.92449951171875, -0.6947021484375, -0.46490478515625, -0.235107421875, -0.00531005859375, 0.2244873046875, 0.45428466796875, 0.68408203125, 0.91387939453125, 1.1436767578125, 1.37347412109375, 1.603271484375, 1.83306884765625, 2.0628662109375, 2.29266357421875, 2.5224609375, 2.75225830078125, 2.9820556640625, 3.21185302734375, 3.441650390625, 3.67144775390625, 3.9012451171875, 4.13104248046875, 4.36083984375, 4.59063720703125, 4.8204345703125, 5.05023193359375, 5.280029296875, 5.50982666015625, 5.7396240234375, 5.96942138671875, 6.19921875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 7.0, 7.0, 9.0, 8.0, 10.0, 13.0, 25.0, 18.0, 25.0, 27.0, 36.0, 42.0, 46.0, 47.0, 60.0, 61.0, 58.0, 74.0, 56.0, 57.0, 45.0, 50.0, 44.0, 33.0, 25.0, 22.0, 21.0, 18.0, 10.0, 10.0, 12.0, 6.0, 3.0, 4.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.5223388671875, -6.286865234375, -6.0513916015625, -5.81591796875, -5.5804443359375, -5.344970703125, -5.1094970703125, -4.8740234375, -4.6385498046875, -4.403076171875, -4.1676025390625, -3.93212890625, -3.6966552734375, -3.461181640625, -3.2257080078125, -2.990234375, -2.7547607421875, -2.519287109375, -2.2838134765625, -2.04833984375, -1.8128662109375, -1.577392578125, -1.3419189453125, -1.1064453125, -0.8709716796875, -0.635498046875, -0.4000244140625, -0.16455078125, 0.0709228515625, 0.306396484375, 0.5418701171875, 0.77734375, 1.0128173828125, 1.248291015625, 1.4837646484375, 1.71923828125, 1.9547119140625, 2.190185546875, 2.4256591796875, 2.6611328125, 2.8966064453125, 3.132080078125, 3.3675537109375, 3.60302734375, 3.8385009765625, 4.073974609375, 4.3094482421875, 4.544921875, 4.7803955078125, 5.015869140625, 5.2513427734375, 5.48681640625, 5.7222900390625, 5.957763671875, 6.1932373046875, 6.4287109375, 6.6641845703125, 6.899658203125, 7.1351318359375, 7.37060546875, 7.6060791015625, 7.841552734375, 8.0770263671875, 8.3125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 8.0, 6.0, 3.0, 3.0, 10.0, 31.0, 27.0, 47.0, 77.0, 135.0, 293.0, 1086.0, 6655.0, 172134.0, 3954048.0, 54655.0, 3834.0, 695.0, 245.0, 119.0, 63.0, 43.0, 18.0, 14.0, 18.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.96875, -27.22021484375, -26.4716796875, -25.72314453125, -24.974609375, -24.22607421875, -23.4775390625, -22.72900390625, -21.98046875, -21.23193359375, -20.4833984375, -19.73486328125, -18.986328125, -18.23779296875, -17.4892578125, -16.74072265625, -15.9921875, -15.24365234375, -14.4951171875, -13.74658203125, -12.998046875, -12.24951171875, -11.5009765625, -10.75244140625, -10.00390625, -9.25537109375, -8.5068359375, -7.75830078125, -7.009765625, -6.26123046875, -5.5126953125, -4.76416015625, -4.015625, -3.26708984375, -2.5185546875, -1.77001953125, -1.021484375, -0.27294921875, 0.4755859375, 1.22412109375, 1.97265625, 2.72119140625, 3.4697265625, 4.21826171875, 4.966796875, 5.71533203125, 6.4638671875, 7.21240234375, 7.9609375, 8.70947265625, 9.4580078125, 10.20654296875, 10.955078125, 11.70361328125, 12.4521484375, 13.20068359375, 13.94921875, 14.69775390625, 15.4462890625, 16.19482421875, 16.943359375, 17.69189453125, 18.4404296875, 19.18896484375, 19.9375]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 7.0, 8.0, 12.0, 11.0, 19.0, 34.0, 34.0, 43.0, 60.0, 94.0, 119.0, 193.0, 280.0, 425.0, 636.0, 647.0, 457.0, 313.0, 196.0, 123.0, 87.0, 68.0, 47.0, 41.0, 27.0, 16.0, 18.0, 13.0, 11.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.87890625, -2.796722412109375, -2.71453857421875, -2.632354736328125, -2.5501708984375, -2.467987060546875, -2.38580322265625, -2.303619384765625, -2.221435546875, -2.139251708984375, -2.05706787109375, -1.974884033203125, -1.8927001953125, -1.810516357421875, -1.72833251953125, -1.646148681640625, -1.56396484375, -1.481781005859375, -1.39959716796875, -1.317413330078125, -1.2352294921875, -1.153045654296875, -1.07086181640625, -0.988677978515625, -0.906494140625, -0.824310302734375, -0.74212646484375, -0.659942626953125, -0.5777587890625, -0.495574951171875, -0.41339111328125, -0.331207275390625, -0.2490234375, -0.166839599609375, -0.08465576171875, -0.002471923828125, 0.0797119140625, 0.161895751953125, 0.24407958984375, 0.326263427734375, 0.408447265625, 0.490631103515625, 0.57281494140625, 0.654998779296875, 0.7371826171875, 0.819366455078125, 0.90155029296875, 0.983734130859375, 1.06591796875, 1.148101806640625, 1.23028564453125, 1.312469482421875, 1.3946533203125, 1.476837158203125, 1.55902099609375, 1.641204833984375, 1.723388671875, 1.805572509765625, 1.88775634765625, 1.969940185546875, 2.0521240234375, 2.134307861328125, 2.21649169921875, 2.298675537109375, 2.380859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 5.0, 7.0, 5.0, 9.0, 14.0, 16.0, 33.0, 43.0, 65.0, 86.0, 93.0, 116.0, 133.0, 113.0, 76.0, 61.0, 40.0, 29.0, 11.0, 15.0, 7.0, 8.0, 7.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.62356185913086, -13.170117378234863, -12.716672897338867, -12.263228416442871, -11.809783935546875, -11.356339454650879, -10.902894973754883, -10.449450492858887, -9.99600601196289, -9.542561531066895, -9.089117050170898, -8.635672569274902, -8.182228088378906, -7.72878360748291, -7.275339126586914, -6.821894645690918, -6.368450164794922, -5.915005683898926, -5.46156120300293, -5.008116722106934, -4.5546722412109375, -4.101227760314941, -3.6477832794189453, -3.194338798522949, -2.740894317626953, -2.287449836730957, -1.834005355834961, -1.3805608749389648, -0.9271163940429688, -0.47367191314697266, -0.020227432250976562, 0.43321704864501953, 0.886662483215332, 1.3401069641113281, 1.7935514450073242, 2.2469959259033203, 2.7004404067993164, 3.1538848876953125, 3.6073293685913086, 4.060773849487305, 4.514218330383301, 4.967662811279297, 5.421107292175293, 5.874551773071289, 6.327996253967285, 6.781440734863281, 7.234885215759277, 7.688329696655273, 8.14177417755127, 8.595218658447266, 9.048663139343262, 9.502107620239258, 9.955552101135254, 10.40899658203125, 10.862441062927246, 11.315885543823242, 11.769330024719238, 12.222774505615234, 12.67621898651123, 13.129663467407227, 13.583107948303223, 14.036552429199219, 14.489996910095215, 14.943441390991211, 15.396885871887207]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 0.0, 2.0, 4.0, 3.0, 4.0, 7.0, 9.0, 16.0, 6.0, 8.0, 15.0, 20.0, 16.0, 24.0, 27.0, 35.0, 26.0, 29.0, 49.0, 43.0, 57.0, 48.0, 60.0, 45.0, 62.0, 48.0, 37.0, 45.0, 37.0, 34.0, 29.0, 31.0, 20.0, 19.0, 19.0, 15.0, 14.0, 10.0, 11.0, 12.0, 6.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.911253929138184, -5.67911434173584, -5.446974277496338, -5.214834690093994, -4.982694625854492, -4.750555038452148, -4.518415451049805, -4.286275863647461, -4.054135799407959, -3.821995973587036, -3.5898561477661133, -3.3577165603637695, -3.1255767345428467, -2.893436908721924, -2.66129732131958, -2.4291574954986572, -2.1970176696777344, -1.9648778438568115, -1.7327381372451782, -1.500598430633545, -1.268458604812622, -1.0363187789916992, -0.8041790723800659, -0.5720393657684326, -0.33989953994750977, -0.10775977373123169, 0.12437999248504639, 0.35651975870132446, 0.5886595249176025, 0.8207993507385254, 1.0529390573501587, 1.285078763961792, 1.5172185897827148, 1.7493584156036377, 1.981498122215271, 2.2136378288269043, 2.445777654647827, 2.67791748046875, 2.9100570678710938, 3.1421968936920166, 3.3743367195129395, 3.6064765453338623, 3.838616371154785, 4.070755958557129, 4.302895545959473, 4.535035610198975, 4.767175197601318, 4.99931526184082, 5.231454849243164, 5.463594436645508, 5.69573450088501, 5.9278740882873535, 6.1600141525268555, 6.392153739929199, 6.624293327331543, 6.856432914733887, 7.088572978973389, 7.320712566375732, 7.552852630615234, 7.784992218017578, 8.017131805419922, 8.249271392822266, 8.481411933898926, 8.71355152130127, 8.945691108703613]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 9.0, 12.0, 15.0, 26.0, 48.0, 92.0, 190.0, 455.0, 1099.0, 2726.0, 7615.0, 27234.0, 191433.0, 722631.0, 71003.0, 15737.0, 4988.0, 1768.0, 761.0, 359.0, 161.0, 83.0, 45.0, 22.0, 12.0, 5.0, 5.0, 3.0, 4.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.6015625, -4.478179931640625, -4.35479736328125, -4.231414794921875, -4.1080322265625, -3.984649658203125, -3.86126708984375, -3.737884521484375, -3.614501953125, -3.491119384765625, -3.36773681640625, -3.244354248046875, -3.1209716796875, -2.997589111328125, -2.87420654296875, -2.750823974609375, -2.62744140625, -2.504058837890625, -2.38067626953125, -2.257293701171875, -2.1339111328125, -2.010528564453125, -1.88714599609375, -1.763763427734375, -1.640380859375, -1.516998291015625, -1.39361572265625, -1.270233154296875, -1.1468505859375, -1.023468017578125, -0.90008544921875, -0.776702880859375, -0.6533203125, -0.529937744140625, -0.40655517578125, -0.283172607421875, -0.1597900390625, -0.036407470703125, 0.08697509765625, 0.210357666015625, 0.333740234375, 0.457122802734375, 0.58050537109375, 0.703887939453125, 0.8272705078125, 0.950653076171875, 1.07403564453125, 1.197418212890625, 1.32080078125, 1.444183349609375, 1.56756591796875, 1.690948486328125, 1.8143310546875, 1.937713623046875, 2.06109619140625, 2.184478759765625, 2.307861328125, 2.431243896484375, 2.55462646484375, 2.678009033203125, 2.8013916015625, 2.924774169921875, 3.04815673828125, 3.171539306640625, 3.294921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 2.0, 6.0, 7.0, 10.0, 7.0, 10.0, 10.0, 10.0, 12.0, 23.0, 20.0, 32.0, 40.0, 41.0, 39.0, 46.0, 52.0, 60.0, 62.0, 64.0, 61.0, 59.0, 43.0, 35.0, 46.0, 29.0, 27.0, 35.0, 22.0, 21.0, 15.0, 15.0, 9.0, 4.0, 2.0, 4.0, 14.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.37109375, -4.205078125, -4.0390625, -3.873046875, -3.70703125, -3.541015625, -3.375, -3.208984375, -3.04296875, -2.876953125, -2.7109375, -2.544921875, -2.37890625, -2.212890625, -2.046875, -1.880859375, -1.71484375, -1.548828125, -1.3828125, -1.216796875, -1.05078125, -0.884765625, -0.71875, -0.552734375, -0.38671875, -0.220703125, -0.0546875, 0.111328125, 0.27734375, 0.443359375, 0.609375, 0.775390625, 0.94140625, 1.107421875, 1.2734375, 1.439453125, 1.60546875, 1.771484375, 1.9375, 2.103515625, 2.26953125, 2.435546875, 2.6015625, 2.767578125, 2.93359375, 3.099609375, 3.265625, 3.431640625, 3.59765625, 3.763671875, 3.9296875, 4.095703125, 4.26171875, 4.427734375, 4.59375, 4.759765625, 4.92578125, 5.091796875, 5.2578125, 5.423828125, 5.58984375, 5.755859375, 5.921875, 6.087890625, 6.25390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 12.0, 11.0, 8.0, 14.0, 22.0, 21.0, 35.0, 50.0, 76.0, 136.0, 214.0, 539.0, 1420.0, 3813.0, 11575.0, 46577.0, 407411.0, 500273.0, 56138.0, 13214.0, 4195.0, 1506.0, 587.0, 309.0, 133.0, 83.0, 49.0, 32.0, 31.0, 14.0, 14.0, 5.0, 12.0, 3.0, 7.0, 3.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.892578125, -2.802337646484375, -2.71209716796875, -2.621856689453125, -2.5316162109375, -2.441375732421875, -2.35113525390625, -2.260894775390625, -2.170654296875, -2.080413818359375, -1.99017333984375, -1.899932861328125, -1.8096923828125, -1.719451904296875, -1.62921142578125, -1.538970947265625, -1.44873046875, -1.358489990234375, -1.26824951171875, -1.178009033203125, -1.0877685546875, -0.997528076171875, -0.90728759765625, -0.817047119140625, -0.726806640625, -0.636566162109375, -0.54632568359375, -0.456085205078125, -0.3658447265625, -0.275604248046875, -0.18536376953125, -0.095123291015625, -0.0048828125, 0.085357666015625, 0.17559814453125, 0.265838623046875, 0.3560791015625, 0.446319580078125, 0.53656005859375, 0.626800537109375, 0.717041015625, 0.807281494140625, 0.89752197265625, 0.987762451171875, 1.0780029296875, 1.168243408203125, 1.25848388671875, 1.348724365234375, 1.43896484375, 1.529205322265625, 1.61944580078125, 1.709686279296875, 1.7999267578125, 1.890167236328125, 1.98040771484375, 2.070648193359375, 2.160888671875, 2.251129150390625, 2.34136962890625, 2.431610107421875, 2.5218505859375, 2.612091064453125, 2.70233154296875, 2.792572021484375, 2.8828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 9.0, 3.0, 3.0, 4.0, 4.0, 4.0, 13.0, 10.0, 12.0, 13.0, 27.0, 21.0, 36.0, 26.0, 37.0, 31.0, 36.0, 33.0, 48.0, 47.0, 42.0, 51.0, 52.0, 53.0, 48.0, 44.0, 41.0, 35.0, 38.0, 33.0, 24.0, 29.0, 21.0, 13.0, 19.0, 9.0, 8.0, 5.0, 5.0, 4.0, 5.0, 1.0, 4.0, 2.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.6640625, -9.37841796875, -9.0927734375, -8.80712890625, -8.521484375, -8.23583984375, -7.9501953125, -7.66455078125, -7.37890625, -7.09326171875, -6.8076171875, -6.52197265625, -6.236328125, -5.95068359375, -5.6650390625, -5.37939453125, -5.09375, -4.80810546875, -4.5224609375, -4.23681640625, -3.951171875, -3.66552734375, -3.3798828125, -3.09423828125, -2.80859375, -2.52294921875, -2.2373046875, -1.95166015625, -1.666015625, -1.38037109375, -1.0947265625, -0.80908203125, -0.5234375, -0.23779296875, 0.0478515625, 0.33349609375, 0.619140625, 0.90478515625, 1.1904296875, 1.47607421875, 1.76171875, 2.04736328125, 2.3330078125, 2.61865234375, 2.904296875, 3.18994140625, 3.4755859375, 3.76123046875, 4.046875, 4.33251953125, 4.6181640625, 4.90380859375, 5.189453125, 5.47509765625, 5.7607421875, 6.04638671875, 6.33203125, 6.61767578125, 6.9033203125, 7.18896484375, 7.474609375, 7.76025390625, 8.0458984375, 8.33154296875, 8.6171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 10.0, 7.0, 10.0, 13.0, 15.0, 36.0, 46.0, 66.0, 107.0, 138.0, 251.0, 368.0, 603.0, 1109.0, 1952.0, 3867.0, 7879.0, 18244.0, 49015.0, 169643.0, 477770.0, 217067.0, 60022.0, 21602.0, 9128.0, 4373.0, 2218.0, 1148.0, 676.0, 432.0, 245.0, 178.0, 115.0, 53.0, 52.0, 26.0, 30.0, 17.0, 9.0, 11.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6350021362304688, -0.6142425537109375, -0.5934829711914062, -0.572723388671875, -0.5519638061523438, -0.5312042236328125, -0.5104446411132812, -0.48968505859375, -0.46892547607421875, -0.4481658935546875, -0.42740631103515625, -0.406646728515625, -0.38588714599609375, -0.3651275634765625, -0.34436798095703125, -0.3236083984375, -0.30284881591796875, -0.2820892333984375, -0.26132965087890625, -0.240570068359375, -0.21981048583984375, -0.1990509033203125, -0.17829132080078125, -0.15753173828125, -0.13677215576171875, -0.1160125732421875, -0.09525299072265625, -0.074493408203125, -0.05373382568359375, -0.0329742431640625, -0.01221466064453125, 0.008544921875, 0.02930450439453125, 0.0500640869140625, 0.07082366943359375, 0.091583251953125, 0.11234283447265625, 0.1331024169921875, 0.15386199951171875, 0.17462158203125, 0.19538116455078125, 0.2161407470703125, 0.23690032958984375, 0.257659912109375, 0.27841949462890625, 0.2991790771484375, 0.31993865966796875, 0.3406982421875, 0.36145782470703125, 0.3822174072265625, 0.40297698974609375, 0.423736572265625, 0.44449615478515625, 0.4652557373046875, 0.48601531982421875, 0.50677490234375, 0.5275344848632812, 0.5482940673828125, 0.5690536499023438, 0.589813232421875, 0.6105728149414062, 0.6313323974609375, 0.6520919799804688, 0.6728515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 4.0, 2.0, 5.0, 7.0, 19.0, 16.0, 24.0, 36.0, 40.0, 54.0, 107.0, 110.0, 130.0, 110.0, 102.0, 77.0, 36.0, 36.0, 29.0, 17.0, 10.0, 5.0, 9.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005903244018554688, -0.0005745589733123779, -0.0005587935447692871, -0.0005430281162261963, -0.0005272626876831055, -0.0005114972591400146, -0.0004957318305969238, -0.000479966402053833, -0.0004642009735107422, -0.00044843554496765137, -0.00043267011642456055, -0.0004169046878814697, -0.0004011392593383789, -0.0003853738307952881, -0.00036960840225219727, -0.00035384297370910645, -0.0003380775451660156, -0.0003223121166229248, -0.000306546688079834, -0.00029078125953674316, -0.00027501583099365234, -0.0002592504024505615, -0.0002434849739074707, -0.00022771954536437988, -0.00021195411682128906, -0.00019618868827819824, -0.00018042325973510742, -0.0001646578311920166, -0.00014889240264892578, -0.00013312697410583496, -0.00011736154556274414, -0.00010159611701965332, -8.58306884765625e-05, -7.006525993347168e-05, -5.429983139038086e-05, -3.853440284729004e-05, -2.276897430419922e-05, -7.0035457611083984e-06, 8.761882781982422e-06, 2.4527311325073242e-05, 4.029273986816406e-05, 5.605816841125488e-05, 7.18235969543457e-05, 8.758902549743652e-05, 0.00010335445404052734, 0.00011911988258361816, 0.00013488531112670898, 0.0001506507396697998, 0.00016641616821289062, 0.00018218159675598145, 0.00019794702529907227, 0.00021371245384216309, 0.0002294778823852539, 0.0002452433109283447, 0.00026100873947143555, 0.00027677416801452637, 0.0002925395965576172, 0.000308305025100708, 0.00032407045364379883, 0.00033983588218688965, 0.00035560131072998047, 0.0003713667392730713, 0.0003871321678161621, 0.00040289759635925293, 0.00041866302490234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 3.0, 5.0, 7.0, 15.0, 14.0, 25.0, 42.0, 67.0, 102.0, 201.0, 346.0, 580.0, 1332.0, 2664.0, 6383.0, 17477.0, 60418.0, 312158.0, 504714.0, 100232.0, 25887.0, 8981.0, 3549.0, 1616.0, 767.0, 414.0, 213.0, 120.0, 56.0, 48.0, 31.0, 24.0, 18.0, 13.0, 14.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8173828125, -0.7902908325195312, -0.7631988525390625, -0.7361068725585938, -0.709014892578125, -0.6819229125976562, -0.6548309326171875, -0.6277389526367188, -0.60064697265625, -0.5735549926757812, -0.5464630126953125, -0.5193710327148438, -0.492279052734375, -0.46518707275390625, -0.4380950927734375, -0.41100311279296875, -0.3839111328125, -0.35681915283203125, -0.3297271728515625, -0.30263519287109375, -0.275543212890625, -0.24845123291015625, -0.2213592529296875, -0.19426727294921875, -0.16717529296875, -0.14008331298828125, -0.1129913330078125, -0.08589935302734375, -0.058807373046875, -0.03171539306640625, -0.0046234130859375, 0.02246856689453125, 0.049560546875, 0.07665252685546875, 0.1037445068359375, 0.13083648681640625, 0.157928466796875, 0.18502044677734375, 0.2121124267578125, 0.23920440673828125, 0.26629638671875, 0.29338836669921875, 0.3204803466796875, 0.34757232666015625, 0.374664306640625, 0.40175628662109375, 0.4288482666015625, 0.45594024658203125, 0.4830322265625, 0.5101242065429688, 0.5372161865234375, 0.5643081665039062, 0.591400146484375, 0.6184921264648438, 0.6455841064453125, 0.6726760864257812, 0.69976806640625, 0.7268600463867188, 0.7539520263671875, 0.7810440063476562, 0.808135986328125, 0.8352279663085938, 0.8623199462890625, 0.8894119262695312, 0.91650390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 3.0, 3.0, 5.0, 0.0, 4.0, 9.0, 10.0, 9.0, 9.0, 6.0, 13.0, 14.0, 16.0, 22.0, 33.0, 31.0, 33.0, 38.0, 56.0, 76.0, 76.0, 77.0, 69.0, 72.0, 60.0, 47.0, 42.0, 32.0, 26.0, 23.0, 14.0, 15.0, 8.0, 6.0, 15.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.153076171875, -0.1483306884765625, -0.143585205078125, -0.1388397216796875, -0.13409423828125, -0.1293487548828125, -0.124603271484375, -0.1198577880859375, -0.1151123046875, -0.1103668212890625, -0.105621337890625, -0.1008758544921875, -0.09613037109375, -0.0913848876953125, -0.086639404296875, -0.0818939208984375, -0.0771484375, -0.0724029541015625, -0.067657470703125, -0.0629119873046875, -0.05816650390625, -0.0534210205078125, -0.048675537109375, -0.0439300537109375, -0.0391845703125, -0.0344390869140625, -0.029693603515625, -0.0249481201171875, -0.02020263671875, -0.0154571533203125, -0.010711669921875, -0.0059661865234375, -0.001220703125, 0.0035247802734375, 0.008270263671875, 0.0130157470703125, 0.01776123046875, 0.0225067138671875, 0.027252197265625, 0.0319976806640625, 0.0367431640625, 0.0414886474609375, 0.046234130859375, 0.0509796142578125, 0.05572509765625, 0.0604705810546875, 0.065216064453125, 0.0699615478515625, 0.07470703125, 0.0794525146484375, 0.084197998046875, 0.0889434814453125, 0.09368896484375, 0.0984344482421875, 0.103179931640625, 0.1079254150390625, 0.1126708984375, 0.1174163818359375, 0.122161865234375, 0.1269073486328125, 0.13165283203125, 0.1363983154296875, 0.141143798828125, 0.1458892822265625, 0.150634765625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 8.0, 12.0, 15.0, 22.0, 42.0, 63.0, 86.0, 126.0, 126.0, 145.0, 126.0, 78.0, 54.0, 29.0, 17.0, 14.0, 6.0, 8.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.928842544555664, -9.597585678100586, -9.266328811645508, -8.93507194519043, -8.603815078735352, -8.272558212280273, -7.9413018226623535, -7.610045433044434, -7.2787885665893555, -6.947531700134277, -6.616274833679199, -6.285017967224121, -5.953761577606201, -5.622504711151123, -5.291247844696045, -4.959991455078125, -4.628734111785889, -4.2974772453308105, -3.9662206172943115, -3.6349637508392334, -3.3037071228027344, -2.9724502563476562, -2.641193389892578, -2.309936761856079, -1.978679895401001, -1.6474231481552124, -1.3161664009094238, -0.9849095344543457, -0.6536527872085571, -0.32239603996276855, 0.00886082649230957, 0.3401174545288086, 0.6713743209838867, 1.0026310682296753, 1.3338878154754639, 1.665144681930542, 1.9964014291763306, 2.327658176422119, 2.6589150428771973, 2.9901716709136963, 3.3214285373687744, 3.6526854038238525, 3.9839420318603516, 4.31519889831543, 4.646455764770508, 4.977712631225586, 5.308969497680664, 5.640225887298584, 5.971482753753662, 6.30273962020874, 6.633996486663818, 6.965252876281738, 7.296509742736816, 7.6277666091918945, 7.959023475646973, 8.29028034210205, 8.621537208557129, 8.952794075012207, 9.284050941467285, 9.615307807922363, 9.946564674377441, 10.277820587158203, 10.609077453613281, 10.94033432006836, 11.271591186523438]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 1.0, 5.0, 1.0, 4.0, 7.0, 6.0, 3.0, 16.0, 12.0, 10.0, 9.0, 19.0, 21.0, 23.0, 33.0, 31.0, 36.0, 41.0, 42.0, 63.0, 57.0, 56.0, 58.0, 59.0, 53.0, 44.0, 45.0, 52.0, 27.0, 22.0, 26.0, 24.0, 13.0, 19.0, 20.0, 10.0, 10.0, 11.0, 6.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.895216941833496, -3.7402265071868896, -3.585235834121704, -3.4302453994750977, -3.275254726409912, -3.1202642917633057, -2.965273857116699, -2.8102831840515137, -2.6552927494049072, -2.500302314758301, -2.3453116416931152, -2.190321207046509, -2.0353307723999023, -1.8803400993347168, -1.7253496646881104, -1.5703591108322144, -1.4153685569763184, -1.2603780031204224, -1.1053874492645264, -0.9503970146179199, -0.7954064607620239, -0.6404159069061279, -0.4854254126548767, -0.3304349184036255, -0.1754443645477295, -0.020453840494155884, 0.13453668355941772, 0.28952720761299133, 0.44451773166656494, 0.5995082855224609, 0.7544987797737122, 0.9094892740249634, 1.0644793510437012, 1.2194699048995972, 1.3744604587554932, 1.5294508934020996, 1.6844414472579956, 1.8394320011138916, 1.994422435760498, 2.1494131088256836, 2.30440354347229, 2.4593939781188965, 2.614384651184082, 2.7693750858306885, 2.924365520477295, 3.0793561935424805, 3.234346628189087, 3.3893370628356934, 3.544327735900879, 3.6993181705474854, 3.854308843612671, 4.009299278259277, 4.164289951324463, 4.319280624389648, 4.474270820617676, 4.629261493682861, 4.784252166748047, 4.939242839813232, 5.09423303604126, 5.249223709106445, 5.404214382171631, 5.559205055236816, 5.714195251464844, 5.869185924530029, 6.024176120758057]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 8.0, 11.0, 10.0, 17.0, 27.0, 38.0, 79.0, 213.0, 669.0, 3616.0, 38376.0, 757250.0, 234170.0, 11804.0, 1645.0, 355.0, 127.0, 53.0, 32.0, 21.0, 12.0, 10.0, 4.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1328125, -13.71435546875, -13.2958984375, -12.87744140625, -12.458984375, -12.04052734375, -11.6220703125, -11.20361328125, -10.78515625, -10.36669921875, -9.9482421875, -9.52978515625, -9.111328125, -8.69287109375, -8.2744140625, -7.85595703125, -7.4375, -7.01904296875, -6.6005859375, -6.18212890625, -5.763671875, -5.34521484375, -4.9267578125, -4.50830078125, -4.08984375, -3.67138671875, -3.2529296875, -2.83447265625, -2.416015625, -1.99755859375, -1.5791015625, -1.16064453125, -0.7421875, -0.32373046875, 0.0947265625, 0.51318359375, 0.931640625, 1.35009765625, 1.7685546875, 2.18701171875, 2.60546875, 3.02392578125, 3.4423828125, 3.86083984375, 4.279296875, 4.69775390625, 5.1162109375, 5.53466796875, 5.953125, 6.37158203125, 6.7900390625, 7.20849609375, 7.626953125, 8.04541015625, 8.4638671875, 8.88232421875, 9.30078125, 9.71923828125, 10.1376953125, 10.55615234375, 10.974609375, 11.39306640625, 11.8115234375, 12.22998046875, 12.6484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 9.0, 13.0, 9.0, 8.0, 8.0, 10.0, 19.0, 29.0, 27.0, 30.0, 44.0, 35.0, 51.0, 51.0, 64.0, 60.0, 50.0, 59.0, 68.0, 53.0, 39.0, 43.0, 24.0, 44.0, 21.0, 23.0, 28.0, 13.0, 12.0, 16.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.734375, -8.3780517578125, -8.021728515625, -7.6654052734375, -7.30908203125, -6.9527587890625, -6.596435546875, -6.2401123046875, -5.8837890625, -5.5274658203125, -5.171142578125, -4.8148193359375, -4.45849609375, -4.1021728515625, -3.745849609375, -3.3895263671875, -3.033203125, -2.6768798828125, -2.320556640625, -1.9642333984375, -1.60791015625, -1.2515869140625, -0.895263671875, -0.5389404296875, -0.1826171875, 0.1737060546875, 0.530029296875, 0.8863525390625, 1.24267578125, 1.5989990234375, 1.955322265625, 2.3116455078125, 2.66796875, 3.0242919921875, 3.380615234375, 3.7369384765625, 4.09326171875, 4.4495849609375, 4.805908203125, 5.1622314453125, 5.5185546875, 5.8748779296875, 6.231201171875, 6.5875244140625, 6.94384765625, 7.3001708984375, 7.656494140625, 8.0128173828125, 8.369140625, 8.7254638671875, 9.081787109375, 9.4381103515625, 9.79443359375, 10.1507568359375, 10.507080078125, 10.8634033203125, 11.2197265625, 11.5760498046875, 11.932373046875, 12.2886962890625, 12.64501953125, 13.0013427734375, 13.357666015625, 13.7139892578125, 14.0703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 8.0, 4.0, 5.0, 9.0, 12.0, 12.0, 16.0, 35.0, 42.0, 42.0, 58.0, 76.0, 138.0, 224.0, 357.0, 848.0, 1941.0, 6100.0, 28009.0, 201820.0, 623958.0, 154250.0, 22243.0, 4960.0, 1681.0, 711.0, 347.0, 210.0, 131.0, 72.0, 61.0, 55.0, 32.0, 21.0, 14.0, 18.0, 9.0, 11.0, 8.0, 0.0, 5.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.15625, -5.97210693359375, -5.7879638671875, -5.60382080078125, -5.419677734375, -5.23553466796875, -5.0513916015625, -4.86724853515625, -4.68310546875, -4.49896240234375, -4.3148193359375, -4.13067626953125, -3.946533203125, -3.76239013671875, -3.5782470703125, -3.39410400390625, -3.2099609375, -3.02581787109375, -2.8416748046875, -2.65753173828125, -2.473388671875, -2.28924560546875, -2.1051025390625, -1.92095947265625, -1.73681640625, -1.55267333984375, -1.3685302734375, -1.18438720703125, -1.000244140625, -0.81610107421875, -0.6319580078125, -0.44781494140625, -0.263671875, -0.07952880859375, 0.1046142578125, 0.28875732421875, 0.472900390625, 0.65704345703125, 0.8411865234375, 1.02532958984375, 1.20947265625, 1.39361572265625, 1.5777587890625, 1.76190185546875, 1.946044921875, 2.13018798828125, 2.3143310546875, 2.49847412109375, 2.6826171875, 2.86676025390625, 3.0509033203125, 3.23504638671875, 3.419189453125, 3.60333251953125, 3.7874755859375, 3.97161865234375, 4.15576171875, 4.33990478515625, 4.5240478515625, 4.70819091796875, 4.892333984375, 5.07647705078125, 5.2606201171875, 5.44476318359375, 5.62890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 1.0, 6.0, 5.0, 12.0, 8.0, 11.0, 13.0, 11.0, 21.0, 20.0, 30.0, 18.0, 19.0, 21.0, 34.0, 28.0, 31.0, 36.0, 37.0, 41.0, 41.0, 41.0, 34.0, 36.0, 38.0, 41.0, 31.0, 27.0, 25.0, 33.0, 25.0, 39.0, 24.0, 26.0, 16.0, 23.0, 21.0, 15.0, 8.0, 8.0, 9.0, 9.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.28125, -8.9942626953125, -8.707275390625, -8.4202880859375, -8.13330078125, -7.8463134765625, -7.559326171875, -7.2723388671875, -6.9853515625, -6.6983642578125, -6.411376953125, -6.1243896484375, -5.83740234375, -5.5504150390625, -5.263427734375, -4.9764404296875, -4.689453125, -4.4024658203125, -4.115478515625, -3.8284912109375, -3.54150390625, -3.2545166015625, -2.967529296875, -2.6805419921875, -2.3935546875, -2.1065673828125, -1.819580078125, -1.5325927734375, -1.24560546875, -0.9586181640625, -0.671630859375, -0.3846435546875, -0.09765625, 0.1893310546875, 0.476318359375, 0.7633056640625, 1.05029296875, 1.3372802734375, 1.624267578125, 1.9112548828125, 2.1982421875, 2.4852294921875, 2.772216796875, 3.0592041015625, 3.34619140625, 3.6331787109375, 3.920166015625, 4.2071533203125, 4.494140625, 4.7811279296875, 5.068115234375, 5.3551025390625, 5.64208984375, 5.9290771484375, 6.216064453125, 6.5030517578125, 6.7900390625, 7.0770263671875, 7.364013671875, 7.6510009765625, 7.93798828125, 8.2249755859375, 8.511962890625, 8.7989501953125, 9.0859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 9.0, 7.0, 8.0, 17.0, 26.0, 25.0, 56.0, 83.0, 115.0, 261.0, 428.0, 942.0, 2163.0, 6375.0, 21631.0, 102511.0, 522577.0, 316056.0, 55089.0, 13091.0, 4039.0, 1501.0, 715.0, 330.0, 172.0, 115.0, 64.0, 41.0, 34.0, 19.0, 10.0, 12.0, 11.0, 6.0, 1.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.087890625, -2.0295867919921875, -1.971282958984375, -1.9129791259765625, -1.85467529296875, -1.7963714599609375, -1.738067626953125, -1.6797637939453125, -1.6214599609375, -1.5631561279296875, -1.504852294921875, -1.4465484619140625, -1.38824462890625, -1.3299407958984375, -1.271636962890625, -1.2133331298828125, -1.155029296875, -1.0967254638671875, -1.038421630859375, -0.9801177978515625, -0.92181396484375, -0.8635101318359375, -0.805206298828125, -0.7469024658203125, -0.6885986328125, -0.6302947998046875, -0.571990966796875, -0.5136871337890625, -0.45538330078125, -0.3970794677734375, -0.338775634765625, -0.2804718017578125, -0.22216796875, -0.1638641357421875, -0.105560302734375, -0.0472564697265625, 0.01104736328125, 0.0693511962890625, 0.127655029296875, 0.1859588623046875, 0.2442626953125, 0.3025665283203125, 0.360870361328125, 0.4191741943359375, 0.47747802734375, 0.5357818603515625, 0.594085693359375, 0.6523895263671875, 0.710693359375, 0.7689971923828125, 0.827301025390625, 0.8856048583984375, 0.94390869140625, 1.0022125244140625, 1.060516357421875, 1.1188201904296875, 1.1771240234375, 1.2354278564453125, 1.293731689453125, 1.3520355224609375, 1.41033935546875, 1.4686431884765625, 1.526947021484375, 1.5852508544921875, 1.6435546875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 7.0, 4.0, 4.0, 4.0, 8.0, 9.0, 12.0, 14.0, 21.0, 28.0, 50.0, 51.0, 57.0, 85.0, 90.0, 87.0, 107.0, 79.0, 67.0, 42.0, 33.0, 30.0, 34.0, 18.0, 14.0, 11.0, 8.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.00037479400634765625, -0.00036571361124515533, -0.0003566332161426544, -0.0003475528210401535, -0.0003384724259376526, -0.00032939203083515167, -0.00032031163573265076, -0.00031123124063014984, -0.0003021508455276489, -0.000293070450425148, -0.0002839900553226471, -0.0002749096602201462, -0.00026582926511764526, -0.00025674887001514435, -0.00024766847491264343, -0.00023858807981014252, -0.0002295076847076416, -0.00022042728960514069, -0.00021134689450263977, -0.00020226649940013885, -0.00019318610429763794, -0.00018410570919513702, -0.0001750253140926361, -0.0001659449189901352, -0.00015686452388763428, -0.00014778412878513336, -0.00013870373368263245, -0.00012962333858013153, -0.00012054294347763062, -0.0001114625483751297, -0.00010238215327262878, -9.330175817012787e-05, -8.422136306762695e-05, -7.514096796512604e-05, -6.606057286262512e-05, -5.6980177760124207e-05, -4.789978265762329e-05, -3.8819387555122375e-05, -2.973899245262146e-05, -2.0658597350120544e-05, -1.1578202247619629e-05, -2.4978071451187134e-06, 6.582587957382202e-06, 1.5662983059883118e-05, 2.4743378162384033e-05, 3.382377326488495e-05, 4.2904168367385864e-05, 5.198456346988678e-05, 6.10649585723877e-05, 7.014535367488861e-05, 7.922574877738953e-05, 8.830614387989044e-05, 9.738653898239136e-05, 0.00010646693408489227, 0.00011554732918739319, 0.0001246277242898941, 0.00013370811939239502, 0.00014278851449489594, 0.00015186890959739685, 0.00016094930469989777, 0.00017002969980239868, 0.0001791100949048996, 0.0001881904900074005, 0.00019727088510990143, 0.00020635128021240234]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 15.0, 20.0, 24.0, 27.0, 42.0, 68.0, 94.0, 155.0, 234.0, 362.0, 541.0, 974.0, 1672.0, 3058.0, 6326.0, 14341.0, 37629.0, 114406.0, 347545.0, 343420.0, 112598.0, 37181.0, 14228.0, 6326.0, 3066.0, 1678.0, 903.0, 557.0, 347.0, 215.0, 144.0, 104.0, 71.0, 46.0, 32.0, 15.0, 17.0, 10.0, 12.0, 11.0, 4.0, 6.0, 5.0, 5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.296875, -1.257568359375, -1.21826171875, -1.178955078125, -1.1396484375, -1.100341796875, -1.06103515625, -1.021728515625, -0.982421875, -0.943115234375, -0.90380859375, -0.864501953125, -0.8251953125, -0.785888671875, -0.74658203125, -0.707275390625, -0.66796875, -0.628662109375, -0.58935546875, -0.550048828125, -0.5107421875, -0.471435546875, -0.43212890625, -0.392822265625, -0.353515625, -0.314208984375, -0.27490234375, -0.235595703125, -0.1962890625, -0.156982421875, -0.11767578125, -0.078369140625, -0.0390625, 0.000244140625, 0.03955078125, 0.078857421875, 0.1181640625, 0.157470703125, 0.19677734375, 0.236083984375, 0.275390625, 0.314697265625, 0.35400390625, 0.393310546875, 0.4326171875, 0.471923828125, 0.51123046875, 0.550537109375, 0.58984375, 0.629150390625, 0.66845703125, 0.707763671875, 0.7470703125, 0.786376953125, 0.82568359375, 0.864990234375, 0.904296875, 0.943603515625, 0.98291015625, 1.022216796875, 1.0615234375, 1.100830078125, 1.14013671875, 1.179443359375, 1.21875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 6.0, 7.0, 13.0, 10.0, 11.0, 17.0, 24.0, 27.0, 30.0, 42.0, 45.0, 44.0, 57.0, 57.0, 60.0, 79.0, 68.0, 57.0, 63.0, 49.0, 44.0, 32.0, 31.0, 28.0, 24.0, 12.0, 9.0, 16.0, 8.0, 4.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.66455078125, -0.6433792114257812, -0.6222076416015625, -0.6010360717773438, -0.579864501953125, -0.5586929321289062, -0.5375213623046875, -0.5163497924804688, -0.49517822265625, -0.47400665283203125, -0.4528350830078125, -0.43166351318359375, -0.410491943359375, -0.38932037353515625, -0.3681488037109375, -0.34697723388671875, -0.3258056640625, -0.30463409423828125, -0.2834625244140625, -0.26229095458984375, -0.241119384765625, -0.21994781494140625, -0.1987762451171875, -0.17760467529296875, -0.15643310546875, -0.13526153564453125, -0.1140899658203125, -0.09291839599609375, -0.071746826171875, -0.05057525634765625, -0.0294036865234375, -0.00823211669921875, 0.012939453125, 0.03411102294921875, 0.0552825927734375, 0.07645416259765625, 0.097625732421875, 0.11879730224609375, 0.1399688720703125, 0.16114044189453125, 0.18231201171875, 0.20348358154296875, 0.2246551513671875, 0.24582672119140625, 0.266998291015625, 0.28816986083984375, 0.3093414306640625, 0.33051300048828125, 0.3516845703125, 0.37285614013671875, 0.3940277099609375, 0.41519927978515625, 0.436370849609375, 0.45754241943359375, 0.4787139892578125, 0.49988555908203125, 0.52105712890625, 0.5422286987304688, 0.5634002685546875, 0.5845718383789062, 0.605743408203125, 0.6269149780273438, 0.6480865478515625, 0.6692581176757812, 0.6904296875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 9.0, 15.0, 23.0, 67.0, 126.0, 244.0, 259.0, 140.0, 69.0, 24.0, 12.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.24296188354492, -52.03572082519531, -50.8284797668457, -49.621238708496094, -48.413997650146484, -47.206756591796875, -45.999515533447266, -44.792274475097656, -43.58502960205078, -42.37778854370117, -41.17054748535156, -39.96330642700195, -38.756065368652344, -37.548824310302734, -36.341583251953125, -35.13433837890625, -33.927101135253906, -32.7198600769043, -31.512619018554688, -30.305377960205078, -29.09813690185547, -27.89089584350586, -26.683652877807617, -25.476411819458008, -24.2691707611084, -23.06192970275879, -21.85468864440918, -20.64744758605957, -19.440204620361328, -18.23296356201172, -17.02572250366211, -15.8184814453125, -14.611236572265625, -13.403995513916016, -12.196754455566406, -10.98951244354248, -9.782271385192871, -8.575030326843262, -7.367788791656494, -6.160547256469727, -4.953306198120117, -3.7460649013519287, -2.5388236045837402, -1.3315823078155518, -0.12434101104736328, 1.082900047302246, 2.2901415824890137, 3.4973831176757812, 4.704624176025391, 5.911865234375, 7.119106769561768, 8.326348304748535, 9.533589363098145, 10.740830421447754, 11.94807243347168, 13.155313491821289, 14.362554550170898, 15.569795608520508, 16.777036666870117, 17.984277725219727, 19.19152069091797, 20.398761749267578, 21.606002807617188, 22.813243865966797, 24.020484924316406]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 4.0, 4.0, 7.0, 11.0, 18.0, 10.0, 10.0, 20.0, 15.0, 16.0, 29.0, 24.0, 24.0, 36.0, 30.0, 33.0, 33.0, 41.0, 57.0, 30.0, 44.0, 35.0, 39.0, 43.0, 35.0, 46.0, 28.0, 30.0, 27.0, 31.0, 22.0, 26.0, 27.0, 16.0, 16.0, 10.0, 19.0, 9.0, 13.0, 8.0, 12.0, 5.0, 4.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.207592010498047, -13.686460494995117, -13.165328979492188, -12.644197463989258, -12.123065948486328, -11.601934432983398, -11.080801963806152, -10.559670448303223, -10.038538932800293, -9.517407417297363, -8.996275901794434, -8.475144386291504, -7.954012393951416, -7.432880878448486, -6.911748886108398, -6.390617370605469, -5.869485855102539, -5.348354339599609, -4.82722282409668, -4.306090831756592, -3.784959316253662, -3.2638278007507324, -2.7426960468292236, -2.221564292907715, -1.7004327774047852, -1.179301142692566, -0.6581695079803467, -0.13703787326812744, 0.3840937614440918, 0.9052252769470215, 1.4263570308685303, 1.947488784790039, 2.4686222076416016, 2.9897537231445312, 3.51088547706604, 4.032017230987549, 4.5531487464904785, 5.074280261993408, 5.595412254333496, 6.116543769836426, 6.6376752853393555, 7.158806800842285, 7.679938316345215, 8.201069831848145, 8.72220230102539, 9.24333381652832, 9.76446533203125, 10.28559684753418, 10.80672836303711, 11.327859878540039, 11.848991394042969, 12.370122909545898, 12.891254425048828, 13.412385940551758, 13.933518409729004, 14.454649925231934, 14.975781440734863, 15.496912956237793, 16.01804542541504, 16.53917694091797, 17.0603084564209, 17.581439971923828, 18.102571487426758, 18.623703002929688, 19.144834518432617]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 9.0, 9.0, 20.0, 26.0, 28.0, 33.0, 76.0, 129.0, 193.0, 340.0, 631.0, 1359.0, 3017.0, 8307.0, 31498.0, 199935.0, 2060860.0, 1684229.0, 163654.0, 27160.0, 7187.0, 2788.0, 1305.0, 643.0, 336.0, 186.0, 113.0, 78.0, 37.0, 29.0, 17.0, 12.0, 6.0, 5.0, 3.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.578125, -9.2686767578125, -8.959228515625, -8.6497802734375, -8.34033203125, -8.0308837890625, -7.721435546875, -7.4119873046875, -7.1025390625, -6.7930908203125, -6.483642578125, -6.1741943359375, -5.86474609375, -5.5552978515625, -5.245849609375, -4.9364013671875, -4.626953125, -4.3175048828125, -4.008056640625, -3.6986083984375, -3.38916015625, -3.0797119140625, -2.770263671875, -2.4608154296875, -2.1513671875, -1.8419189453125, -1.532470703125, -1.2230224609375, -0.91357421875, -0.6041259765625, -0.294677734375, 0.0147705078125, 0.32421875, 0.6336669921875, 0.943115234375, 1.2525634765625, 1.56201171875, 1.8714599609375, 2.180908203125, 2.4903564453125, 2.7998046875, 3.1092529296875, 3.418701171875, 3.7281494140625, 4.03759765625, 4.3470458984375, 4.656494140625, 4.9659423828125, 5.275390625, 5.5848388671875, 5.894287109375, 6.2037353515625, 6.51318359375, 6.8226318359375, 7.132080078125, 7.4415283203125, 7.7509765625, 8.0604248046875, 8.369873046875, 8.6793212890625, 8.98876953125, 9.2982177734375, 9.607666015625, 9.9171142578125, 10.2265625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 12.0, 9.0, 10.0, 8.0, 10.0, 17.0, 18.0, 29.0, 25.0, 30.0, 38.0, 46.0, 38.0, 52.0, 60.0, 62.0, 61.0, 59.0, 51.0, 44.0, 48.0, 47.0, 24.0, 36.0, 27.0, 22.0, 27.0, 16.0, 16.0, 11.0, 7.0, 11.0, 4.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.484375, -5.2691650390625, -5.053955078125, -4.8387451171875, -4.62353515625, -4.4083251953125, -4.193115234375, -3.9779052734375, -3.7626953125, -3.5474853515625, -3.332275390625, -3.1170654296875, -2.90185546875, -2.6866455078125, -2.471435546875, -2.2562255859375, -2.041015625, -1.8258056640625, -1.610595703125, -1.3953857421875, -1.18017578125, -0.9649658203125, -0.749755859375, -0.5345458984375, -0.3193359375, -0.1041259765625, 0.111083984375, 0.3262939453125, 0.54150390625, 0.7567138671875, 0.971923828125, 1.1871337890625, 1.40234375, 1.6175537109375, 1.832763671875, 2.0479736328125, 2.26318359375, 2.4783935546875, 2.693603515625, 2.9088134765625, 3.1240234375, 3.3392333984375, 3.554443359375, 3.7696533203125, 3.98486328125, 4.2000732421875, 4.415283203125, 4.6304931640625, 4.845703125, 5.0609130859375, 5.276123046875, 5.4913330078125, 5.70654296875, 5.9217529296875, 6.136962890625, 6.3521728515625, 6.5673828125, 6.7825927734375, 6.997802734375, 7.2130126953125, 7.42822265625, 7.6434326171875, 7.858642578125, 8.0738525390625, 8.2890625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 4.0, 4.0, 15.0, 22.0, 24.0, 28.0, 44.0, 70.0, 92.0, 180.0, 241.0, 470.0, 914.0, 1916.0, 5051.0, 16338.0, 78077.0, 919752.0, 2926385.0, 198424.0, 31374.0, 8619.0, 3145.0, 1397.0, 702.0, 319.0, 212.0, 150.0, 78.0, 61.0, 42.0, 29.0, 18.0, 19.0, 10.0, 13.0, 6.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-9.375, -9.10107421875, -8.8271484375, -8.55322265625, -8.279296875, -8.00537109375, -7.7314453125, -7.45751953125, -7.18359375, -6.90966796875, -6.6357421875, -6.36181640625, -6.087890625, -5.81396484375, -5.5400390625, -5.26611328125, -4.9921875, -4.71826171875, -4.4443359375, -4.17041015625, -3.896484375, -3.62255859375, -3.3486328125, -3.07470703125, -2.80078125, -2.52685546875, -2.2529296875, -1.97900390625, -1.705078125, -1.43115234375, -1.1572265625, -0.88330078125, -0.609375, -0.33544921875, -0.0615234375, 0.21240234375, 0.486328125, 0.76025390625, 1.0341796875, 1.30810546875, 1.58203125, 1.85595703125, 2.1298828125, 2.40380859375, 2.677734375, 2.95166015625, 3.2255859375, 3.49951171875, 3.7734375, 4.04736328125, 4.3212890625, 4.59521484375, 4.869140625, 5.14306640625, 5.4169921875, 5.69091796875, 5.96484375, 6.23876953125, 6.5126953125, 6.78662109375, 7.060546875, 7.33447265625, 7.6083984375, 7.88232421875, 8.15625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 5.0, 5.0, 6.0, 12.0, 9.0, 13.0, 23.0, 23.0, 25.0, 36.0, 64.0, 89.0, 132.0, 176.0, 238.0, 437.0, 566.0, 604.0, 529.0, 344.0, 224.0, 145.0, 109.0, 73.0, 59.0, 39.0, 28.0, 20.0, 10.0, 9.0, 5.0, 8.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.900390625, -2.8226318359375, -2.744873046875, -2.6671142578125, -2.58935546875, -2.5115966796875, -2.433837890625, -2.3560791015625, -2.2783203125, -2.2005615234375, -2.122802734375, -2.0450439453125, -1.96728515625, -1.8895263671875, -1.811767578125, -1.7340087890625, -1.65625, -1.5784912109375, -1.500732421875, -1.4229736328125, -1.34521484375, -1.2674560546875, -1.189697265625, -1.1119384765625, -1.0341796875, -0.9564208984375, -0.878662109375, -0.8009033203125, -0.72314453125, -0.6453857421875, -0.567626953125, -0.4898681640625, -0.412109375, -0.3343505859375, -0.256591796875, -0.1788330078125, -0.10107421875, -0.0233154296875, 0.054443359375, 0.1322021484375, 0.2099609375, 0.2877197265625, 0.365478515625, 0.4432373046875, 0.52099609375, 0.5987548828125, 0.676513671875, 0.7542724609375, 0.83203125, 0.9097900390625, 0.987548828125, 1.0653076171875, 1.14306640625, 1.2208251953125, 1.298583984375, 1.3763427734375, 1.4541015625, 1.5318603515625, 1.609619140625, 1.6873779296875, 1.76513671875, 1.8428955078125, 1.920654296875, 1.9984130859375, 2.076171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 17.0, 9.0, 19.0, 36.0, 48.0, 55.0, 75.0, 112.0, 102.0, 108.0, 113.0, 85.0, 76.0, 46.0, 28.0, 20.0, 13.0, 18.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.52951717376709, -13.1135892868042, -12.697661399841309, -12.281733512878418, -11.865804672241211, -11.44987678527832, -11.03394889831543, -10.618021011352539, -10.202093124389648, -9.786165237426758, -9.370237350463867, -8.954309463500977, -8.538381576538086, -8.122453689575195, -7.706524848937988, -7.290596961975098, -6.874669075012207, -6.458741188049316, -6.042813301086426, -5.626884937286377, -5.210957050323486, -4.795029163360596, -4.379100799560547, -3.9631729125976562, -3.5472450256347656, -3.131317138671875, -2.7153890132904053, -2.2994608879089355, -1.883533000946045, -1.4676051139831543, -1.0516769886016846, -0.6357488632202148, -0.21982192993164062, 0.19610607624053955, 0.6120340824127197, 1.0279620885849, 1.44389009475708, 1.8598179817199707, 2.2757461071014404, 2.69167423248291, 3.107602119445801, 3.5235300064086914, 3.939458131790161, 4.355386257171631, 4.7713141441345215, 5.187242031097412, 5.603170394897461, 6.019098281860352, 6.435026168823242, 6.850954055786133, 7.266881942749023, 7.682810306549072, 8.098737716674805, 8.514665603637695, 8.930594444274902, 9.346522331237793, 9.762450218200684, 10.178378105163574, 10.594305992126465, 11.010233879089355, 11.426162719726562, 11.842090606689453, 12.258018493652344, 12.673946380615234, 13.089874267578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 7.0, 2.0, 10.0, 15.0, 11.0, 20.0, 16.0, 26.0, 19.0, 29.0, 27.0, 41.0, 42.0, 45.0, 50.0, 55.0, 57.0, 50.0, 53.0, 54.0, 50.0, 46.0, 47.0, 37.0, 43.0, 27.0, 17.0, 14.0, 18.0, 16.0, 11.0, 15.0, 5.0, 3.0, 7.0, 3.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8878397941589355, -6.652812957763672, -6.417786121368408, -6.1827592849731445, -5.947731971740723, -5.712705612182617, -5.477678298950195, -5.242651462554932, -5.007624626159668, -4.772597789764404, -4.537570953369141, -4.302544116973877, -4.067517280578613, -3.8324902057647705, -3.5974631309509277, -3.362436294555664, -3.1274094581604004, -2.8923826217651367, -2.657355785369873, -2.4223287105560303, -2.1873018741607666, -1.952275037765503, -1.7172480821609497, -1.4822211265563965, -1.2471942901611328, -1.0121674537658691, -0.7771404981613159, -0.5421136021614075, -0.307086706161499, -0.07205986976623535, 0.16296708583831787, 0.3979940414428711, 0.6330204010009766, 0.868047297000885, 1.1030741930007935, 1.3381011486053467, 1.5731279850006104, 1.808154821395874, 2.043181896209717, 2.2782087326049805, 2.513235569000244, 2.748262405395508, 2.9832892417907715, 3.2183163166046143, 3.453343152999878, 3.6883699893951416, 3.9233970642089844, 4.158423900604248, 4.393450736999512, 4.628477573394775, 4.863504409790039, 5.098531246185303, 5.333558082580566, 5.568585395812988, 5.803612232208252, 6.038639068603516, 6.273665904998779, 6.508692741394043, 6.743719577789307, 6.97874641418457, 7.213773727416992, 7.448800086975098, 7.6838274002075195, 7.918854236602783, 8.153881072998047]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 17.0, 26.0, 19.0, 26.0, 57.0, 76.0, 115.0, 174.0, 312.0, 535.0, 892.0, 1720.0, 3224.0, 6511.0, 14515.0, 36463.0, 103901.0, 294853.0, 357841.0, 143188.0, 48540.0, 18619.0, 8171.0, 3904.0, 2078.0, 1115.0, 639.0, 363.0, 210.0, 141.0, 88.0, 56.0, 44.0, 27.0, 22.0, 13.0, 12.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-1.244140625, -1.20770263671875, -1.1712646484375, -1.13482666015625, -1.098388671875, -1.06195068359375, -1.0255126953125, -0.98907470703125, -0.95263671875, -0.91619873046875, -0.8797607421875, -0.84332275390625, -0.806884765625, -0.77044677734375, -0.7340087890625, -0.69757080078125, -0.6611328125, -0.62469482421875, -0.5882568359375, -0.55181884765625, -0.515380859375, -0.47894287109375, -0.4425048828125, -0.40606689453125, -0.36962890625, -0.33319091796875, -0.2967529296875, -0.26031494140625, -0.223876953125, -0.18743896484375, -0.1510009765625, -0.11456298828125, -0.078125, -0.04168701171875, -0.0052490234375, 0.03118896484375, 0.067626953125, 0.10406494140625, 0.1405029296875, 0.17694091796875, 0.21337890625, 0.24981689453125, 0.2862548828125, 0.32269287109375, 0.359130859375, 0.39556884765625, 0.4320068359375, 0.46844482421875, 0.5048828125, 0.54132080078125, 0.5777587890625, 0.61419677734375, 0.650634765625, 0.68707275390625, 0.7235107421875, 0.75994873046875, 0.79638671875, 0.83282470703125, 0.8692626953125, 0.90570068359375, 0.942138671875, 0.97857666015625, 1.0150146484375, 1.05145263671875, 1.087890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 6.0, 8.0, 9.0, 9.0, 5.0, 12.0, 18.0, 22.0, 18.0, 20.0, 26.0, 41.0, 41.0, 56.0, 42.0, 56.0, 51.0, 67.0, 58.0, 64.0, 54.0, 59.0, 39.0, 34.0, 31.0, 29.0, 19.0, 19.0, 13.0, 10.0, 11.0, 8.0, 16.0, 7.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.921875, -4.76605224609375, -4.6102294921875, -4.45440673828125, -4.298583984375, -4.14276123046875, -3.9869384765625, -3.83111572265625, -3.67529296875, -3.51947021484375, -3.3636474609375, -3.20782470703125, -3.052001953125, -2.89617919921875, -2.7403564453125, -2.58453369140625, -2.4287109375, -2.27288818359375, -2.1170654296875, -1.96124267578125, -1.805419921875, -1.64959716796875, -1.4937744140625, -1.33795166015625, -1.18212890625, -1.02630615234375, -0.8704833984375, -0.71466064453125, -0.558837890625, -0.40301513671875, -0.2471923828125, -0.09136962890625, 0.064453125, 0.22027587890625, 0.3760986328125, 0.53192138671875, 0.687744140625, 0.84356689453125, 0.9993896484375, 1.15521240234375, 1.31103515625, 1.46685791015625, 1.6226806640625, 1.77850341796875, 1.934326171875, 2.09014892578125, 2.2459716796875, 2.40179443359375, 2.5576171875, 2.71343994140625, 2.8692626953125, 3.02508544921875, 3.180908203125, 3.33673095703125, 3.4925537109375, 3.64837646484375, 3.80419921875, 3.96002197265625, 4.1158447265625, 4.27166748046875, 4.427490234375, 4.58331298828125, 4.7391357421875, 4.89495849609375, 5.05078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 7.0, 7.0, 7.0, 10.0, 18.0, 27.0, 30.0, 56.0, 94.0, 177.0, 348.0, 659.0, 1537.0, 4862.0, 19857.0, 128071.0, 603895.0, 244043.0, 33726.0, 7249.0, 2190.0, 832.0, 354.0, 194.0, 101.0, 60.0, 42.0, 37.0, 22.0, 16.0, 9.0, 2.0, 6.0, 2.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.322265625, -2.2606048583984375, -2.198944091796875, -2.1372833251953125, -2.07562255859375, -2.0139617919921875, -1.952301025390625, -1.8906402587890625, -1.8289794921875, -1.7673187255859375, -1.705657958984375, -1.6439971923828125, -1.58233642578125, -1.5206756591796875, -1.459014892578125, -1.3973541259765625, -1.335693359375, -1.2740325927734375, -1.212371826171875, -1.1507110595703125, -1.08905029296875, -1.0273895263671875, -0.965728759765625, -0.9040679931640625, -0.8424072265625, -0.7807464599609375, -0.719085693359375, -0.6574249267578125, -0.59576416015625, -0.5341033935546875, -0.472442626953125, -0.4107818603515625, -0.34912109375, -0.2874603271484375, -0.225799560546875, -0.1641387939453125, -0.10247802734375, -0.0408172607421875, 0.020843505859375, 0.0825042724609375, 0.1441650390625, 0.2058258056640625, 0.267486572265625, 0.3291473388671875, 0.39080810546875, 0.4524688720703125, 0.514129638671875, 0.5757904052734375, 0.637451171875, 0.6991119384765625, 0.760772705078125, 0.8224334716796875, 0.88409423828125, 0.9457550048828125, 1.007415771484375, 1.0690765380859375, 1.1307373046875, 1.1923980712890625, 1.254058837890625, 1.3157196044921875, 1.37738037109375, 1.4390411376953125, 1.500701904296875, 1.5623626708984375, 1.6240234375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 10.0, 14.0, 15.0, 7.0, 20.0, 12.0, 18.0, 16.0, 23.0, 38.0, 39.0, 35.0, 44.0, 51.0, 57.0, 57.0, 46.0, 47.0, 52.0, 45.0, 35.0, 37.0, 31.0, 47.0, 36.0, 27.0, 17.0, 23.0, 18.0, 21.0, 14.0, 10.0, 7.0, 2.0, 5.0, 6.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.453125, -9.175537109375, -8.89794921875, -8.620361328125, -8.3427734375, -8.065185546875, -7.78759765625, -7.510009765625, -7.232421875, -6.954833984375, -6.67724609375, -6.399658203125, -6.1220703125, -5.844482421875, -5.56689453125, -5.289306640625, -5.01171875, -4.734130859375, -4.45654296875, -4.178955078125, -3.9013671875, -3.623779296875, -3.34619140625, -3.068603515625, -2.791015625, -2.513427734375, -2.23583984375, -1.958251953125, -1.6806640625, -1.403076171875, -1.12548828125, -0.847900390625, -0.5703125, -0.292724609375, -0.01513671875, 0.262451171875, 0.5400390625, 0.817626953125, 1.09521484375, 1.372802734375, 1.650390625, 1.927978515625, 2.20556640625, 2.483154296875, 2.7607421875, 3.038330078125, 3.31591796875, 3.593505859375, 3.87109375, 4.148681640625, 4.42626953125, 4.703857421875, 4.9814453125, 5.259033203125, 5.53662109375, 5.814208984375, 6.091796875, 6.369384765625, 6.64697265625, 6.924560546875, 7.2021484375, 7.479736328125, 7.75732421875, 8.034912109375, 8.3125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 5.0, 5.0, 8.0, 13.0, 25.0, 35.0, 77.0, 108.0, 194.0, 333.0, 737.0, 1603.0, 4246.0, 13858.0, 58645.0, 333616.0, 503457.0, 99839.0, 21413.0, 6204.0, 2200.0, 970.0, 421.0, 204.0, 136.0, 80.0, 41.0, 27.0, 16.0, 11.0, 10.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6953125, -0.674957275390625, -0.65460205078125, -0.634246826171875, -0.6138916015625, -0.593536376953125, -0.57318115234375, -0.552825927734375, -0.532470703125, -0.512115478515625, -0.49176025390625, -0.471405029296875, -0.4510498046875, -0.430694580078125, -0.41033935546875, -0.389984130859375, -0.36962890625, -0.349273681640625, -0.32891845703125, -0.308563232421875, -0.2882080078125, -0.267852783203125, -0.24749755859375, -0.227142333984375, -0.206787109375, -0.186431884765625, -0.16607666015625, -0.145721435546875, -0.1253662109375, -0.105010986328125, -0.08465576171875, -0.064300537109375, -0.0439453125, -0.023590087890625, -0.00323486328125, 0.017120361328125, 0.0374755859375, 0.057830810546875, 0.07818603515625, 0.098541259765625, 0.118896484375, 0.139251708984375, 0.15960693359375, 0.179962158203125, 0.2003173828125, 0.220672607421875, 0.24102783203125, 0.261383056640625, 0.28173828125, 0.302093505859375, 0.32244873046875, 0.342803955078125, 0.3631591796875, 0.383514404296875, 0.40386962890625, 0.424224853515625, 0.444580078125, 0.464935302734375, 0.48529052734375, 0.505645751953125, 0.5260009765625, 0.546356201171875, 0.56671142578125, 0.587066650390625, 0.607421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 4.0, 15.0, 18.0, 22.0, 22.0, 45.0, 59.0, 57.0, 76.0, 103.0, 98.0, 92.0, 81.0, 57.0, 55.0, 54.0, 28.0, 34.0, 17.0, 18.0, 10.0, 8.0, 6.0, 1.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002295970916748047, -0.0002213306725025177, -0.0002130642533302307, -0.00020479783415794373, -0.00019653141498565674, -0.00018826499581336975, -0.00017999857664108276, -0.00017173215746879578, -0.0001634657382965088, -0.0001551993191242218, -0.00014693289995193481, -0.00013866648077964783, -0.00013040006160736084, -0.00012213364243507385, -0.00011386722326278687, -0.00010560080409049988, -9.733438491821289e-05, -8.90679657459259e-05, -8.080154657363892e-05, -7.253512740135193e-05, -6.426870822906494e-05, -5.6002289056777954e-05, -4.773586988449097e-05, -3.946945071220398e-05, -3.120303153991699e-05, -2.2936612367630005e-05, -1.4670193195343018e-05, -6.40377402305603e-06, 1.862645149230957e-06, 1.0129064321517944e-05, 1.839548349380493e-05, 2.666190266609192e-05, 3.4928321838378906e-05, 4.3194741010665894e-05, 5.146116018295288e-05, 5.972757935523987e-05, 6.799399852752686e-05, 7.626041769981384e-05, 8.452683687210083e-05, 9.279325604438782e-05, 0.0001010596752166748, 0.00010932609438896179, 0.00011759251356124878, 0.00012585893273353577, 0.00013412535190582275, 0.00014239177107810974, 0.00015065819025039673, 0.00015892460942268372, 0.0001671910285949707, 0.0001754574477672577, 0.00018372386693954468, 0.00019199028611183167, 0.00020025670528411865, 0.00020852312445640564, 0.00021678954362869263, 0.00022505596280097961, 0.0002333223819732666, 0.0002415888011455536, 0.0002498552203178406, 0.00025812163949012756, 0.00026638805866241455, 0.00027465447783470154, 0.0002829208970069885, 0.0002911873161792755, 0.0002994537353515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 9.0, 9.0, 10.0, 16.0, 31.0, 36.0, 84.0, 114.0, 184.0, 343.0, 768.0, 1636.0, 4397.0, 14723.0, 61535.0, 322886.0, 494262.0, 112421.0, 23865.0, 6720.0, 2390.0, 1019.0, 468.0, 233.0, 156.0, 76.0, 53.0, 33.0, 26.0, 18.0, 9.0, 7.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.74951171875, -0.7287979125976562, -0.7080841064453125, -0.6873703002929688, -0.666656494140625, -0.6459426879882812, -0.6252288818359375, -0.6045150756835938, -0.58380126953125, -0.5630874633789062, -0.5423736572265625, -0.5216598510742188, -0.500946044921875, -0.48023223876953125, -0.4595184326171875, -0.43880462646484375, -0.4180908203125, -0.39737701416015625, -0.3766632080078125, -0.35594940185546875, -0.335235595703125, -0.31452178955078125, -0.2938079833984375, -0.27309417724609375, -0.25238037109375, -0.23166656494140625, -0.2109527587890625, -0.19023895263671875, -0.169525146484375, -0.14881134033203125, -0.1280975341796875, -0.10738372802734375, -0.086669921875, -0.06595611572265625, -0.0452423095703125, -0.02452850341796875, -0.003814697265625, 0.01689910888671875, 0.0376129150390625, 0.05832672119140625, 0.07904052734375, 0.09975433349609375, 0.1204681396484375, 0.14118194580078125, 0.161895751953125, 0.18260955810546875, 0.2033233642578125, 0.22403717041015625, 0.2447509765625, 0.26546478271484375, 0.2861785888671875, 0.30689239501953125, 0.327606201171875, 0.34832000732421875, 0.3690338134765625, 0.38974761962890625, 0.41046142578125, 0.43117523193359375, 0.4518890380859375, 0.47260284423828125, 0.493316650390625, 0.5140304565429688, 0.5347442626953125, 0.5554580688476562, 0.576171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 8.0, 7.0, 7.0, 10.0, 11.0, 19.0, 25.0, 20.0, 33.0, 35.0, 55.0, 63.0, 74.0, 78.0, 82.0, 84.0, 77.0, 56.0, 62.0, 41.0, 40.0, 19.0, 18.0, 21.0, 8.0, 9.0, 6.0, 7.0, 11.0, 6.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1317138671875, -0.127288818359375, -0.12286376953125, -0.118438720703125, -0.114013671875, -0.109588623046875, -0.10516357421875, -0.100738525390625, -0.0963134765625, -0.091888427734375, -0.08746337890625, -0.083038330078125, -0.07861328125, -0.074188232421875, -0.06976318359375, -0.065338134765625, -0.0609130859375, -0.056488037109375, -0.05206298828125, -0.047637939453125, -0.043212890625, -0.038787841796875, -0.03436279296875, -0.029937744140625, -0.0255126953125, -0.021087646484375, -0.01666259765625, -0.012237548828125, -0.0078125, -0.003387451171875, 0.00103759765625, 0.005462646484375, 0.0098876953125, 0.014312744140625, 0.01873779296875, 0.023162841796875, 0.027587890625, 0.032012939453125, 0.03643798828125, 0.040863037109375, 0.0452880859375, 0.049713134765625, 0.05413818359375, 0.058563232421875, 0.06298828125, 0.067413330078125, 0.07183837890625, 0.076263427734375, 0.0806884765625, 0.085113525390625, 0.08953857421875, 0.093963623046875, 0.098388671875, 0.102813720703125, 0.10723876953125, 0.111663818359375, 0.1160888671875, 0.120513916015625, 0.12493896484375, 0.129364013671875, 0.1337890625, 0.138214111328125, 0.14263916015625, 0.147064208984375, 0.1514892578125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 16.0, 18.0, 29.0, 61.0, 98.0, 143.0, 156.0, 174.0, 118.0, 65.0, 55.0, 27.0, 14.0, 9.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-12.437932014465332, -12.081622123718262, -11.725312232971191, -11.369002342224121, -11.01269245147705, -10.65638256072998, -10.30007266998291, -9.94376277923584, -9.58745288848877, -9.2311429977417, -8.874833106994629, -8.518523216247559, -8.162213325500488, -7.805903434753418, -7.449593544006348, -7.093283653259277, -6.736973762512207, -6.380663871765137, -6.024353981018066, -5.668044090270996, -5.311734199523926, -4.9554243087768555, -4.599114418029785, -4.242804527282715, -3.8864946365356445, -3.530184745788574, -3.173874855041504, -2.8175649642944336, -2.4612550735473633, -2.104945182800293, -1.7486352920532227, -1.3923254013061523, -1.036015510559082, -0.6797056198120117, -0.3233957290649414, 0.032914161682128906, 0.3892240524291992, 0.7455339431762695, 1.1018438339233398, 1.4581537246704102, 1.8144636154174805, 2.170773506164551, 2.527083396911621, 2.8833932876586914, 3.2397031784057617, 3.596013069152832, 3.9523229598999023, 4.308632850646973, 4.664942741394043, 5.021252632141113, 5.377562522888184, 5.733872413635254, 6.090182304382324, 6.4464921951293945, 6.802802085876465, 7.159111976623535, 7.5154218673706055, 7.871731758117676, 8.228041648864746, 8.584351539611816, 8.940661430358887, 9.296971321105957, 9.653281211853027, 10.009591102600098, 10.365900993347168]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 2.0, 7.0, 1.0, 8.0, 12.0, 12.0, 13.0, 17.0, 22.0, 27.0, 34.0, 32.0, 42.0, 44.0, 59.0, 56.0, 72.0, 69.0, 54.0, 61.0, 66.0, 52.0, 53.0, 42.0, 29.0, 16.0, 16.0, 18.0, 15.0, 14.0, 9.0, 6.0, 6.0, 7.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20181131362915, -4.036828517913818, -3.8718457221984863, -3.706862688064575, -3.541879892349243, -3.376897096633911, -3.2119140625, -3.046931266784668, -2.881948471069336, -2.716965675354004, -2.551982879638672, -2.3869998455047607, -2.2220170497894287, -2.0570342540740967, -1.892051339149475, -1.7270684242248535, -1.5620856285095215, -1.3971028327941895, -1.2321199178695679, -1.0671370029449463, -0.9021542072296143, -0.7371713519096375, -0.5721884965896606, -0.40720558166503906, -0.24222278594970703, -0.07723993062973022, 0.08774292469024658, 0.2527257800102234, 0.4177086353302002, 0.582691490650177, 0.7476743459701538, 0.9126572608947754, 1.0776405334472656, 1.2426233291625977, 1.4076062440872192, 1.5725891590118408, 1.7375719547271729, 1.9025547504425049, 2.067537784576416, 2.232520580291748, 2.39750337600708, 2.562486171722412, 2.727468967437744, 2.8924520015716553, 3.0574347972869873, 3.2224175930023193, 3.3874006271362305, 3.5523834228515625, 3.7173662185668945, 3.8823490142822266, 4.047331809997559, 4.212314605712891, 4.377297401428223, 4.542280673980713, 4.707263469696045, 4.872246265411377, 5.037229061126709, 5.202211856842041, 5.367194652557373, 5.532177448272705, 5.697160720825195, 5.862143516540527, 6.027126312255859, 6.192109107971191, 6.357091903686523]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 5.0, 8.0, 10.0, 21.0, 37.0, 38.0, 75.0, 134.0, 200.0, 285.0, 458.0, 787.0, 1357.0, 2393.0, 4466.0, 8963.0, 19218.0, 45977.0, 142841.0, 420765.0, 266688.0, 78101.0, 29151.0, 12792.0, 6094.0, 3261.0, 1776.0, 1003.0, 588.0, 370.0, 200.0, 159.0, 110.0, 54.0, 48.0, 39.0, 27.0, 18.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-3.9140625, -3.790771484375, -3.66748046875, -3.544189453125, -3.4208984375, -3.297607421875, -3.17431640625, -3.051025390625, -2.927734375, -2.804443359375, -2.68115234375, -2.557861328125, -2.4345703125, -2.311279296875, -2.18798828125, -2.064697265625, -1.94140625, -1.818115234375, -1.69482421875, -1.571533203125, -1.4482421875, -1.324951171875, -1.20166015625, -1.078369140625, -0.955078125, -0.831787109375, -0.70849609375, -0.585205078125, -0.4619140625, -0.338623046875, -0.21533203125, -0.092041015625, 0.03125, 0.154541015625, 0.27783203125, 0.401123046875, 0.5244140625, 0.647705078125, 0.77099609375, 0.894287109375, 1.017578125, 1.140869140625, 1.26416015625, 1.387451171875, 1.5107421875, 1.634033203125, 1.75732421875, 1.880615234375, 2.00390625, 2.127197265625, 2.25048828125, 2.373779296875, 2.4970703125, 2.620361328125, 2.74365234375, 2.866943359375, 2.990234375, 3.113525390625, 3.23681640625, 3.360107421875, 3.4833984375, 3.606689453125, 3.72998046875, 3.853271484375, 3.9765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 8.0, 6.0, 9.0, 16.0, 5.0, 13.0, 21.0, 22.0, 27.0, 29.0, 33.0, 38.0, 37.0, 41.0, 52.0, 65.0, 58.0, 44.0, 47.0, 64.0, 57.0, 48.0, 42.0, 37.0, 36.0, 26.0, 20.0, 15.0, 14.0, 14.0, 7.0, 6.0, 10.0, 3.0, 8.0, 10.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.5390625, -9.21240234375, -8.8857421875, -8.55908203125, -8.232421875, -7.90576171875, -7.5791015625, -7.25244140625, -6.92578125, -6.59912109375, -6.2724609375, -5.94580078125, -5.619140625, -5.29248046875, -4.9658203125, -4.63916015625, -4.3125, -3.98583984375, -3.6591796875, -3.33251953125, -3.005859375, -2.67919921875, -2.3525390625, -2.02587890625, -1.69921875, -1.37255859375, -1.0458984375, -0.71923828125, -0.392578125, -0.06591796875, 0.2607421875, 0.58740234375, 0.9140625, 1.24072265625, 1.5673828125, 1.89404296875, 2.220703125, 2.54736328125, 2.8740234375, 3.20068359375, 3.52734375, 3.85400390625, 4.1806640625, 4.50732421875, 4.833984375, 5.16064453125, 5.4873046875, 5.81396484375, 6.140625, 6.46728515625, 6.7939453125, 7.12060546875, 7.447265625, 7.77392578125, 8.1005859375, 8.42724609375, 8.75390625, 9.08056640625, 9.4072265625, 9.73388671875, 10.060546875, 10.38720703125, 10.7138671875, 11.04052734375, 11.3671875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 12.0, 1.0, 14.0, 11.0, 20.0, 38.0, 25.0, 51.0, 72.0, 81.0, 106.0, 163.0, 296.0, 544.0, 1190.0, 3418.0, 12058.0, 58955.0, 456625.0, 440421.0, 56803.0, 11572.0, 3422.0, 1241.0, 564.0, 282.0, 145.0, 120.0, 74.0, 58.0, 43.0, 38.0, 26.0, 21.0, 9.0, 8.0, 9.0, 3.0, 6.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0234375, -4.85015869140625, -4.6768798828125, -4.50360107421875, -4.330322265625, -4.15704345703125, -3.9837646484375, -3.81048583984375, -3.63720703125, -3.46392822265625, -3.2906494140625, -3.11737060546875, -2.944091796875, -2.77081298828125, -2.5975341796875, -2.42425537109375, -2.2509765625, -2.07769775390625, -1.9044189453125, -1.73114013671875, -1.557861328125, -1.38458251953125, -1.2113037109375, -1.03802490234375, -0.86474609375, -0.69146728515625, -0.5181884765625, -0.34490966796875, -0.171630859375, 0.00164794921875, 0.1749267578125, 0.34820556640625, 0.521484375, 0.69476318359375, 0.8680419921875, 1.04132080078125, 1.214599609375, 1.38787841796875, 1.5611572265625, 1.73443603515625, 1.90771484375, 2.08099365234375, 2.2542724609375, 2.42755126953125, 2.600830078125, 2.77410888671875, 2.9473876953125, 3.12066650390625, 3.2939453125, 3.46722412109375, 3.6405029296875, 3.81378173828125, 3.987060546875, 4.16033935546875, 4.3336181640625, 4.50689697265625, 4.68017578125, 4.85345458984375, 5.0267333984375, 5.20001220703125, 5.373291015625, 5.54656982421875, 5.7198486328125, 5.89312744140625, 6.06640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 15.0, 8.0, 6.0, 14.0, 19.0, 17.0, 17.0, 27.0, 28.0, 41.0, 24.0, 44.0, 31.0, 49.0, 50.0, 54.0, 45.0, 55.0, 44.0, 47.0, 40.0, 45.0, 35.0, 27.0, 39.0, 26.0, 27.0, 21.0, 16.0, 12.0, 13.0, 13.0, 13.0, 6.0, 10.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9921875, -9.6573486328125, -9.322509765625, -8.9876708984375, -8.65283203125, -8.3179931640625, -7.983154296875, -7.6483154296875, -7.3134765625, -6.9786376953125, -6.643798828125, -6.3089599609375, -5.97412109375, -5.6392822265625, -5.304443359375, -4.9696044921875, -4.634765625, -4.2999267578125, -3.965087890625, -3.6302490234375, -3.29541015625, -2.9605712890625, -2.625732421875, -2.2908935546875, -1.9560546875, -1.6212158203125, -1.286376953125, -0.9515380859375, -0.61669921875, -0.2818603515625, 0.052978515625, 0.3878173828125, 0.72265625, 1.0574951171875, 1.392333984375, 1.7271728515625, 2.06201171875, 2.3968505859375, 2.731689453125, 3.0665283203125, 3.4013671875, 3.7362060546875, 4.071044921875, 4.4058837890625, 4.74072265625, 5.0755615234375, 5.410400390625, 5.7452392578125, 6.080078125, 6.4149169921875, 6.749755859375, 7.0845947265625, 7.41943359375, 7.7542724609375, 8.089111328125, 8.4239501953125, 8.7587890625, 9.0936279296875, 9.428466796875, 9.7633056640625, 10.09814453125, 10.4329833984375, 10.767822265625, 11.1026611328125, 11.4375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 8.0, 8.0, 8.0, 7.0, 11.0, 16.0, 31.0, 45.0, 77.0, 140.0, 292.0, 620.0, 1633.0, 5445.0, 24989.0, 222331.0, 682604.0, 91390.0, 13371.0, 3387.0, 1180.0, 462.0, 210.0, 121.0, 54.0, 35.0, 25.0, 15.0, 12.0, 13.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.140625, -2.072265625, -2.00390625, -1.935546875, -1.8671875, -1.798828125, -1.73046875, -1.662109375, -1.59375, -1.525390625, -1.45703125, -1.388671875, -1.3203125, -1.251953125, -1.18359375, -1.115234375, -1.046875, -0.978515625, -0.91015625, -0.841796875, -0.7734375, -0.705078125, -0.63671875, -0.568359375, -0.5, -0.431640625, -0.36328125, -0.294921875, -0.2265625, -0.158203125, -0.08984375, -0.021484375, 0.046875, 0.115234375, 0.18359375, 0.251953125, 0.3203125, 0.388671875, 0.45703125, 0.525390625, 0.59375, 0.662109375, 0.73046875, 0.798828125, 0.8671875, 0.935546875, 1.00390625, 1.072265625, 1.140625, 1.208984375, 1.27734375, 1.345703125, 1.4140625, 1.482421875, 1.55078125, 1.619140625, 1.6875, 1.755859375, 1.82421875, 1.892578125, 1.9609375, 2.029296875, 2.09765625, 2.166015625, 2.234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 8.0, 12.0, 10.0, 19.0, 31.0, 41.0, 36.0, 77.0, 62.0, 71.0, 93.0, 98.0, 90.0, 69.0, 61.0, 50.0, 41.0, 28.0, 16.0, 13.0, 14.0, 10.0, 8.0, 6.0, 5.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002911090850830078, -0.0002830158919095993, -0.0002749226987361908, -0.0002668295055627823, -0.0002587363123893738, -0.00025064311921596527, -0.00024254992604255676, -0.00023445673286914825, -0.00022636353969573975, -0.00021827034652233124, -0.00021017715334892273, -0.00020208396017551422, -0.0001939907670021057, -0.0001858975738286972, -0.0001778043806552887, -0.0001697111874818802, -0.00016161799430847168, -0.00015352480113506317, -0.00014543160796165466, -0.00013733841478824615, -0.00012924522161483765, -0.00012115202844142914, -0.00011305883526802063, -0.00010496564209461212, -9.687244892120361e-05, -8.87792557477951e-05, -8.06860625743866e-05, -7.259286940097809e-05, -6.449967622756958e-05, -5.640648305416107e-05, -4.8313289880752563e-05, -4.0220096707344055e-05, -3.212690353393555e-05, -2.403371036052704e-05, -1.594051718711853e-05, -7.847324013710022e-06, 2.4586915969848633e-07, 8.339062333106995e-06, 1.6432255506515503e-05, 2.452544867992401e-05, 3.261864185333252e-05, 4.071183502674103e-05, 4.8805028200149536e-05, 5.6898221373558044e-05, 6.499141454696655e-05, 7.308460772037506e-05, 8.117780089378357e-05, 8.927099406719208e-05, 9.736418724060059e-05, 0.0001054573804140091, 0.0001135505735874176, 0.00012164376676082611, 0.00012973695993423462, 0.00013783015310764313, 0.00014592334628105164, 0.00015401653945446014, 0.00016210973262786865, 0.00017020292580127716, 0.00017829611897468567, 0.00018638931214809418, 0.00019448250532150269, 0.0002025756984949112, 0.0002106688916683197, 0.0002187620848417282, 0.00022685527801513672]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 3.0, 4.0, 5.0, 8.0, 18.0, 24.0, 31.0, 46.0, 77.0, 149.0, 246.0, 418.0, 817.0, 1701.0, 4220.0, 13310.0, 61019.0, 420188.0, 457192.0, 66538.0, 14410.0, 4405.0, 1800.0, 851.0, 446.0, 234.0, 132.0, 70.0, 54.0, 45.0, 19.0, 21.0, 18.0, 5.0, 8.0, 6.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.9208984375, -1.86444091796875, -1.8079833984375, -1.75152587890625, -1.695068359375, -1.63861083984375, -1.5821533203125, -1.52569580078125, -1.46923828125, -1.41278076171875, -1.3563232421875, -1.29986572265625, -1.243408203125, -1.18695068359375, -1.1304931640625, -1.07403564453125, -1.017578125, -0.96112060546875, -0.9046630859375, -0.84820556640625, -0.791748046875, -0.73529052734375, -0.6788330078125, -0.62237548828125, -0.56591796875, -0.50946044921875, -0.4530029296875, -0.39654541015625, -0.340087890625, -0.28363037109375, -0.2271728515625, -0.17071533203125, -0.1142578125, -0.05780029296875, -0.0013427734375, 0.05511474609375, 0.111572265625, 0.16802978515625, 0.2244873046875, 0.28094482421875, 0.33740234375, 0.39385986328125, 0.4503173828125, 0.50677490234375, 0.563232421875, 0.61968994140625, 0.6761474609375, 0.73260498046875, 0.7890625, 0.84552001953125, 0.9019775390625, 0.95843505859375, 1.014892578125, 1.07135009765625, 1.1278076171875, 1.18426513671875, 1.24072265625, 1.29718017578125, 1.3536376953125, 1.41009521484375, 1.466552734375, 1.52301025390625, 1.5794677734375, 1.63592529296875, 1.6923828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 6.0, 10.0, 8.0, 11.0, 18.0, 20.0, 28.0, 29.0, 46.0, 50.0, 58.0, 83.0, 91.0, 123.0, 84.0, 70.0, 65.0, 52.0, 37.0, 23.0, 14.0, 15.0, 12.0, 8.0, 6.0, 8.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.0283203125, -1.0015106201171875, -0.974700927734375, -0.9478912353515625, -0.92108154296875, -0.8942718505859375, -0.867462158203125, -0.8406524658203125, -0.8138427734375, -0.7870330810546875, -0.760223388671875, -0.7334136962890625, -0.70660400390625, -0.6797943115234375, -0.652984619140625, -0.6261749267578125, -0.599365234375, -0.5725555419921875, -0.545745849609375, -0.5189361572265625, -0.49212646484375, -0.4653167724609375, -0.438507080078125, -0.4116973876953125, -0.3848876953125, -0.3580780029296875, -0.331268310546875, -0.3044586181640625, -0.27764892578125, -0.2508392333984375, -0.224029541015625, -0.1972198486328125, -0.17041015625, -0.1436004638671875, -0.116790771484375, -0.0899810791015625, -0.06317138671875, -0.0363616943359375, -0.009552001953125, 0.0172576904296875, 0.0440673828125, 0.0708770751953125, 0.097686767578125, 0.1244964599609375, 0.15130615234375, 0.1781158447265625, 0.204925537109375, 0.2317352294921875, 0.258544921875, 0.2853546142578125, 0.312164306640625, 0.3389739990234375, 0.36578369140625, 0.3925933837890625, 0.419403076171875, 0.4462127685546875, 0.4730224609375, 0.4998321533203125, 0.526641845703125, 0.5534515380859375, 0.58026123046875, 0.6070709228515625, 0.633880615234375, 0.6606903076171875, 0.6875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 16.0, 24.0, 72.0, 118.0, 215.0, 240.0, 164.0, 79.0, 30.0, 20.0, 8.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-51.33169174194336, -50.31011962890625, -49.288543701171875, -48.2669677734375, -47.24539566040039, -46.22382354736328, -45.202247619628906, -44.18067169189453, -43.15909957885742, -42.13752746582031, -41.11595153808594, -40.09437561035156, -39.07280349731445, -38.051231384277344, -37.02965545654297, -36.008079528808594, -34.986507415771484, -33.964935302734375, -32.943359375, -31.921785354614258, -30.900211334228516, -29.878637313842773, -28.85706329345703, -27.83548927307129, -26.813915252685547, -25.792341232299805, -24.770767211914062, -23.74919319152832, -22.727619171142578, -21.706045150756836, -20.684471130371094, -19.66289710998535, -18.64132308959961, -17.619749069213867, -16.598175048828125, -15.576601028442383, -14.55502700805664, -13.533452987670898, -12.511878967285156, -11.490304946899414, -10.468729972839355, -9.447155952453613, -8.425581932067871, -7.404007911682129, -6.382433891296387, -5.3608598709106445, -4.339285850524902, -3.31771183013916, -2.296137809753418, -1.2745637893676758, -0.2529897689819336, 0.7685842514038086, 1.7901582717895508, 2.811732292175293, 3.833306312561035, 4.854880332946777, 5.8764543533325195, 6.898028373718262, 7.919602394104004, 8.941176414489746, 9.962750434875488, 10.98432445526123, 12.005898475646973, 13.027472496032715, 14.049046516418457]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 7.0, 5.0, 11.0, 11.0, 11.0, 18.0, 21.0, 18.0, 29.0, 23.0, 30.0, 38.0, 44.0, 50.0, 49.0, 43.0, 57.0, 49.0, 41.0, 41.0, 45.0, 42.0, 34.0, 45.0, 36.0, 31.0, 22.0, 27.0, 16.0, 23.0, 13.0, 20.0, 15.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.96473503112793, -17.381614685058594, -16.79849624633789, -16.215375900268555, -15.632257461547852, -15.049137115478516, -14.466017723083496, -13.882898330688477, -13.299778938293457, -12.716659545898438, -12.133540153503418, -11.550420761108398, -10.967300415039062, -10.38418197631836, -9.801061630249023, -9.217942237854004, -8.634822845458984, -8.051703453063965, -7.468584060668945, -6.885464191436768, -6.302344799041748, -5.7192254066467285, -5.136105537414551, -4.552986145019531, -3.9698667526245117, -3.386747360229492, -2.8036277294158936, -2.220508098602295, -1.6373887062072754, -1.0542693138122559, -0.4711496829986572, 0.1119699478149414, 0.6950893402099609, 1.27820885181427, 1.861328363418579, 2.4444479942321777, 3.0275673866271973, 3.610686779022217, 4.1938066482543945, 4.776926040649414, 5.360045433044434, 5.943164825439453, 6.526284217834473, 7.10940408706665, 7.69252347946167, 8.275642395019531, 8.858762741088867, 9.441882133483887, 10.025001525878906, 10.608120918273926, 11.191240310668945, 11.774359703063965, 12.357479095458984, 12.94059944152832, 13.52371883392334, 14.10683822631836, 14.689957618713379, 15.273077011108398, 15.856196403503418, 16.439315795898438, 17.022436141967773, 17.605554580688477, 18.188674926757812, 18.771793365478516, 19.35491371154785]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 6.0, 6.0, 3.0, 6.0, 19.0, 18.0, 41.0, 59.0, 92.0, 138.0, 252.0, 359.0, 586.0, 1174.0, 2380.0, 5228.0, 13494.0, 48738.0, 274553.0, 2138753.0, 1474420.0, 178804.0, 35424.0, 10907.0, 4276.0, 2022.0, 1040.0, 614.0, 324.0, 195.0, 112.0, 76.0, 41.0, 38.0, 21.0, 17.0, 14.0, 4.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.40625, -7.14990234375, -6.8935546875, -6.63720703125, -6.380859375, -6.12451171875, -5.8681640625, -5.61181640625, -5.35546875, -5.09912109375, -4.8427734375, -4.58642578125, -4.330078125, -4.07373046875, -3.8173828125, -3.56103515625, -3.3046875, -3.04833984375, -2.7919921875, -2.53564453125, -2.279296875, -2.02294921875, -1.7666015625, -1.51025390625, -1.25390625, -0.99755859375, -0.7412109375, -0.48486328125, -0.228515625, 0.02783203125, 0.2841796875, 0.54052734375, 0.796875, 1.05322265625, 1.3095703125, 1.56591796875, 1.822265625, 2.07861328125, 2.3349609375, 2.59130859375, 2.84765625, 3.10400390625, 3.3603515625, 3.61669921875, 3.873046875, 4.12939453125, 4.3857421875, 4.64208984375, 4.8984375, 5.15478515625, 5.4111328125, 5.66748046875, 5.923828125, 6.18017578125, 6.4365234375, 6.69287109375, 6.94921875, 7.20556640625, 7.4619140625, 7.71826171875, 7.974609375, 8.23095703125, 8.4873046875, 8.74365234375, 9.0]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 14.0, 18.0, 18.0, 24.0, 22.0, 44.0, 40.0, 45.0, 61.0, 58.0, 59.0, 69.0, 60.0, 78.0, 55.0, 57.0, 45.0, 42.0, 37.0, 29.0, 23.0, 21.0, 12.0, 7.0, 6.0, 9.0, 11.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3046875, -5.0858154296875, -4.866943359375, -4.6480712890625, -4.42919921875, -4.2103271484375, -3.991455078125, -3.7725830078125, -3.5537109375, -3.3348388671875, -3.115966796875, -2.8970947265625, -2.67822265625, -2.4593505859375, -2.240478515625, -2.0216064453125, -1.802734375, -1.5838623046875, -1.364990234375, -1.1461181640625, -0.92724609375, -0.7083740234375, -0.489501953125, -0.2706298828125, -0.0517578125, 0.1671142578125, 0.385986328125, 0.6048583984375, 0.82373046875, 1.0426025390625, 1.261474609375, 1.4803466796875, 1.69921875, 1.9180908203125, 2.136962890625, 2.3558349609375, 2.57470703125, 2.7935791015625, 3.012451171875, 3.2313232421875, 3.4501953125, 3.6690673828125, 3.887939453125, 4.1068115234375, 4.32568359375, 4.5445556640625, 4.763427734375, 4.9822998046875, 5.201171875, 5.4200439453125, 5.638916015625, 5.8577880859375, 6.07666015625, 6.2955322265625, 6.514404296875, 6.7332763671875, 6.9521484375, 7.1710205078125, 7.389892578125, 7.6087646484375, 7.82763671875, 8.0465087890625, 8.265380859375, 8.4842529296875, 8.703125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 15.0, 16.0, 14.0, 24.0, 52.0, 64.0, 73.0, 115.0, 232.0, 345.0, 680.0, 1325.0, 3091.0, 8394.0, 28897.0, 156502.0, 2281612.0, 1559000.0, 117176.0, 23783.0, 7410.0, 2728.0, 1228.0, 613.0, 329.0, 186.0, 105.0, 93.0, 46.0, 22.0, 27.0, 20.0, 8.0, 14.0, 7.0, 8.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.19171142578125, -6.9342041015625, -6.67669677734375, -6.419189453125, -6.16168212890625, -5.9041748046875, -5.64666748046875, -5.38916015625, -5.13165283203125, -4.8741455078125, -4.61663818359375, -4.359130859375, -4.10162353515625, -3.8441162109375, -3.58660888671875, -3.3291015625, -3.07159423828125, -2.8140869140625, -2.55657958984375, -2.299072265625, -2.04156494140625, -1.7840576171875, -1.52655029296875, -1.26904296875, -1.01153564453125, -0.7540283203125, -0.49652099609375, -0.239013671875, 0.01849365234375, 0.2760009765625, 0.53350830078125, 0.791015625, 1.04852294921875, 1.3060302734375, 1.56353759765625, 1.821044921875, 2.07855224609375, 2.3360595703125, 2.59356689453125, 2.85107421875, 3.10858154296875, 3.3660888671875, 3.62359619140625, 3.881103515625, 4.13861083984375, 4.3961181640625, 4.65362548828125, 4.9111328125, 5.16864013671875, 5.4261474609375, 5.68365478515625, 5.941162109375, 6.19866943359375, 6.4561767578125, 6.71368408203125, 6.97119140625, 7.22869873046875, 7.4862060546875, 7.74371337890625, 8.001220703125, 8.25872802734375, 8.5162353515625, 8.77374267578125, 9.03125]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 11.0, 12.0, 20.0, 27.0, 35.0, 44.0, 80.0, 116.0, 168.0, 250.0, 339.0, 544.0, 651.0, 619.0, 385.0, 244.0, 160.0, 97.0, 79.0, 60.0, 29.0, 35.0, 23.0, 13.0, 9.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.623046875, -2.539947509765625, -2.45684814453125, -2.373748779296875, -2.2906494140625, -2.207550048828125, -2.12445068359375, -2.041351318359375, -1.958251953125, -1.875152587890625, -1.79205322265625, -1.708953857421875, -1.6258544921875, -1.542755126953125, -1.45965576171875, -1.376556396484375, -1.29345703125, -1.210357666015625, -1.12725830078125, -1.044158935546875, -0.9610595703125, -0.877960205078125, -0.79486083984375, -0.711761474609375, -0.628662109375, -0.545562744140625, -0.46246337890625, -0.379364013671875, -0.2962646484375, -0.213165283203125, -0.13006591796875, -0.046966552734375, 0.0361328125, 0.119232177734375, 0.20233154296875, 0.285430908203125, 0.3685302734375, 0.451629638671875, 0.53472900390625, 0.617828369140625, 0.700927734375, 0.784027099609375, 0.86712646484375, 0.950225830078125, 1.0333251953125, 1.116424560546875, 1.19952392578125, 1.282623291015625, 1.36572265625, 1.448822021484375, 1.53192138671875, 1.615020751953125, 1.6981201171875, 1.781219482421875, 1.86431884765625, 1.947418212890625, 2.030517578125, 2.113616943359375, 2.19671630859375, 2.279815673828125, 2.3629150390625, 2.446014404296875, 2.52911376953125, 2.612213134765625, 2.6953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 9.0, 16.0, 24.0, 25.0, 22.0, 47.0, 43.0, 58.0, 73.0, 85.0, 94.0, 104.0, 83.0, 59.0, 50.0, 52.0, 35.0, 28.0, 22.0, 11.0, 13.0, 13.0, 4.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.298828125, -8.003110885620117, -7.707393169403076, -7.411675453186035, -7.115958213806152, -6.820240497589111, -6.52452278137207, -6.2288055419921875, -5.9330878257751465, -5.6373701095581055, -5.341652870178223, -5.045935153961182, -4.750217437744141, -4.454500198364258, -4.158782482147217, -3.863065004348755, -3.567347526550293, -3.271630048751831, -2.975912570953369, -2.680194854736328, -2.384477376937866, -2.0887598991394043, -1.7930423021316528, -1.4973247051239014, -1.2016072273254395, -0.9058896899223328, -0.6101721525192261, -0.3144546151161194, -0.018737077713012695, 0.2769804000854492, 0.5726979970932007, 0.8684155941009521, 1.1641340255737305, 1.4598515033721924, 1.7555691003799438, 2.0512866973876953, 2.3470041751861572, 2.642721652984619, 2.93843936920166, 3.234156847000122, 3.529874324798584, 3.825591802597046, 4.121309280395508, 4.417026996612549, 4.71274471282959, 5.008461952209473, 5.304179668426514, 5.599897384643555, 5.8956146240234375, 6.1913323402404785, 6.487049579620361, 6.782767295837402, 7.078484535217285, 7.374202251434326, 7.669919967651367, 7.96563720703125, 8.261354446411133, 8.557071685791016, 8.852789878845215, 9.148507118225098, 9.44422435760498, 9.73994255065918, 10.035659790039062, 10.331377029418945, 10.627095222473145]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 13.0, 5.0, 12.0, 7.0, 20.0, 10.0, 17.0, 20.0, 30.0, 27.0, 34.0, 27.0, 31.0, 50.0, 42.0, 47.0, 43.0, 39.0, 44.0, 49.0, 40.0, 47.0, 44.0, 47.0, 38.0, 38.0, 35.0, 23.0, 20.0, 21.0, 9.0, 15.0, 11.0, 13.0, 7.0, 6.0, 13.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.892825126647949, -6.693816184997559, -6.49480676651001, -6.295797824859619, -6.09678840637207, -5.89777946472168, -5.698770523071289, -5.499761581420898, -5.30075216293335, -5.101743221282959, -4.90273380279541, -4.7037248611450195, -4.504715919494629, -4.30570650100708, -4.1066975593566895, -3.9076883792877197, -3.70867919921875, -3.5096700191497803, -3.3106608390808105, -3.11165189743042, -2.91264271736145, -2.7136335372924805, -2.51462459564209, -2.31561541557312, -2.1166062355041504, -1.9175970554351807, -1.7185879945755005, -1.5195789337158203, -1.3205697536468506, -1.1215605735778809, -0.9225515127182007, -0.7235424518585205, -0.524533748626709, -0.32552462816238403, -0.12651550769805908, 0.07249361276626587, 0.2715027332305908, 0.47051185369491577, 0.6695209741592407, 0.8685300350189209, 1.0675392150878906, 1.2665483951568604, 1.4655574560165405, 1.6645665168762207, 1.8635756969451904, 2.06258487701416, 2.261593818664551, 2.4606029987335205, 2.6596121788024902, 2.85862135887146, 3.0576305389404297, 3.2566394805908203, 3.45564866065979, 3.6546578407287598, 3.8536667823791504, 4.052676200866699, 4.25168514251709, 4.4506940841674805, 4.649703502655029, 4.84871244430542, 5.047721862792969, 5.246730804443359, 5.44573974609375, 5.644748687744141, 5.8437581062316895]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 8.0, 10.0, 26.0, 38.0, 53.0, 60.0, 100.0, 156.0, 217.0, 353.0, 611.0, 954.0, 1599.0, 2912.0, 5459.0, 10632.0, 23106.0, 52756.0, 148017.0, 361546.0, 274544.0, 94058.0, 36961.0, 16449.0, 8199.0, 4164.0, 2225.0, 1319.0, 783.0, 456.0, 282.0, 173.0, 107.0, 63.0, 52.0, 38.0, 19.0, 13.0, 16.0, 8.0, 4.0, 7.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-1.373046875, -1.334686279296875, -1.29632568359375, -1.257965087890625, -1.2196044921875, -1.181243896484375, -1.14288330078125, -1.104522705078125, -1.066162109375, -1.027801513671875, -0.98944091796875, -0.951080322265625, -0.9127197265625, -0.874359130859375, -0.83599853515625, -0.797637939453125, -0.75927734375, -0.720916748046875, -0.68255615234375, -0.644195556640625, -0.6058349609375, -0.567474365234375, -0.52911376953125, -0.490753173828125, -0.452392578125, -0.414031982421875, -0.37567138671875, -0.337310791015625, -0.2989501953125, -0.260589599609375, -0.22222900390625, -0.183868408203125, -0.1455078125, -0.107147216796875, -0.06878662109375, -0.030426025390625, 0.0079345703125, 0.046295166015625, 0.08465576171875, 0.123016357421875, 0.161376953125, 0.199737548828125, 0.23809814453125, 0.276458740234375, 0.3148193359375, 0.353179931640625, 0.39154052734375, 0.429901123046875, 0.46826171875, 0.506622314453125, 0.54498291015625, 0.583343505859375, 0.6217041015625, 0.660064697265625, 0.69842529296875, 0.736785888671875, 0.775146484375, 0.813507080078125, 0.85186767578125, 0.890228271484375, 0.9285888671875, 0.966949462890625, 1.00531005859375, 1.043670654296875, 1.08203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 7.0, 9.0, 12.0, 11.0, 15.0, 12.0, 19.0, 29.0, 27.0, 26.0, 24.0, 34.0, 39.0, 44.0, 39.0, 60.0, 49.0, 43.0, 47.0, 45.0, 51.0, 43.0, 36.0, 40.0, 34.0, 39.0, 32.0, 24.0, 21.0, 16.0, 10.0, 14.0, 12.0, 8.0, 7.0, 2.0, 6.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.3359375, -4.1943359375, -4.052734375, -3.9111328125, -3.76953125, -3.6279296875, -3.486328125, -3.3447265625, -3.203125, -3.0615234375, -2.919921875, -2.7783203125, -2.63671875, -2.4951171875, -2.353515625, -2.2119140625, -2.0703125, -1.9287109375, -1.787109375, -1.6455078125, -1.50390625, -1.3623046875, -1.220703125, -1.0791015625, -0.9375, -0.7958984375, -0.654296875, -0.5126953125, -0.37109375, -0.2294921875, -0.087890625, 0.0537109375, 0.1953125, 0.3369140625, 0.478515625, 0.6201171875, 0.76171875, 0.9033203125, 1.044921875, 1.1865234375, 1.328125, 1.4697265625, 1.611328125, 1.7529296875, 1.89453125, 2.0361328125, 2.177734375, 2.3193359375, 2.4609375, 2.6025390625, 2.744140625, 2.8857421875, 3.02734375, 3.1689453125, 3.310546875, 3.4521484375, 3.59375, 3.7353515625, 3.876953125, 4.0185546875, 4.16015625, 4.3017578125, 4.443359375, 4.5849609375, 4.7265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 11.0, 15.0, 14.0, 18.0, 23.0, 40.0, 55.0, 68.0, 113.0, 207.0, 316.0, 717.0, 1507.0, 3700.0, 10773.0, 37225.0, 174682.0, 519703.0, 230016.0, 48012.0, 13210.0, 4478.0, 1811.0, 814.0, 409.0, 219.0, 117.0, 89.0, 47.0, 37.0, 21.0, 22.0, 13.0, 14.0, 9.0, 5.0, 6.0, 12.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4931640625, -1.4426727294921875, -1.392181396484375, -1.3416900634765625, -1.29119873046875, -1.2407073974609375, -1.190216064453125, -1.1397247314453125, -1.0892333984375, -1.0387420654296875, -0.988250732421875, -0.9377593994140625, -0.88726806640625, -0.8367767333984375, -0.786285400390625, -0.7357940673828125, -0.685302734375, -0.6348114013671875, -0.584320068359375, -0.5338287353515625, -0.48333740234375, -0.4328460693359375, -0.382354736328125, -0.3318634033203125, -0.2813720703125, -0.2308807373046875, -0.180389404296875, -0.1298980712890625, -0.07940673828125, -0.0289154052734375, 0.021575927734375, 0.0720672607421875, 0.12255859375, 0.1730499267578125, 0.223541259765625, 0.2740325927734375, 0.32452392578125, 0.3750152587890625, 0.425506591796875, 0.4759979248046875, 0.5264892578125, 0.5769805908203125, 0.627471923828125, 0.6779632568359375, 0.72845458984375, 0.7789459228515625, 0.829437255859375, 0.8799285888671875, 0.930419921875, 0.9809112548828125, 1.031402587890625, 1.0818939208984375, 1.13238525390625, 1.1828765869140625, 1.233367919921875, 1.2838592529296875, 1.3343505859375, 1.3848419189453125, 1.435333251953125, 1.4858245849609375, 1.53631591796875, 1.5868072509765625, 1.637298583984375, 1.6877899169921875, 1.73828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 3.0, 7.0, 9.0, 15.0, 14.0, 20.0, 33.0, 25.0, 26.0, 42.0, 32.0, 42.0, 50.0, 50.0, 56.0, 50.0, 37.0, 57.0, 38.0, 61.0, 40.0, 40.0, 36.0, 32.0, 29.0, 27.0, 16.0, 24.0, 18.0, 13.0, 10.0, 7.0, 10.0, 9.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.7890625, -10.4932861328125, -10.197509765625, -9.9017333984375, -9.60595703125, -9.3101806640625, -9.014404296875, -8.7186279296875, -8.4228515625, -8.1270751953125, -7.831298828125, -7.5355224609375, -7.23974609375, -6.9439697265625, -6.648193359375, -6.3524169921875, -6.056640625, -5.7608642578125, -5.465087890625, -5.1693115234375, -4.87353515625, -4.5777587890625, -4.281982421875, -3.9862060546875, -3.6904296875, -3.3946533203125, -3.098876953125, -2.8031005859375, -2.50732421875, -2.2115478515625, -1.915771484375, -1.6199951171875, -1.32421875, -1.0284423828125, -0.732666015625, -0.4368896484375, -0.14111328125, 0.1546630859375, 0.450439453125, 0.7462158203125, 1.0419921875, 1.3377685546875, 1.633544921875, 1.9293212890625, 2.22509765625, 2.5208740234375, 2.816650390625, 3.1124267578125, 3.408203125, 3.7039794921875, 3.999755859375, 4.2955322265625, 4.59130859375, 4.8870849609375, 5.182861328125, 5.4786376953125, 5.7744140625, 6.0701904296875, 6.365966796875, 6.6617431640625, 6.95751953125, 7.2532958984375, 7.549072265625, 7.8448486328125, 8.140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 4.0, 7.0, 6.0, 10.0, 16.0, 30.0, 32.0, 60.0, 83.0, 142.0, 315.0, 506.0, 1111.0, 2760.0, 7959.0, 32273.0, 228489.0, 642753.0, 104471.0, 18561.0, 5086.0, 1985.0, 839.0, 463.0, 201.0, 149.0, 100.0, 44.0, 33.0, 16.0, 16.0, 5.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9072265625, -0.8773040771484375, -0.847381591796875, -0.8174591064453125, -0.78753662109375, -0.7576141357421875, -0.727691650390625, -0.6977691650390625, -0.6678466796875, -0.6379241943359375, -0.608001708984375, -0.5780792236328125, -0.54815673828125, -0.5182342529296875, -0.488311767578125, -0.4583892822265625, -0.428466796875, -0.3985443115234375, -0.368621826171875, -0.3386993408203125, -0.30877685546875, -0.2788543701171875, -0.248931884765625, -0.2190093994140625, -0.1890869140625, -0.1591644287109375, -0.129241943359375, -0.0993194580078125, -0.06939697265625, -0.0394744873046875, -0.009552001953125, 0.0203704833984375, 0.05029296875, 0.0802154541015625, 0.110137939453125, 0.1400604248046875, 0.16998291015625, 0.1999053955078125, 0.229827880859375, 0.2597503662109375, 0.2896728515625, 0.3195953369140625, 0.349517822265625, 0.3794403076171875, 0.40936279296875, 0.4392852783203125, 0.469207763671875, 0.4991302490234375, 0.529052734375, 0.5589752197265625, 0.588897705078125, 0.6188201904296875, 0.64874267578125, 0.6786651611328125, 0.708587646484375, 0.7385101318359375, 0.7684326171875, 0.7983551025390625, 0.828277587890625, 0.8582000732421875, 0.88812255859375, 0.9180450439453125, 0.947967529296875, 0.9778900146484375, 1.0078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 8.0, 3.0, 15.0, 29.0, 28.0, 51.0, 66.0, 92.0, 107.0, 150.0, 114.0, 90.0, 55.0, 54.0, 34.0, 28.0, 14.0, 16.0, 6.0, 12.0, 11.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0005254745483398438, -0.000512830913066864, -0.0005001872777938843, -0.00048754364252090454, -0.0004749000072479248, -0.00046225637197494507, -0.00044961273670196533, -0.0004369691014289856, -0.00042432546615600586, -0.0004116818308830261, -0.0003990381956100464, -0.00038639456033706665, -0.0003737509250640869, -0.0003611072897911072, -0.00034846365451812744, -0.0003358200192451477, -0.00032317638397216797, -0.00031053274869918823, -0.0002978891134262085, -0.00028524547815322876, -0.000272601842880249, -0.0002599582076072693, -0.00024731457233428955, -0.00023467093706130981, -0.00022202730178833008, -0.00020938366651535034, -0.0001967400312423706, -0.00018409639596939087, -0.00017145276069641113, -0.0001588091254234314, -0.00014616549015045166, -0.00013352185487747192, -0.00012087821960449219, -0.00010823458433151245, -9.559094905853271e-05, -8.294731378555298e-05, -7.030367851257324e-05, -5.7660043239593506e-05, -4.501640796661377e-05, -3.237277269363403e-05, -1.9729137420654297e-05, -7.0855021476745605e-06, 5.558133125305176e-06, 1.8201768398284912e-05, 3.084540367126465e-05, 4.3489038944244385e-05, 5.613267421722412e-05, 6.877630949020386e-05, 8.14199447631836e-05, 9.406358003616333e-05, 0.00010670721530914307, 0.0001193508505821228, 0.00013199448585510254, 0.00014463812112808228, 0.000157281756401062, 0.00016992539167404175, 0.00018256902694702148, 0.00019521266222000122, 0.00020785629749298096, 0.0002204999327659607, 0.00023314356803894043, 0.00024578720331192017, 0.0002584308385848999, 0.00027107447385787964, 0.0002837181091308594]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 12.0, 10.0, 17.0, 25.0, 33.0, 54.0, 53.0, 90.0, 159.0, 271.0, 439.0, 770.0, 1426.0, 3205.0, 8497.0, 28573.0, 159141.0, 651838.0, 151345.0, 27773.0, 8231.0, 3196.0, 1466.0, 758.0, 407.0, 273.0, 154.0, 94.0, 80.0, 46.0, 35.0, 29.0, 14.0, 13.0, 8.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0380859375, -1.0070877075195312, -0.9760894775390625, -0.9450912475585938, -0.914093017578125, -0.8830947875976562, -0.8520965576171875, -0.8210983276367188, -0.79010009765625, -0.7591018676757812, -0.7281036376953125, -0.6971054077148438, -0.666107177734375, -0.6351089477539062, -0.6041107177734375, -0.5731124877929688, -0.5421142578125, -0.5111160278320312, -0.4801177978515625, -0.44911956787109375, -0.418121337890625, -0.38712310791015625, -0.3561248779296875, -0.32512664794921875, -0.29412841796875, -0.26313018798828125, -0.2321319580078125, -0.20113372802734375, -0.170135498046875, -0.13913726806640625, -0.1081390380859375, -0.07714080810546875, -0.046142578125, -0.01514434814453125, 0.0158538818359375, 0.04685211181640625, 0.077850341796875, 0.10884857177734375, 0.1398468017578125, 0.17084503173828125, 0.20184326171875, 0.23284149169921875, 0.2638397216796875, 0.29483795166015625, 0.325836181640625, 0.35683441162109375, 0.3878326416015625, 0.41883087158203125, 0.4498291015625, 0.48082733154296875, 0.5118255615234375, 0.5428237915039062, 0.573822021484375, 0.6048202514648438, 0.6358184814453125, 0.6668167114257812, 0.69781494140625, 0.7288131713867188, 0.7598114013671875, 0.7908096313476562, 0.821807861328125, 0.8528060913085938, 0.8838043212890625, 0.9148025512695312, 0.94580078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 4.0, 4.0, 11.0, 10.0, 20.0, 15.0, 19.0, 24.0, 41.0, 38.0, 54.0, 77.0, 102.0, 120.0, 112.0, 83.0, 68.0, 45.0, 35.0, 28.0, 19.0, 10.0, 8.0, 5.0, 8.0, 9.0, 8.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1796875, -0.1731548309326172, -0.16662216186523438, -0.16008949279785156, -0.15355682373046875, -0.14702415466308594, -0.14049148559570312, -0.1339588165283203, -0.1274261474609375, -0.12089347839355469, -0.11436080932617188, -0.10782814025878906, -0.10129547119140625, -0.09476280212402344, -0.08823013305664062, -0.08169746398925781, -0.075164794921875, -0.06863212585449219, -0.062099456787109375, -0.05556678771972656, -0.04903411865234375, -0.04250144958496094, -0.035968780517578125, -0.029436111450195312, -0.0229034423828125, -0.016370773315429688, -0.009838104248046875, -0.0033054351806640625, 0.00322723388671875, 0.009759902954101562, 0.016292572021484375, 0.022825241088867188, 0.02935791015625, 0.03589057922363281, 0.042423248291015625, 0.04895591735839844, 0.05548858642578125, 0.06202125549316406, 0.06855392456054688, 0.07508659362792969, 0.0816192626953125, 0.08815193176269531, 0.09468460083007812, 0.10121726989746094, 0.10774993896484375, 0.11428260803222656, 0.12081527709960938, 0.1273479461669922, 0.133880615234375, 0.1404132843017578, 0.14694595336914062, 0.15347862243652344, 0.16001129150390625, 0.16654396057128906, 0.17307662963867188, 0.1796092987060547, 0.1861419677734375, 0.1926746368408203, 0.19920730590820312, 0.20573997497558594, 0.21227264404296875, 0.21880531311035156, 0.22533798217773438, 0.2318706512451172, 0.2384033203125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 10.0, 17.0, 28.0, 30.0, 47.0, 63.0, 95.0, 131.0, 124.0, 136.0, 82.0, 68.0, 45.0, 35.0, 24.0, 16.0, 15.0, 11.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.032035827636719, -7.778270244598389, -7.524504661560059, -7.2707390785217285, -7.016973495483398, -6.763207912445068, -6.509442329406738, -6.255676746368408, -6.001911163330078, -5.748145580291748, -5.494379997253418, -5.240614414215088, -4.986848831176758, -4.733083248138428, -4.479317665100098, -4.225552082061768, -3.9717864990234375, -3.7180209159851074, -3.4642553329467773, -3.2104897499084473, -2.956724166870117, -2.702958583831787, -2.449193000793457, -2.195427417755127, -1.9416618347167969, -1.6878962516784668, -1.4341306686401367, -1.1803650856018066, -0.9265995025634766, -0.6728339195251465, -0.4190683364868164, -0.16530275344848633, 0.08846378326416016, 0.34222936630249023, 0.5959949493408203, 0.8497605323791504, 1.1035261154174805, 1.3572916984558105, 1.6110572814941406, 1.8648228645324707, 2.118588447570801, 2.372354030609131, 2.626119613647461, 2.879885196685791, 3.133650779724121, 3.387416362762451, 3.6411819458007812, 3.8949475288391113, 4.148713111877441, 4.4024786949157715, 4.656244277954102, 4.910009860992432, 5.163775444030762, 5.417541027069092, 5.671306610107422, 5.925072193145752, 6.178837776184082, 6.432603359222412, 6.686368942260742, 6.940134525299072, 7.193900108337402, 7.447665691375732, 7.7014312744140625, 7.955196857452393, 8.208962440490723]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 7.0, 9.0, 16.0, 13.0, 27.0, 16.0, 21.0, 29.0, 35.0, 27.0, 39.0, 50.0, 44.0, 51.0, 52.0, 39.0, 58.0, 44.0, 49.0, 55.0, 52.0, 33.0, 39.0, 35.0, 34.0, 18.0, 15.0, 13.0, 15.0, 16.0, 5.0, 7.0, 9.0, 7.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.473176956176758, -4.333288192749023, -4.193399429321289, -4.053510665893555, -3.9136219024658203, -3.773733139038086, -3.6338441371917725, -3.493955373764038, -3.3540666103363037, -3.2141778469085693, -3.074289083480835, -2.9344003200531006, -2.794511318206787, -2.6546225547790527, -2.5147337913513184, -2.374845027923584, -2.2349562644958496, -2.0950675010681152, -1.9551787376403809, -1.815289855003357, -1.6754010915756226, -1.5355123281478882, -1.3956234455108643, -1.2557346820831299, -1.1158459186553955, -0.9759571552276611, -0.836068332195282, -0.6961795091629028, -0.5562907457351685, -0.4164019823074341, -0.27651315927505493, -0.13662433624267578, 0.0032644271850585938, 0.14315322041511536, 0.2830420136451721, 0.4229308068752289, 0.5628196001052856, 0.70270836353302, 0.8425971865653992, 0.9824860095977783, 1.1223747730255127, 1.262263536453247, 1.4021522998809814, 1.5420411825180054, 1.6819299459457397, 1.8218187093734741, 1.961707592010498, 2.1015963554382324, 2.241485118865967, 2.381373882293701, 2.5212626457214355, 2.66115140914917, 2.8010401725769043, 2.9409289360046387, 3.080817937850952, 3.2207067012786865, 3.360595464706421, 3.5004842281341553, 3.6403729915618896, 3.780261754989624, 3.9201507568359375, 4.060039520263672, 4.199928283691406, 4.339817047119141, 4.479705810546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 3.0, 5.0, 6.0, 9.0, 9.0, 8.0, 10.0, 23.0, 31.0, 51.0, 69.0, 88.0, 126.0, 184.0, 246.0, 430.0, 563.0, 852.0, 1364.0, 2142.0, 3436.0, 5914.0, 10326.0, 19099.0, 38123.0, 87802.0, 263049.0, 380695.0, 127326.0, 50468.0, 24413.0, 13013.0, 7098.0, 4218.0, 2578.0, 1590.0, 1045.0, 692.0, 428.0, 325.0, 185.0, 159.0, 118.0, 69.0, 48.0, 40.0, 18.0, 16.0, 12.0, 7.0, 5.0, 6.0, 7.0, 4.0, 4.0, 0.0, 3.0], "bins": [-3.30078125, -3.2042236328125, -3.107666015625, -3.0111083984375, -2.91455078125, -2.8179931640625, -2.721435546875, -2.6248779296875, -2.5283203125, -2.4317626953125, -2.335205078125, -2.2386474609375, -2.14208984375, -2.0455322265625, -1.948974609375, -1.8524169921875, -1.755859375, -1.6593017578125, -1.562744140625, -1.4661865234375, -1.36962890625, -1.2730712890625, -1.176513671875, -1.0799560546875, -0.9833984375, -0.8868408203125, -0.790283203125, -0.6937255859375, -0.59716796875, -0.5006103515625, -0.404052734375, -0.3074951171875, -0.2109375, -0.1143798828125, -0.017822265625, 0.0787353515625, 0.17529296875, 0.2718505859375, 0.368408203125, 0.4649658203125, 0.5615234375, 0.6580810546875, 0.754638671875, 0.8511962890625, 0.94775390625, 1.0443115234375, 1.140869140625, 1.2374267578125, 1.333984375, 1.4305419921875, 1.527099609375, 1.6236572265625, 1.72021484375, 1.8167724609375, 1.913330078125, 2.0098876953125, 2.1064453125, 2.2030029296875, 2.299560546875, 2.3961181640625, 2.49267578125, 2.5892333984375, 2.685791015625, 2.7823486328125, 2.87890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 11.0, 2.0, 15.0, 14.0, 20.0, 17.0, 31.0, 25.0, 30.0, 38.0, 36.0, 51.0, 45.0, 61.0, 59.0, 49.0, 67.0, 53.0, 64.0, 41.0, 44.0, 43.0, 32.0, 23.0, 38.0, 19.0, 12.0, 12.0, 7.0, 17.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0546875, -9.7159423828125, -9.377197265625, -9.0384521484375, -8.69970703125, -8.3609619140625, -8.022216796875, -7.6834716796875, -7.3447265625, -7.0059814453125, -6.667236328125, -6.3284912109375, -5.98974609375, -5.6510009765625, -5.312255859375, -4.9735107421875, -4.634765625, -4.2960205078125, -3.957275390625, -3.6185302734375, -3.27978515625, -2.9410400390625, -2.602294921875, -2.2635498046875, -1.9248046875, -1.5860595703125, -1.247314453125, -0.9085693359375, -0.56982421875, -0.2310791015625, 0.107666015625, 0.4464111328125, 0.78515625, 1.1239013671875, 1.462646484375, 1.8013916015625, 2.14013671875, 2.4788818359375, 2.817626953125, 3.1563720703125, 3.4951171875, 3.8338623046875, 4.172607421875, 4.5113525390625, 4.85009765625, 5.1888427734375, 5.527587890625, 5.8663330078125, 6.205078125, 6.5438232421875, 6.882568359375, 7.2213134765625, 7.56005859375, 7.8988037109375, 8.237548828125, 8.5762939453125, 8.9150390625, 9.2537841796875, 9.592529296875, 9.9312744140625, 10.27001953125, 10.6087646484375, 10.947509765625, 11.2862548828125, 11.625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 11.0, 7.0, 9.0, 13.0, 20.0, 31.0, 50.0, 49.0, 55.0, 88.0, 137.0, 227.0, 459.0, 1045.0, 2671.0, 8498.0, 31993.0, 189342.0, 667405.0, 113373.0, 22794.0, 6232.0, 2092.0, 791.0, 410.0, 237.0, 135.0, 110.0, 69.0, 48.0, 30.0, 27.0, 16.0, 18.0, 12.0, 7.0, 10.0, 10.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.015625, -4.85052490234375, -4.6854248046875, -4.52032470703125, -4.355224609375, -4.19012451171875, -4.0250244140625, -3.85992431640625, -3.69482421875, -3.52972412109375, -3.3646240234375, -3.19952392578125, -3.034423828125, -2.86932373046875, -2.7042236328125, -2.53912353515625, -2.3740234375, -2.20892333984375, -2.0438232421875, -1.87872314453125, -1.713623046875, -1.54852294921875, -1.3834228515625, -1.21832275390625, -1.05322265625, -0.88812255859375, -0.7230224609375, -0.55792236328125, -0.392822265625, -0.22772216796875, -0.0626220703125, 0.10247802734375, 0.267578125, 0.43267822265625, 0.5977783203125, 0.76287841796875, 0.927978515625, 1.09307861328125, 1.2581787109375, 1.42327880859375, 1.58837890625, 1.75347900390625, 1.9185791015625, 2.08367919921875, 2.248779296875, 2.41387939453125, 2.5789794921875, 2.74407958984375, 2.9091796875, 3.07427978515625, 3.2393798828125, 3.40447998046875, 3.569580078125, 3.73468017578125, 3.8997802734375, 4.06488037109375, 4.22998046875, 4.39508056640625, 4.5601806640625, 4.72528076171875, 4.890380859375, 5.05548095703125, 5.2205810546875, 5.38568115234375, 5.55078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 7.0, 9.0, 8.0, 12.0, 9.0, 21.0, 22.0, 20.0, 20.0, 25.0, 31.0, 36.0, 27.0, 37.0, 42.0, 36.0, 38.0, 44.0, 40.0, 40.0, 38.0, 46.0, 41.0, 40.0, 30.0, 35.0, 27.0, 26.0, 30.0, 22.0, 22.0, 25.0, 13.0, 13.0, 12.0, 10.0, 7.0, 10.0, 6.0, 7.0, 5.0, 0.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.0, -9.685302734375, -9.37060546875, -9.055908203125, -8.7412109375, -8.426513671875, -8.11181640625, -7.797119140625, -7.482421875, -7.167724609375, -6.85302734375, -6.538330078125, -6.2236328125, -5.908935546875, -5.59423828125, -5.279541015625, -4.96484375, -4.650146484375, -4.33544921875, -4.020751953125, -3.7060546875, -3.391357421875, -3.07666015625, -2.761962890625, -2.447265625, -2.132568359375, -1.81787109375, -1.503173828125, -1.1884765625, -0.873779296875, -0.55908203125, -0.244384765625, 0.0703125, 0.385009765625, 0.69970703125, 1.014404296875, 1.3291015625, 1.643798828125, 1.95849609375, 2.273193359375, 2.587890625, 2.902587890625, 3.21728515625, 3.531982421875, 3.8466796875, 4.161376953125, 4.47607421875, 4.790771484375, 5.10546875, 5.420166015625, 5.73486328125, 6.049560546875, 6.3642578125, 6.678955078125, 6.99365234375, 7.308349609375, 7.623046875, 7.937744140625, 8.25244140625, 8.567138671875, 8.8818359375, 9.196533203125, 9.51123046875, 9.825927734375, 10.140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 2.0, 4.0, 2.0, 3.0, 10.0, 14.0, 22.0, 32.0, 51.0, 67.0, 122.0, 218.0, 384.0, 688.0, 1546.0, 3693.0, 10715.0, 37342.0, 168800.0, 572856.0, 190756.0, 42158.0, 11804.0, 3994.0, 1622.0, 744.0, 370.0, 190.0, 134.0, 75.0, 51.0, 32.0, 18.0, 16.0, 2.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.5341796875, -1.4910125732421875, -1.447845458984375, -1.4046783447265625, -1.36151123046875, -1.3183441162109375, -1.275177001953125, -1.2320098876953125, -1.1888427734375, -1.1456756591796875, -1.102508544921875, -1.0593414306640625, -1.01617431640625, -0.9730072021484375, -0.929840087890625, -0.8866729736328125, -0.843505859375, -0.8003387451171875, -0.757171630859375, -0.7140045166015625, -0.67083740234375, -0.6276702880859375, -0.584503173828125, -0.5413360595703125, -0.4981689453125, -0.4550018310546875, -0.411834716796875, -0.3686676025390625, -0.32550048828125, -0.2823333740234375, -0.239166259765625, -0.1959991455078125, -0.15283203125, -0.1096649169921875, -0.066497802734375, -0.0233306884765625, 0.01983642578125, 0.0630035400390625, 0.106170654296875, 0.1493377685546875, 0.1925048828125, 0.2356719970703125, 0.278839111328125, 0.3220062255859375, 0.36517333984375, 0.4083404541015625, 0.451507568359375, 0.4946746826171875, 0.537841796875, 0.5810089111328125, 0.624176025390625, 0.6673431396484375, 0.71051025390625, 0.7536773681640625, 0.796844482421875, 0.8400115966796875, 0.8831787109375, 0.9263458251953125, 0.969512939453125, 1.0126800537109375, 1.05584716796875, 1.0990142822265625, 1.142181396484375, 1.1853485107421875, 1.228515625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 3.0, 5.0, 9.0, 7.0, 12.0, 11.0, 16.0, 12.0, 28.0, 37.0, 44.0, 66.0, 83.0, 127.0, 151.0, 111.0, 78.0, 59.0, 44.0, 35.0, 22.0, 17.0, 10.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003955364227294922, -0.00038573332130908966, -0.00037593021988868713, -0.0003661271184682846, -0.0003563240170478821, -0.00034652091562747955, -0.000336717814207077, -0.0003269147127866745, -0.00031711161136627197, -0.00030730850994586945, -0.0002975054085254669, -0.0002877023071050644, -0.00027789920568466187, -0.00026809610426425934, -0.0002582930028438568, -0.0002484899014234543, -0.00023868680000305176, -0.00022888369858264923, -0.0002190805971622467, -0.00020927749574184418, -0.00019947439432144165, -0.00018967129290103912, -0.0001798681914806366, -0.00017006509006023407, -0.00016026198863983154, -0.00015045888721942902, -0.0001406557857990265, -0.00013085268437862396, -0.00012104958295822144, -0.00011124648153781891, -0.00010144338011741638, -9.164027869701385e-05, -8.183717727661133e-05, -7.20340758562088e-05, -6.223097443580627e-05, -5.242787301540375e-05, -4.262477159500122e-05, -3.2821670174598694e-05, -2.3018568754196167e-05, -1.321546733379364e-05, -3.4123659133911133e-06, 6.3907355070114136e-06, 1.619383692741394e-05, 2.5996938347816467e-05, 3.5800039768218994e-05, 4.560314118862152e-05, 5.540624260902405e-05, 6.520934402942657e-05, 7.50124454498291e-05, 8.481554687023163e-05, 9.461864829063416e-05, 0.00010442174971103668, 0.00011422485113143921, 0.00012402795255184174, 0.00013383105397224426, 0.0001436341553926468, 0.00015343725681304932, 0.00016324035823345184, 0.00017304345965385437, 0.0001828465610742569, 0.00019264966249465942, 0.00020245276391506195, 0.00021225586533546448, 0.000222058966755867, 0.00023186206817626953]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 10.0, 3.0, 6.0, 8.0, 11.0, 20.0, 30.0, 37.0, 65.0, 107.0, 187.0, 323.0, 718.0, 1670.0, 4215.0, 12991.0, 47201.0, 207840.0, 579250.0, 143852.0, 34236.0, 9925.0, 3240.0, 1313.0, 591.0, 301.0, 133.0, 87.0, 58.0, 46.0, 33.0, 18.0, 13.0, 9.0, 8.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6396484375, -1.5933074951171875, -1.546966552734375, -1.5006256103515625, -1.45428466796875, -1.4079437255859375, -1.361602783203125, -1.3152618408203125, -1.2689208984375, -1.2225799560546875, -1.176239013671875, -1.1298980712890625, -1.08355712890625, -1.0372161865234375, -0.990875244140625, -0.9445343017578125, -0.898193359375, -0.8518524169921875, -0.805511474609375, -0.7591705322265625, -0.71282958984375, -0.6664886474609375, -0.620147705078125, -0.5738067626953125, -0.5274658203125, -0.4811248779296875, -0.434783935546875, -0.3884429931640625, -0.34210205078125, -0.2957611083984375, -0.249420166015625, -0.2030792236328125, -0.15673828125, -0.1103973388671875, -0.064056396484375, -0.0177154541015625, 0.02862548828125, 0.0749664306640625, 0.121307373046875, 0.1676483154296875, 0.2139892578125, 0.2603302001953125, 0.306671142578125, 0.3530120849609375, 0.39935302734375, 0.4456939697265625, 0.492034912109375, 0.5383758544921875, 0.584716796875, 0.6310577392578125, 0.677398681640625, 0.7237396240234375, 0.77008056640625, 0.8164215087890625, 0.862762451171875, 0.9091033935546875, 0.9554443359375, 1.0017852783203125, 1.048126220703125, 1.0944671630859375, 1.14080810546875, 1.1871490478515625, 1.233489990234375, 1.2798309326171875, 1.326171875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 7.0, 11.0, 8.0, 7.0, 18.0, 17.0, 29.0, 39.0, 40.0, 50.0, 82.0, 92.0, 114.0, 95.0, 61.0, 53.0, 48.0, 58.0, 34.0, 28.0, 25.0, 19.0, 9.0, 10.0, 9.0, 6.0, 9.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56640625, -0.5454254150390625, -0.524444580078125, -0.5034637451171875, -0.48248291015625, -0.4615020751953125, -0.440521240234375, -0.4195404052734375, -0.3985595703125, -0.3775787353515625, -0.356597900390625, -0.3356170654296875, -0.31463623046875, -0.2936553955078125, -0.272674560546875, -0.2516937255859375, -0.230712890625, -0.2097320556640625, -0.188751220703125, -0.1677703857421875, -0.14678955078125, -0.1258087158203125, -0.104827880859375, -0.0838470458984375, -0.0628662109375, -0.0418853759765625, -0.020904541015625, 7.62939453125e-05, 0.02105712890625, 0.0420379638671875, 0.063018798828125, 0.0839996337890625, 0.10498046875, 0.1259613037109375, 0.146942138671875, 0.1679229736328125, 0.18890380859375, 0.2098846435546875, 0.230865478515625, 0.2518463134765625, 0.2728271484375, 0.2938079833984375, 0.314788818359375, 0.3357696533203125, 0.35675048828125, 0.3777313232421875, 0.398712158203125, 0.4196929931640625, 0.440673828125, 0.4616546630859375, 0.482635498046875, 0.5036163330078125, 0.52459716796875, 0.5455780029296875, 0.566558837890625, 0.5875396728515625, 0.6085205078125, 0.6295013427734375, 0.650482177734375, 0.6714630126953125, 0.69244384765625, 0.7134246826171875, 0.734405517578125, 0.7553863525390625, 0.7763671875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 3.0, 8.0, 23.0, 44.0, 86.0, 199.0, 230.0, 198.0, 111.0, 53.0, 24.0, 12.0, 5.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.984786987304688, -13.028854370117188, -12.072922706604004, -11.116990089416504, -10.16105842590332, -9.20512580871582, -8.24919319152832, -7.293261528015137, -6.337329387664795, -5.381397247314453, -4.425465106964111, -3.4695327281951904, -2.5136005878448486, -1.5576682090759277, -0.6017360687255859, 0.35419607162475586, 1.3101282119750977, 2.2660603523254395, 3.2219924926757812, 4.177925109863281, 5.133856773376465, 6.089789390563965, 7.045721530914307, 8.001653671264648, 8.957586288452148, 9.913518905639648, 10.869450569152832, 11.825383186340332, 12.781314849853516, 13.737247467041016, 14.693180084228516, 15.6491117477417, 16.605043411254883, 17.560976028442383, 18.516908645629883, 19.47283935546875, 20.42877197265625, 21.38470458984375, 22.34063720703125, 23.29656982421875, 24.252500534057617, 25.208433151245117, 26.164365768432617, 27.120296478271484, 28.076229095458984, 29.032161712646484, 29.988094329833984, 30.944026947021484, 31.899959564208984, 32.855892181396484, 33.811824798583984, 34.767757415771484, 35.723690032958984, 36.67961883544922, 37.63555145263672, 38.59148406982422, 39.54741668701172, 40.50334930419922, 41.45928192138672, 42.41521453857422, 43.37114715576172, 44.32707977294922, 45.28300857543945, 46.23894119262695, 47.19487380981445]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 1.0, 6.0, 5.0, 6.0, 8.0, 10.0, 13.0, 11.0, 15.0, 15.0, 21.0, 37.0, 22.0, 33.0, 39.0, 32.0, 33.0, 37.0, 44.0, 50.0, 51.0, 54.0, 50.0, 35.0, 37.0, 35.0, 34.0, 37.0, 37.0, 31.0, 30.0, 26.0, 20.0, 14.0, 13.0, 10.0, 11.0, 9.0, 7.0, 8.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-20.426511764526367, -19.849178314208984, -19.27184295654297, -18.694509506225586, -18.117176055908203, -17.539840698242188, -16.962507247924805, -16.385173797607422, -15.807838439941406, -15.230504035949707, -14.653169631958008, -14.075836181640625, -13.498501777648926, -12.921167373657227, -12.343833923339844, -11.766499519348145, -11.189165115356445, -10.611830711364746, -10.034496307373047, -9.457162857055664, -8.879828453063965, -8.302494049072266, -7.725160121917725, -7.147826194763184, -6.570491790771484, -5.993157386779785, -5.415823459625244, -4.838489532470703, -4.261155128479004, -3.683820962905884, -3.1064867973327637, -2.5291528701782227, -1.9518203735351562, -1.3744862079620361, -0.797152042388916, -0.2198178768157959, 0.3575162887573242, 0.9348504543304443, 1.5121846199035645, 2.0895185470581055, 2.6668529510498047, 3.244187116622925, 3.821521282196045, 4.398855209350586, 4.976189613342285, 5.553524017333984, 6.130857944488525, 6.708191871643066, 7.285526275634766, 7.862860679626465, 8.440195083618164, 9.017528533935547, 9.594862937927246, 10.172197341918945, 10.749530792236328, 11.326865196228027, 11.904199600219727, 12.481534004211426, 13.058868408203125, 13.636201858520508, 14.213536262512207, 14.790870666503906, 15.368204116821289, 15.945538520812988, 16.522872924804688]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 10.0, 7.0, 17.0, 18.0, 30.0, 49.0, 83.0, 133.0, 216.0, 443.0, 848.0, 2071.0, 5894.0, 25899.0, 247583.0, 3147191.0, 700845.0, 49196.0, 8805.0, 2736.0, 1005.0, 552.0, 252.0, 150.0, 90.0, 58.0, 38.0, 18.0, 11.0, 10.0, 4.0, 6.0, 3.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.671875, -8.305419921875, -7.93896484375, -7.572509765625, -7.2060546875, -6.839599609375, -6.47314453125, -6.106689453125, -5.740234375, -5.373779296875, -5.00732421875, -4.640869140625, -4.2744140625, -3.907958984375, -3.54150390625, -3.175048828125, -2.80859375, -2.442138671875, -2.07568359375, -1.709228515625, -1.3427734375, -0.976318359375, -0.60986328125, -0.243408203125, 0.123046875, 0.489501953125, 0.85595703125, 1.222412109375, 1.5888671875, 1.955322265625, 2.32177734375, 2.688232421875, 3.0546875, 3.421142578125, 3.78759765625, 4.154052734375, 4.5205078125, 4.886962890625, 5.25341796875, 5.619873046875, 5.986328125, 6.352783203125, 6.71923828125, 7.085693359375, 7.4521484375, 7.818603515625, 8.18505859375, 8.551513671875, 8.91796875, 9.284423828125, 9.65087890625, 10.017333984375, 10.3837890625, 10.750244140625, 11.11669921875, 11.483154296875, 11.849609375, 12.216064453125, 12.58251953125, 12.948974609375, 13.3154296875, 13.681884765625, 14.04833984375, 14.414794921875, 14.78125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 5.0, 9.0, 15.0, 16.0, 10.0, 14.0, 26.0, 37.0, 35.0, 50.0, 42.0, 48.0, 51.0, 66.0, 48.0, 59.0, 65.0, 54.0, 53.0, 54.0, 48.0, 32.0, 42.0, 32.0, 19.0, 14.0, 15.0, 7.0, 6.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.82421875, -5.63201904296875, -5.4398193359375, -5.24761962890625, -5.055419921875, -4.86322021484375, -4.6710205078125, -4.47882080078125, -4.28662109375, -4.09442138671875, -3.9022216796875, -3.71002197265625, -3.517822265625, -3.32562255859375, -3.1334228515625, -2.94122314453125, -2.7490234375, -2.55682373046875, -2.3646240234375, -2.17242431640625, -1.980224609375, -1.78802490234375, -1.5958251953125, -1.40362548828125, -1.21142578125, -1.01922607421875, -0.8270263671875, -0.63482666015625, -0.442626953125, -0.25042724609375, -0.0582275390625, 0.13397216796875, 0.326171875, 0.51837158203125, 0.7105712890625, 0.90277099609375, 1.094970703125, 1.28717041015625, 1.4793701171875, 1.67156982421875, 1.86376953125, 2.05596923828125, 2.2481689453125, 2.44036865234375, 2.632568359375, 2.82476806640625, 3.0169677734375, 3.20916748046875, 3.4013671875, 3.59356689453125, 3.7857666015625, 3.97796630859375, 4.170166015625, 4.36236572265625, 4.5545654296875, 4.74676513671875, 4.93896484375, 5.13116455078125, 5.3233642578125, 5.51556396484375, 5.707763671875, 5.89996337890625, 6.0921630859375, 6.28436279296875, 6.4765625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 8.0, 1.0, 6.0, 12.0, 15.0, 23.0, 30.0, 51.0, 68.0, 138.0, 242.0, 546.0, 1235.0, 3693.0, 14715.0, 96242.0, 2531514.0, 1461395.0, 67638.0, 11496.0, 3072.0, 1127.0, 464.0, 202.0, 130.0, 74.0, 53.0, 24.0, 24.0, 21.0, 4.0, 7.0, 7.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.96875, -10.6251220703125, -10.281494140625, -9.9378662109375, -9.59423828125, -9.2506103515625, -8.906982421875, -8.5633544921875, -8.2197265625, -7.8760986328125, -7.532470703125, -7.1888427734375, -6.84521484375, -6.5015869140625, -6.157958984375, -5.8143310546875, -5.470703125, -5.1270751953125, -4.783447265625, -4.4398193359375, -4.09619140625, -3.7525634765625, -3.408935546875, -3.0653076171875, -2.7216796875, -2.3780517578125, -2.034423828125, -1.6907958984375, -1.34716796875, -1.0035400390625, -0.659912109375, -0.3162841796875, 0.02734375, 0.3709716796875, 0.714599609375, 1.0582275390625, 1.40185546875, 1.7454833984375, 2.089111328125, 2.4327392578125, 2.7763671875, 3.1199951171875, 3.463623046875, 3.8072509765625, 4.15087890625, 4.4945068359375, 4.838134765625, 5.1817626953125, 5.525390625, 5.8690185546875, 6.212646484375, 6.5562744140625, 6.89990234375, 7.2435302734375, 7.587158203125, 7.9307861328125, 8.2744140625, 8.6180419921875, 8.961669921875, 9.3052978515625, 9.64892578125, 9.9925537109375, 10.336181640625, 10.6798095703125, 11.0234375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 12.0, 3.0, 11.0, 17.0, 18.0, 19.0, 21.0, 41.0, 37.0, 55.0, 84.0, 116.0, 161.0, 286.0, 461.0, 506.0, 571.0, 471.0, 369.0, 224.0, 173.0, 116.0, 67.0, 54.0, 40.0, 31.0, 23.0, 17.0, 18.0, 12.0, 12.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.07421875, -2.001373291015625, -1.92852783203125, -1.855682373046875, -1.7828369140625, -1.709991455078125, -1.63714599609375, -1.564300537109375, -1.491455078125, -1.418609619140625, -1.34576416015625, -1.272918701171875, -1.2000732421875, -1.127227783203125, -1.05438232421875, -0.981536865234375, -0.90869140625, -0.835845947265625, -0.76300048828125, -0.690155029296875, -0.6173095703125, -0.544464111328125, -0.47161865234375, -0.398773193359375, -0.325927734375, -0.253082275390625, -0.18023681640625, -0.107391357421875, -0.0345458984375, 0.038299560546875, 0.11114501953125, 0.183990478515625, 0.2568359375, 0.329681396484375, 0.40252685546875, 0.475372314453125, 0.5482177734375, 0.621063232421875, 0.69390869140625, 0.766754150390625, 0.839599609375, 0.912445068359375, 0.98529052734375, 1.058135986328125, 1.1309814453125, 1.203826904296875, 1.27667236328125, 1.349517822265625, 1.42236328125, 1.495208740234375, 1.56805419921875, 1.640899658203125, 1.7137451171875, 1.786590576171875, 1.85943603515625, 1.932281494140625, 2.005126953125, 2.077972412109375, 2.15081787109375, 2.223663330078125, 2.2965087890625, 2.369354248046875, 2.44219970703125, 2.515045166015625, 2.587890625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 5.0, 5.0, 2.0, 8.0, 9.0, 13.0, 12.0, 25.0, 36.0, 30.0, 41.0, 52.0, 66.0, 71.0, 73.0, 88.0, 86.0, 66.0, 58.0, 60.0, 46.0, 37.0, 25.0, 17.0, 22.0, 14.0, 8.0, 4.0, 3.0, 3.0, 4.0, 9.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.334240913391113, -8.072463989257812, -7.810688018798828, -7.5489115715026855, -7.287135124206543, -7.025358200073242, -6.7635817527771, -6.501805305480957, -6.2400288581848145, -5.978252410888672, -5.716475963592529, -5.454699516296387, -5.192922592163086, -4.931146621704102, -4.669369697570801, -4.407593250274658, -4.145816802978516, -3.884040355682373, -3.6222639083862305, -3.360487222671509, -3.098710775375366, -2.8369343280792236, -2.575157642364502, -2.3133811950683594, -2.051604747772217, -1.7898283004760742, -1.528051733970642, -1.26627516746521, -1.0044987201690674, -0.7427222728729248, -0.4809457063674927, -0.21916913986206055, 0.04260730743408203, 0.3043838143348694, 0.5661603212356567, 0.8279368281364441, 1.0897133350372314, 1.351489782333374, 1.6132663488388062, 1.8750429153442383, 2.136819362640381, 2.3985958099365234, 2.660372257232666, 2.9221489429473877, 3.1839253902435303, 3.445701837539673, 3.7074785232543945, 3.969254970550537, 4.23103141784668, 4.492807865142822, 4.754584312438965, 5.016360759735107, 5.27813720703125, 5.539914131164551, 5.801690578460693, 6.063467025756836, 6.3252434730529785, 6.587019920349121, 6.848796367645264, 7.110572814941406, 7.372349739074707, 7.634125709533691, 7.895902633666992, 8.157678604125977, 8.419455528259277]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 10.0, 12.0, 6.0, 19.0, 9.0, 21.0, 22.0, 26.0, 18.0, 23.0, 40.0, 27.0, 33.0, 46.0, 53.0, 45.0, 50.0, 36.0, 38.0, 48.0, 47.0, 43.0, 41.0, 38.0, 27.0, 41.0, 39.0, 21.0, 25.0, 26.0, 13.0, 10.0, 11.0, 11.0, 4.0, 7.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.693583965301514, -6.493732929229736, -6.293882369995117, -6.09403133392334, -5.894180774688721, -5.694329738616943, -5.494479179382324, -5.294628143310547, -5.0947771072387695, -4.894926071166992, -4.695075511932373, -4.495224475860596, -4.295373916625977, -4.095522880554199, -3.895672082901001, -3.6958212852478027, -3.4959707260131836, -3.2961199283599854, -3.096269130706787, -2.8964180946350098, -2.6965675354003906, -2.4967164993286133, -2.296865701675415, -2.097014904022217, -1.8971641063690186, -1.6973133087158203, -1.497462511062622, -1.2976115942001343, -1.097760796546936, -0.8979099988937378, -0.69805908203125, -0.49820828437805176, -0.2983570098876953, -0.09850618243217468, 0.10134464502334595, 0.30119550228118896, 0.5010462999343872, 0.7008970975875854, 0.9007480144500732, 1.1005988121032715, 1.3004496097564697, 1.500300407409668, 1.7001512050628662, 1.900002121925354, 2.099853038787842, 2.299703598022461, 2.4995546340942383, 2.6994054317474365, 2.8992562294006348, 3.099107027053833, 3.2989578247070312, 3.4988088607788086, 3.6986594200134277, 3.898510456085205, 4.098361015319824, 4.298212051391602, 4.498063087463379, 4.697914123535156, 4.897764682769775, 5.097615718841553, 5.297466278076172, 5.497317314147949, 5.697168350219727, 5.897018909454346, 6.096869468688965]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 13.0, 15.0, 7.0, 18.0, 29.0, 42.0, 64.0, 70.0, 149.0, 217.0, 370.0, 635.0, 1118.0, 1914.0, 3757.0, 8198.0, 21200.0, 72995.0, 287048.0, 441479.0, 147208.0, 37488.0, 12627.0, 5436.0, 2791.0, 1519.0, 834.0, 463.0, 306.0, 180.0, 118.0, 88.0, 43.0, 23.0, 21.0, 15.0, 12.0, 9.0, 6.0, 8.0, 3.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.884765625, -1.8280792236328125, -1.771392822265625, -1.7147064208984375, -1.65802001953125, -1.6013336181640625, -1.544647216796875, -1.4879608154296875, -1.4312744140625, -1.3745880126953125, -1.317901611328125, -1.2612152099609375, -1.20452880859375, -1.1478424072265625, -1.091156005859375, -1.0344696044921875, -0.977783203125, -0.9210968017578125, -0.864410400390625, -0.8077239990234375, -0.75103759765625, -0.6943511962890625, -0.637664794921875, -0.5809783935546875, -0.5242919921875, -0.4676055908203125, -0.410919189453125, -0.3542327880859375, -0.29754638671875, -0.2408599853515625, -0.184173583984375, -0.1274871826171875, -0.07080078125, -0.0141143798828125, 0.042572021484375, 0.0992584228515625, 0.15594482421875, 0.2126312255859375, 0.269317626953125, 0.3260040283203125, 0.3826904296875, 0.4393768310546875, 0.496063232421875, 0.5527496337890625, 0.60943603515625, 0.6661224365234375, 0.722808837890625, 0.7794952392578125, 0.836181640625, 0.8928680419921875, 0.949554443359375, 1.0062408447265625, 1.06292724609375, 1.1196136474609375, 1.176300048828125, 1.2329864501953125, 1.2896728515625, 1.3463592529296875, 1.403045654296875, 1.4597320556640625, 1.51641845703125, 1.5731048583984375, 1.629791259765625, 1.6864776611328125, 1.7431640625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 9.0, 15.0, 11.0, 21.0, 24.0, 18.0, 27.0, 36.0, 45.0, 35.0, 48.0, 48.0, 48.0, 56.0, 58.0, 71.0, 67.0, 61.0, 59.0, 40.0, 45.0, 39.0, 31.0, 26.0, 15.0, 11.0, 11.0, 9.0, 6.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8515625, -5.68267822265625, -5.5137939453125, -5.34490966796875, -5.176025390625, -5.00714111328125, -4.8382568359375, -4.66937255859375, -4.50048828125, -4.33160400390625, -4.1627197265625, -3.99383544921875, -3.824951171875, -3.65606689453125, -3.4871826171875, -3.31829833984375, -3.1494140625, -2.98052978515625, -2.8116455078125, -2.64276123046875, -2.473876953125, -2.30499267578125, -2.1361083984375, -1.96722412109375, -1.79833984375, -1.62945556640625, -1.4605712890625, -1.29168701171875, -1.122802734375, -0.95391845703125, -0.7850341796875, -0.61614990234375, -0.447265625, -0.27838134765625, -0.1094970703125, 0.05938720703125, 0.228271484375, 0.39715576171875, 0.5660400390625, 0.73492431640625, 0.90380859375, 1.07269287109375, 1.2415771484375, 1.41046142578125, 1.579345703125, 1.74822998046875, 1.9171142578125, 2.08599853515625, 2.2548828125, 2.42376708984375, 2.5926513671875, 2.76153564453125, 2.930419921875, 3.09930419921875, 3.2681884765625, 3.43707275390625, 3.60595703125, 3.77484130859375, 3.9437255859375, 4.11260986328125, 4.281494140625, 4.45037841796875, 4.6192626953125, 4.78814697265625, 4.95703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 3.0, 1.0, 5.0, 6.0, 8.0, 21.0, 21.0, 25.0, 40.0, 34.0, 69.0, 110.0, 154.0, 262.0, 509.0, 1026.0, 2207.0, 5653.0, 19159.0, 118855.0, 588824.0, 261446.0, 35484.0, 8537.0, 3142.0, 1332.0, 668.0, 341.0, 211.0, 139.0, 89.0, 50.0, 41.0, 17.0, 14.0, 10.0, 13.0, 9.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.197265625, -2.1279296875, -2.05859375, -1.9892578125, -1.919921875, -1.8505859375, -1.78125, -1.7119140625, -1.642578125, -1.5732421875, -1.50390625, -1.4345703125, -1.365234375, -1.2958984375, -1.2265625, -1.1572265625, -1.087890625, -1.0185546875, -0.94921875, -0.8798828125, -0.810546875, -0.7412109375, -0.671875, -0.6025390625, -0.533203125, -0.4638671875, -0.39453125, -0.3251953125, -0.255859375, -0.1865234375, -0.1171875, -0.0478515625, 0.021484375, 0.0908203125, 0.16015625, 0.2294921875, 0.298828125, 0.3681640625, 0.4375, 0.5068359375, 0.576171875, 0.6455078125, 0.71484375, 0.7841796875, 0.853515625, 0.9228515625, 0.9921875, 1.0615234375, 1.130859375, 1.2001953125, 1.26953125, 1.3388671875, 1.408203125, 1.4775390625, 1.546875, 1.6162109375, 1.685546875, 1.7548828125, 1.82421875, 1.8935546875, 1.962890625, 2.0322265625, 2.1015625, 2.1708984375, 2.240234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 11.0, 9.0, 13.0, 12.0, 13.0, 21.0, 29.0, 25.0, 33.0, 45.0, 49.0, 45.0, 52.0, 58.0, 62.0, 61.0, 66.0, 52.0, 60.0, 47.0, 49.0, 39.0, 41.0, 21.0, 22.0, 19.0, 16.0, 5.0, 8.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -11.03369140625, -10.7080078125, -10.38232421875, -10.056640625, -9.73095703125, -9.4052734375, -9.07958984375, -8.75390625, -8.42822265625, -8.1025390625, -7.77685546875, -7.451171875, -7.12548828125, -6.7998046875, -6.47412109375, -6.1484375, -5.82275390625, -5.4970703125, -5.17138671875, -4.845703125, -4.52001953125, -4.1943359375, -3.86865234375, -3.54296875, -3.21728515625, -2.8916015625, -2.56591796875, -2.240234375, -1.91455078125, -1.5888671875, -1.26318359375, -0.9375, -0.61181640625, -0.2861328125, 0.03955078125, 0.365234375, 0.69091796875, 1.0166015625, 1.34228515625, 1.66796875, 1.99365234375, 2.3193359375, 2.64501953125, 2.970703125, 3.29638671875, 3.6220703125, 3.94775390625, 4.2734375, 4.59912109375, 4.9248046875, 5.25048828125, 5.576171875, 5.90185546875, 6.2275390625, 6.55322265625, 6.87890625, 7.20458984375, 7.5302734375, 7.85595703125, 8.181640625, 8.50732421875, 8.8330078125, 9.15869140625, 9.484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 9.0, 13.0, 12.0, 20.0, 34.0, 32.0, 45.0, 66.0, 94.0, 178.0, 214.0, 333.0, 527.0, 849.0, 1427.0, 2463.0, 5027.0, 12357.0, 45031.0, 313604.0, 541353.0, 91007.0, 19308.0, 6863.0, 3133.0, 1705.0, 1024.0, 621.0, 376.0, 262.0, 176.0, 110.0, 85.0, 54.0, 40.0, 21.0, 17.0, 13.0, 13.0, 10.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0009765625, -0.9688873291015625, -0.936798095703125, -0.9047088623046875, -0.87261962890625, -0.8405303955078125, -0.808441162109375, -0.7763519287109375, -0.7442626953125, -0.7121734619140625, -0.680084228515625, -0.6479949951171875, -0.61590576171875, -0.5838165283203125, -0.551727294921875, -0.5196380615234375, -0.487548828125, -0.4554595947265625, -0.423370361328125, -0.3912811279296875, -0.35919189453125, -0.3271026611328125, -0.295013427734375, -0.2629241943359375, -0.2308349609375, -0.1987457275390625, -0.166656494140625, -0.1345672607421875, -0.10247802734375, -0.0703887939453125, -0.038299560546875, -0.0062103271484375, 0.02587890625, 0.0579681396484375, 0.090057373046875, 0.1221466064453125, 0.15423583984375, 0.1863250732421875, 0.218414306640625, 0.2505035400390625, 0.2825927734375, 0.3146820068359375, 0.346771240234375, 0.3788604736328125, 0.41094970703125, 0.4430389404296875, 0.475128173828125, 0.5072174072265625, 0.539306640625, 0.5713958740234375, 0.603485107421875, 0.6355743408203125, 0.66766357421875, 0.6997528076171875, 0.731842041015625, 0.7639312744140625, 0.7960205078125, 0.8281097412109375, 0.860198974609375, 0.8922882080078125, 0.92437744140625, 0.9564666748046875, 0.988555908203125, 1.0206451416015625, 1.052734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 1.0, 4.0, 8.0, 10.0, 9.0, 22.0, 31.0, 60.0, 101.0, 120.0, 177.0, 174.0, 105.0, 67.0, 46.0, 17.0, 13.0, 11.0, 6.0, 4.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007238388061523438, -0.0007029622793197632, -0.0006820857524871826, -0.000661209225654602, -0.0006403326988220215, -0.0006194561719894409, -0.0005985796451568604, -0.0005777031183242798, -0.0005568265914916992, -0.0005359500646591187, -0.0005150735378265381, -0.0004941970109939575, -0.00047332048416137695, -0.0004524439573287964, -0.0004315674304962158, -0.00041069090366363525, -0.0003898143768310547, -0.0003689378499984741, -0.00034806132316589355, -0.000327184796333313, -0.0003063082695007324, -0.00028543174266815186, -0.0002645552158355713, -0.00024367868900299072, -0.00022280216217041016, -0.0002019256353378296, -0.00018104910850524902, -0.00016017258167266846, -0.0001392960548400879, -0.00011841952800750732, -9.754300117492676e-05, -7.666647434234619e-05, -5.5789947509765625e-05, -3.491342067718506e-05, -1.4036893844604492e-05, 6.839632987976074e-06, 2.771615982055664e-05, 4.859268665313721e-05, 6.946921348571777e-05, 9.034574031829834e-05, 0.0001112222671508789, 0.00013209879398345947, 0.00015297532081604004, 0.0001738518476486206, 0.00019472837448120117, 0.00021560490131378174, 0.0002364814281463623, 0.00025735795497894287, 0.00027823448181152344, 0.000299111008644104, 0.00031998753547668457, 0.00034086406230926514, 0.0003617405891418457, 0.00038261711597442627, 0.00040349364280700684, 0.0004243701696395874, 0.00044524669647216797, 0.00046612322330474854, 0.0004869997501373291, 0.0005078762769699097, 0.0005287528038024902, 0.0005496293306350708, 0.0005705058574676514, 0.0005913823843002319, 0.0006122589111328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 6.0, 7.0, 12.0, 12.0, 25.0, 32.0, 40.0, 76.0, 106.0, 158.0, 239.0, 368.0, 640.0, 998.0, 1737.0, 3573.0, 8462.0, 25804.0, 118512.0, 513073.0, 294368.0, 54214.0, 14573.0, 5477.0, 2615.0, 1281.0, 791.0, 466.0, 299.0, 215.0, 138.0, 70.0, 51.0, 40.0, 29.0, 11.0, 9.0, 10.0, 9.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.98388671875, -0.9508285522460938, -0.9177703857421875, -0.8847122192382812, -0.851654052734375, -0.8185958862304688, -0.7855377197265625, -0.7524795532226562, -0.71942138671875, -0.6863632202148438, -0.6533050537109375, -0.6202468872070312, -0.587188720703125, -0.5541305541992188, -0.5210723876953125, -0.48801422119140625, -0.4549560546875, -0.42189788818359375, -0.3888397216796875, -0.35578155517578125, -0.322723388671875, -0.28966522216796875, -0.2566070556640625, -0.22354888916015625, -0.19049072265625, -0.15743255615234375, -0.1243743896484375, -0.09131622314453125, -0.058258056640625, -0.02519989013671875, 0.0078582763671875, 0.04091644287109375, 0.073974609375, 0.10703277587890625, 0.1400909423828125, 0.17314910888671875, 0.206207275390625, 0.23926544189453125, 0.2723236083984375, 0.30538177490234375, 0.33843994140625, 0.37149810791015625, 0.4045562744140625, 0.43761444091796875, 0.470672607421875, 0.5037307739257812, 0.5367889404296875, 0.5698471069335938, 0.6029052734375, 0.6359634399414062, 0.6690216064453125, 0.7020797729492188, 0.735137939453125, 0.7681961059570312, 0.8012542724609375, 0.8343124389648438, 0.86737060546875, 0.9004287719726562, 0.9334869384765625, 0.9665451049804688, 0.999603271484375, 1.0326614379882812, 1.0657196044921875, 1.0987777709960938, 1.1318359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 3.0, 10.0, 13.0, 17.0, 32.0, 32.0, 74.0, 92.0, 143.0, 119.0, 111.0, 105.0, 83.0, 52.0, 30.0, 27.0, 15.0, 12.0, 6.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.332763671875, -0.32259368896484375, -0.3124237060546875, -0.30225372314453125, -0.292083740234375, -0.28191375732421875, -0.2717437744140625, -0.26157379150390625, -0.25140380859375, -0.24123382568359375, -0.2310638427734375, -0.22089385986328125, -0.210723876953125, -0.20055389404296875, -0.1903839111328125, -0.18021392822265625, -0.1700439453125, -0.15987396240234375, -0.1497039794921875, -0.13953399658203125, -0.129364013671875, -0.11919403076171875, -0.1090240478515625, -0.09885406494140625, -0.08868408203125, -0.07851409912109375, -0.0683441162109375, -0.05817413330078125, -0.048004150390625, -0.03783416748046875, -0.0276641845703125, -0.01749420166015625, -0.00732421875, 0.00284576416015625, 0.0130157470703125, 0.02318572998046875, 0.033355712890625, 0.04352569580078125, 0.0536956787109375, 0.06386566162109375, 0.07403564453125, 0.08420562744140625, 0.0943756103515625, 0.10454559326171875, 0.114715576171875, 0.12488555908203125, 0.1350555419921875, 0.14522552490234375, 0.1553955078125, 0.16556549072265625, 0.1757354736328125, 0.18590545654296875, 0.196075439453125, 0.20624542236328125, 0.2164154052734375, 0.22658538818359375, 0.23675537109375, 0.24692535400390625, 0.2570953369140625, 0.26726531982421875, 0.277435302734375, 0.28760528564453125, 0.2977752685546875, 0.30794525146484375, 0.318115234375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 5.0, 6.0, 14.0, 14.0, 21.0, 22.0, 35.0, 39.0, 50.0, 74.0, 93.0, 95.0, 97.0, 82.0, 89.0, 65.0, 57.0, 33.0, 23.0, 29.0, 15.0, 8.0, 6.0, 6.0, 6.0, 0.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.003165245056152, -5.817866325378418, -5.632567405700684, -5.447268009185791, -5.261969089508057, -5.076670169830322, -4.89137077331543, -4.706071853637695, -4.520772933959961, -4.335474014282227, -4.150175094604492, -3.9648756980895996, -3.7795767784118652, -3.594277858734131, -3.4089787006378174, -3.223679542541504, -3.0383806228637695, -2.853081703186035, -2.6677825450897217, -2.482483386993408, -2.297184467315674, -2.1118855476379395, -1.926586389541626, -1.741287350654602, -1.5559883117675781, -1.3706892728805542, -1.1853902339935303, -1.0000911951065063, -0.8147921562194824, -0.6294931173324585, -0.44419407844543457, -0.25889503955841064, -0.07359600067138672, 0.11170303821563721, 0.29700207710266113, 0.48230111598968506, 0.667600154876709, 0.8528991937637329, 1.0381982326507568, 1.2234972715377808, 1.4087963104248047, 1.5940953493118286, 1.7793943881988525, 1.9646934270858765, 2.1499924659729004, 2.3352913856506348, 2.5205905437469482, 2.7058897018432617, 2.891188621520996, 3.0764875411987305, 3.261786699295044, 3.4470858573913574, 3.632384777069092, 3.817683696746826, 4.002983093261719, 4.188282012939453, 4.3735809326171875, 4.558879852294922, 4.744178771972656, 4.929478168487549, 5.114777088165283, 5.300076007843018, 5.48537540435791, 5.6706743240356445, 5.855973243713379]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 8.0, 8.0, 13.0, 14.0, 24.0, 14.0, 25.0, 22.0, 34.0, 32.0, 43.0, 34.0, 57.0, 57.0, 57.0, 50.0, 56.0, 54.0, 52.0, 47.0, 39.0, 41.0, 44.0, 38.0, 26.0, 29.0, 27.0, 8.0, 11.0, 12.0, 6.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.792591571807861, -4.647952079772949, -4.503312587738037, -4.358673572540283, -4.214034080505371, -4.069394588470459, -3.924755096435547, -3.7801156044006348, -3.6354763507843018, -3.4908368587493896, -3.3461976051330566, -3.2015581130981445, -3.0569186210632324, -2.9122793674468994, -2.7676398754119873, -2.6230006217956543, -2.478361129760742, -2.33372163772583, -2.189082384109497, -2.044442892074585, -1.8998035192489624, -1.7551641464233398, -1.6105246543884277, -1.4658852815628052, -1.3212459087371826, -1.17660653591156, -1.0319671630859375, -0.8873276710510254, -0.7426882982254028, -0.5980489253997803, -0.45340949296951294, -0.3087700605392456, -0.16413068771362305, -0.0194912850856781, 0.12514811754226685, 0.2697875201702118, 0.41442692279815674, 0.5590662956237793, 0.7037057280540466, 0.848345160484314, 0.9929845333099365, 1.137623906135559, 1.2822632789611816, 1.4269027709960938, 1.5715421438217163, 1.7161815166473389, 1.860821008682251, 2.005460262298584, 2.150099754333496, 2.294739246368408, 2.439378499984741, 2.5840179920196533, 2.7286572456359863, 2.8732967376708984, 3.0179362297058105, 3.1625757217407227, 3.3072149753570557, 3.4518544673919678, 3.596493721008301, 3.741133213043213, 3.885772705078125, 4.030411720275879, 4.175051212310791, 4.319690704345703, 4.464330196380615]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 8.0, 9.0, 13.0, 25.0, 30.0, 38.0, 65.0, 85.0, 133.0, 208.0, 323.0, 485.0, 1034.0, 1845.0, 3432.0, 6928.0, 15274.0, 37343.0, 142395.0, 622109.0, 147676.0, 38660.0, 15509.0, 7003.0, 3492.0, 1887.0, 1011.0, 575.0, 298.0, 229.0, 134.0, 92.0, 49.0, 40.0, 22.0, 21.0, 23.0, 12.0, 13.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0], "bins": [-4.09375, -3.975128173828125, -3.85650634765625, -3.737884521484375, -3.6192626953125, -3.500640869140625, -3.38201904296875, -3.263397216796875, -3.144775390625, -3.026153564453125, -2.90753173828125, -2.788909912109375, -2.6702880859375, -2.551666259765625, -2.43304443359375, -2.314422607421875, -2.19580078125, -2.077178955078125, -1.95855712890625, -1.839935302734375, -1.7213134765625, -1.602691650390625, -1.48406982421875, -1.365447998046875, -1.246826171875, -1.128204345703125, -1.00958251953125, -0.890960693359375, -0.7723388671875, -0.653717041015625, -0.53509521484375, -0.416473388671875, -0.2978515625, -0.179229736328125, -0.06060791015625, 0.058013916015625, 0.1766357421875, 0.295257568359375, 0.41387939453125, 0.532501220703125, 0.651123046875, 0.769744873046875, 0.88836669921875, 1.006988525390625, 1.1256103515625, 1.244232177734375, 1.36285400390625, 1.481475830078125, 1.60009765625, 1.718719482421875, 1.83734130859375, 1.955963134765625, 2.0745849609375, 2.193206787109375, 2.31182861328125, 2.430450439453125, 2.549072265625, 2.667694091796875, 2.78631591796875, 2.904937744140625, 3.0235595703125, 3.142181396484375, 3.26080322265625, 3.379425048828125, 3.498046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 5.0, 7.0, 9.0, 18.0, 16.0, 17.0, 18.0, 24.0, 35.0, 20.0, 37.0, 48.0, 47.0, 54.0, 51.0, 63.0, 37.0, 66.0, 48.0, 46.0, 48.0, 44.0, 46.0, 34.0, 33.0, 26.0, 24.0, 18.0, 13.0, 9.0, 13.0, 6.0, 8.0, 1.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-10.203125, -9.9088134765625, -9.614501953125, -9.3201904296875, -9.02587890625, -8.7315673828125, -8.437255859375, -8.1429443359375, -7.8486328125, -7.5543212890625, -7.260009765625, -6.9656982421875, -6.67138671875, -6.3770751953125, -6.082763671875, -5.7884521484375, -5.494140625, -5.1998291015625, -4.905517578125, -4.6112060546875, -4.31689453125, -4.0225830078125, -3.728271484375, -3.4339599609375, -3.1396484375, -2.8453369140625, -2.551025390625, -2.2567138671875, -1.96240234375, -1.6680908203125, -1.373779296875, -1.0794677734375, -0.78515625, -0.4908447265625, -0.196533203125, 0.0977783203125, 0.39208984375, 0.6864013671875, 0.980712890625, 1.2750244140625, 1.5693359375, 1.8636474609375, 2.157958984375, 2.4522705078125, 2.74658203125, 3.0408935546875, 3.335205078125, 3.6295166015625, 3.923828125, 4.2181396484375, 4.512451171875, 4.8067626953125, 5.10107421875, 5.3953857421875, 5.689697265625, 5.9840087890625, 6.2783203125, 6.5726318359375, 6.866943359375, 7.1612548828125, 7.45556640625, 7.7498779296875, 8.044189453125, 8.3385009765625, 8.6328125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 1.0, 8.0, 12.0, 13.0, 19.0, 23.0, 46.0, 47.0, 59.0, 75.0, 261.0, 6720.0, 1026567.0, 14029.0, 327.0, 111.0, 70.0, 42.0, 50.0, 20.0, 17.0, 12.0, 8.0, 3.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.4375, -27.59033203125, -26.7431640625, -25.89599609375, -25.048828125, -24.20166015625, -23.3544921875, -22.50732421875, -21.66015625, -20.81298828125, -19.9658203125, -19.11865234375, -18.271484375, -17.42431640625, -16.5771484375, -15.72998046875, -14.8828125, -14.03564453125, -13.1884765625, -12.34130859375, -11.494140625, -10.64697265625, -9.7998046875, -8.95263671875, -8.10546875, -7.25830078125, -6.4111328125, -5.56396484375, -4.716796875, -3.86962890625, -3.0224609375, -2.17529296875, -1.328125, -0.48095703125, 0.3662109375, 1.21337890625, 2.060546875, 2.90771484375, 3.7548828125, 4.60205078125, 5.44921875, 6.29638671875, 7.1435546875, 7.99072265625, 8.837890625, 9.68505859375, 10.5322265625, 11.37939453125, 12.2265625, 13.07373046875, 13.9208984375, 14.76806640625, 15.615234375, 16.46240234375, 17.3095703125, 18.15673828125, 19.00390625, 19.85107421875, 20.6982421875, 21.54541015625, 22.392578125, 23.23974609375, 24.0869140625, 24.93408203125, 25.78125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 4.0, 5.0, 5.0, 8.0, 12.0, 15.0, 19.0, 24.0, 32.0, 35.0, 59.0, 54.0, 65.0, 75.0, 76.0, 74.0, 86.0, 82.0, 56.0, 58.0, 54.0, 31.0, 22.0, 14.0, 11.0, 13.0, 4.0, 4.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.28125, -16.756103515625, -16.23095703125, -15.705810546875, -15.1806640625, -14.655517578125, -14.13037109375, -13.605224609375, -13.080078125, -12.554931640625, -12.02978515625, -11.504638671875, -10.9794921875, -10.454345703125, -9.92919921875, -9.404052734375, -8.87890625, -8.353759765625, -7.82861328125, -7.303466796875, -6.7783203125, -6.253173828125, -5.72802734375, -5.202880859375, -4.677734375, -4.152587890625, -3.62744140625, -3.102294921875, -2.5771484375, -2.052001953125, -1.52685546875, -1.001708984375, -0.4765625, 0.048583984375, 0.57373046875, 1.098876953125, 1.6240234375, 2.149169921875, 2.67431640625, 3.199462890625, 3.724609375, 4.249755859375, 4.77490234375, 5.300048828125, 5.8251953125, 6.350341796875, 6.87548828125, 7.400634765625, 7.92578125, 8.450927734375, 8.97607421875, 9.501220703125, 10.0263671875, 10.551513671875, 11.07666015625, 11.601806640625, 12.126953125, 12.652099609375, 13.17724609375, 13.702392578125, 14.2275390625, 14.752685546875, 15.27783203125, 15.802978515625, 16.328125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 3.0, 6.0, 13.0, 30.0, 29.0, 50.0, 134.0, 294.0, 952.0, 4428.0, 51788.0, 877371.0, 104455.0, 7015.0, 1267.0, 414.0, 127.0, 64.0, 35.0, 28.0, 12.0, 12.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.60546875, -2.523040771484375, -2.44061279296875, -2.358184814453125, -2.2757568359375, -2.193328857421875, -2.11090087890625, -2.028472900390625, -1.946044921875, -1.863616943359375, -1.78118896484375, -1.698760986328125, -1.6163330078125, -1.533905029296875, -1.45147705078125, -1.369049072265625, -1.28662109375, -1.204193115234375, -1.12176513671875, -1.039337158203125, -0.9569091796875, -0.874481201171875, -0.79205322265625, -0.709625244140625, -0.627197265625, -0.544769287109375, -0.46234130859375, -0.379913330078125, -0.2974853515625, -0.215057373046875, -0.13262939453125, -0.050201416015625, 0.0322265625, 0.114654541015625, 0.19708251953125, 0.279510498046875, 0.3619384765625, 0.444366455078125, 0.52679443359375, 0.609222412109375, 0.691650390625, 0.774078369140625, 0.85650634765625, 0.938934326171875, 1.0213623046875, 1.103790283203125, 1.18621826171875, 1.268646240234375, 1.35107421875, 1.433502197265625, 1.51593017578125, 1.598358154296875, 1.6807861328125, 1.763214111328125, 1.84564208984375, 1.928070068359375, 2.010498046875, 2.092926025390625, 2.17535400390625, 2.257781982421875, 2.3402099609375, 2.422637939453125, 2.50506591796875, 2.587493896484375, 2.669921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 14.0, 12.0, 6.0, 11.0, 17.0, 18.0, 24.0, 33.0, 44.0, 58.0, 94.0, 180.0, 150.0, 88.0, 54.0, 56.0, 26.0, 34.0, 26.0, 16.0, 10.0, 10.0, 5.0, 8.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001659393310546875, -0.00015866756439208984, -0.0001513957977294922, -0.00014412403106689453, -0.00013685226440429688, -0.00012958049774169922, -0.00012230873107910156, -0.0001150369644165039, -0.00010776519775390625, -0.0001004934310913086, -9.322166442871094e-05, -8.594989776611328e-05, -7.867813110351562e-05, -7.140636444091797e-05, -6.413459777832031e-05, -5.6862831115722656e-05, -4.9591064453125e-05, -4.2319297790527344e-05, -3.504753112792969e-05, -2.777576446533203e-05, -2.0503997802734375e-05, -1.3232231140136719e-05, -5.9604644775390625e-06, 1.3113021850585938e-06, 8.58306884765625e-06, 1.5854835510253906e-05, 2.3126602172851562e-05, 3.039836883544922e-05, 3.7670135498046875e-05, 4.494190216064453e-05, 5.221366882324219e-05, 5.9485435485839844e-05, 6.67572021484375e-05, 7.402896881103516e-05, 8.130073547363281e-05, 8.857250213623047e-05, 9.584426879882812e-05, 0.00010311603546142578, 0.00011038780212402344, 0.0001176595687866211, 0.00012493133544921875, 0.0001322031021118164, 0.00013947486877441406, 0.00014674663543701172, 0.00015401840209960938, 0.00016129016876220703, 0.0001685619354248047, 0.00017583370208740234, 0.00018310546875, 0.00019037723541259766, 0.0001976490020751953, 0.00020492076873779297, 0.00021219253540039062, 0.00021946430206298828, 0.00022673606872558594, 0.0002340078353881836, 0.00024127960205078125, 0.0002485513687133789, 0.00025582313537597656, 0.0002630949020385742, 0.0002703666687011719, 0.00027763843536376953, 0.0002849102020263672, 0.00029218196868896484, 0.0002994537353515625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 5.0, 6.0, 14.0, 21.0, 32.0, 43.0, 73.0, 118.0, 254.0, 428.0, 1098.0, 2965.0, 10747.0, 60660.0, 642532.0, 283239.0, 35243.0, 7178.0, 2220.0, 811.0, 371.0, 172.0, 104.0, 68.0, 51.0, 28.0, 19.0, 13.0, 15.0, 5.0, 10.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8349609375, -1.77911376953125, -1.7232666015625, -1.66741943359375, -1.611572265625, -1.55572509765625, -1.4998779296875, -1.44403076171875, -1.38818359375, -1.33233642578125, -1.2764892578125, -1.22064208984375, -1.164794921875, -1.10894775390625, -1.0531005859375, -0.99725341796875, -0.94140625, -0.88555908203125, -0.8297119140625, -0.77386474609375, -0.718017578125, -0.66217041015625, -0.6063232421875, -0.55047607421875, -0.49462890625, -0.43878173828125, -0.3829345703125, -0.32708740234375, -0.271240234375, -0.21539306640625, -0.1595458984375, -0.10369873046875, -0.0478515625, 0.00799560546875, 0.0638427734375, 0.11968994140625, 0.175537109375, 0.23138427734375, 0.2872314453125, 0.34307861328125, 0.39892578125, 0.45477294921875, 0.5106201171875, 0.56646728515625, 0.622314453125, 0.67816162109375, 0.7340087890625, 0.78985595703125, 0.845703125, 0.90155029296875, 0.9573974609375, 1.01324462890625, 1.069091796875, 1.12493896484375, 1.1807861328125, 1.23663330078125, 1.29248046875, 1.34832763671875, 1.4041748046875, 1.46002197265625, 1.515869140625, 1.57171630859375, 1.6275634765625, 1.68341064453125, 1.7392578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 4.0, 11.0, 11.0, 21.0, 22.0, 28.0, 42.0, 66.0, 86.0, 210.0, 177.0, 78.0, 71.0, 48.0, 31.0, 22.0, 19.0, 10.0, 6.0, 5.0, 4.0, 8.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84765625, -0.8193893432617188, -0.7911224365234375, -0.7628555297851562, -0.734588623046875, -0.7063217163085938, -0.6780548095703125, -0.6497879028320312, -0.62152099609375, -0.5932540893554688, -0.5649871826171875, -0.5367202758789062, -0.508453369140625, -0.48018646240234375, -0.4519195556640625, -0.42365264892578125, -0.3953857421875, -0.36711883544921875, -0.3388519287109375, -0.31058502197265625, -0.282318115234375, -0.25405120849609375, -0.2257843017578125, -0.19751739501953125, -0.16925048828125, -0.14098358154296875, -0.1127166748046875, -0.08444976806640625, -0.056182861328125, -0.02791595458984375, 0.0003509521484375, 0.02861785888671875, 0.056884765625, 0.08515167236328125, 0.1134185791015625, 0.14168548583984375, 0.169952392578125, 0.19821929931640625, 0.2264862060546875, 0.25475311279296875, 0.28302001953125, 0.31128692626953125, 0.3395538330078125, 0.36782073974609375, 0.396087646484375, 0.42435455322265625, 0.4526214599609375, 0.48088836669921875, 0.5091552734375, 0.5374221801757812, 0.5656890869140625, 0.5939559936523438, 0.622222900390625, 0.6504898071289062, 0.6787567138671875, 0.7070236206054688, 0.73529052734375, 0.7635574340820312, 0.7918243408203125, 0.8200912475585938, 0.848358154296875, 0.8766250610351562, 0.9048919677734375, 0.9331588745117188, 0.96142578125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 9.0, 15.0, 51.0, 124.0, 286.0, 304.0, 142.0, 54.0, 16.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.22747039794922, -20.92431640625, -19.621164321899414, -18.318012237548828, -17.01485824584961, -15.711705207824707, -14.408552169799805, -13.105399131774902, -11.80224609375, -10.499093055725098, -9.195940017700195, -7.892786979675293, -6.589633941650391, -5.286480903625488, -3.983327865600586, -2.6801748275756836, -1.3770217895507812, -0.0738687515258789, 1.2292842864990234, 2.532437324523926, 3.835590362548828, 5.1387434005737305, 6.441896438598633, 7.745049476623535, 9.048202514648438, 10.35135555267334, 11.654508590698242, 12.957661628723145, 14.260814666748047, 15.56396770477295, 16.86712074279785, 18.170272827148438, 19.473426818847656, 20.776580810546875, 22.07973289489746, 23.382884979248047, 24.686038970947266, 25.989192962646484, 27.29234504699707, 28.595497131347656, 29.898651123046875, 31.201805114746094, 32.50495910644531, 33.808109283447266, 35.111263275146484, 36.4144172668457, 37.717567443847656, 39.020721435546875, 40.323875427246094, 41.62702941894531, 42.93018341064453, 44.233333587646484, 45.5364875793457, 46.83964157104492, 48.142791748046875, 49.445945739746094, 50.74909973144531, 52.05225372314453, 53.35540771484375, 54.6585578918457, 55.96171188354492, 57.26486587524414, 58.568016052246094, 59.87117004394531, 61.17432403564453]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 7.0, 11.0, 6.0, 17.0, 8.0, 8.0, 12.0, 21.0, 32.0, 21.0, 23.0, 26.0, 31.0, 23.0, 25.0, 30.0, 43.0, 37.0, 40.0, 37.0, 47.0, 38.0, 33.0, 51.0, 44.0, 33.0, 28.0, 33.0, 31.0, 28.0, 22.0, 22.0, 21.0, 17.0, 21.0, 12.0, 4.0, 18.0, 11.0, 3.0, 6.0, 9.0, 6.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.924169540405273, -12.483590126037598, -12.043009757995605, -11.60243034362793, -11.161849975585938, -10.721270561218262, -10.280691146850586, -9.840110778808594, -9.399531364440918, -8.958951950073242, -8.51837158203125, -8.077792167663574, -7.63721227645874, -7.196632385253906, -6.756052494049072, -6.315472602844238, -5.874892711639404, -5.43431282043457, -4.993732929229736, -4.553153038024902, -4.112573623657227, -3.6719937324523926, -3.2314138412475586, -2.7908341884613037, -2.3502542972564697, -1.9096745252609253, -1.4690947532653809, -1.0285148620605469, -0.5879350900650024, -0.147355318069458, 0.293224573135376, 0.7338042259216309, 1.1743841171264648, 1.6149638891220093, 2.0555436611175537, 2.4961235523223877, 2.9367032051086426, 3.3772830963134766, 3.8178629875183105, 4.2584428787231445, 4.69902229309082, 5.139602184295654, 5.580182075500488, 6.020761489868164, 6.461341381072998, 6.901921272277832, 7.342501163482666, 7.7830810546875, 8.223661422729492, 8.664240837097168, 9.10482120513916, 9.545400619506836, 9.985980987548828, 10.426560401916504, 10.86713981628418, 11.307720184326172, 11.748299598693848, 12.188879013061523, 12.629459381103516, 13.070038795471191, 13.510619163513184, 13.95119857788086, 14.391778945922852, 14.832358360290527, 15.272937774658203]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 7.0, 2.0, 14.0, 13.0, 10.0, 10.0, 16.0, 20.0, 39.0, 43.0, 49.0, 89.0, 113.0, 241.0, 436.0, 998.0, 2277.0, 6915.0, 33747.0, 473932.0, 3380103.0, 262922.0, 23156.0, 5407.0, 1900.0, 754.0, 398.0, 220.0, 131.0, 102.0, 58.0, 36.0, 37.0, 18.0, 26.0, 13.0, 7.0, 11.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9609375, -10.5882568359375, -10.215576171875, -9.8428955078125, -9.47021484375, -9.0975341796875, -8.724853515625, -8.3521728515625, -7.9794921875, -7.6068115234375, -7.234130859375, -6.8614501953125, -6.48876953125, -6.1160888671875, -5.743408203125, -5.3707275390625, -4.998046875, -4.6253662109375, -4.252685546875, -3.8800048828125, -3.50732421875, -3.1346435546875, -2.761962890625, -2.3892822265625, -2.0166015625, -1.6439208984375, -1.271240234375, -0.8985595703125, -0.52587890625, -0.1531982421875, 0.219482421875, 0.5921630859375, 0.96484375, 1.3375244140625, 1.710205078125, 2.0828857421875, 2.45556640625, 2.8282470703125, 3.200927734375, 3.5736083984375, 3.9462890625, 4.3189697265625, 4.691650390625, 5.0643310546875, 5.43701171875, 5.8096923828125, 6.182373046875, 6.5550537109375, 6.927734375, 7.3004150390625, 7.673095703125, 8.0457763671875, 8.41845703125, 8.7911376953125, 9.163818359375, 9.5364990234375, 9.9091796875, 10.2818603515625, 10.654541015625, 11.0272216796875, 11.39990234375, 11.7725830078125, 12.145263671875, 12.5179443359375, 12.890625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 12.0, 16.0, 6.0, 17.0, 21.0, 26.0, 22.0, 35.0, 32.0, 41.0, 45.0, 48.0, 61.0, 72.0, 61.0, 66.0, 54.0, 43.0, 52.0, 52.0, 34.0, 48.0, 25.0, 21.0, 24.0, 16.0, 12.0, 11.0, 7.0, 8.0, 2.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.12109375, -4.94317626953125, -4.7652587890625, -4.58734130859375, -4.409423828125, -4.23150634765625, -4.0535888671875, -3.87567138671875, -3.69775390625, -3.51983642578125, -3.3419189453125, -3.16400146484375, -2.986083984375, -2.80816650390625, -2.6302490234375, -2.45233154296875, -2.2744140625, -2.09649658203125, -1.9185791015625, -1.74066162109375, -1.562744140625, -1.38482666015625, -1.2069091796875, -1.02899169921875, -0.85107421875, -0.67315673828125, -0.4952392578125, -0.31732177734375, -0.139404296875, 0.03851318359375, 0.2164306640625, 0.39434814453125, 0.572265625, 0.75018310546875, 0.9281005859375, 1.10601806640625, 1.283935546875, 1.46185302734375, 1.6397705078125, 1.81768798828125, 1.99560546875, 2.17352294921875, 2.3514404296875, 2.52935791015625, 2.707275390625, 2.88519287109375, 3.0631103515625, 3.24102783203125, 3.4189453125, 3.59686279296875, 3.7747802734375, 3.95269775390625, 4.130615234375, 4.30853271484375, 4.4864501953125, 4.66436767578125, 4.84228515625, 5.02020263671875, 5.1981201171875, 5.37603759765625, 5.553955078125, 5.73187255859375, 5.9097900390625, 6.08770751953125, 6.265625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 15.0, 19.0, 16.0, 36.0, 94.0, 173.0, 465.0, 1386.0, 6255.0, 52703.0, 2954886.0, 1141646.0, 30541.0, 4266.0, 1069.0, 347.0, 166.0, 70.0, 41.0, 30.0, 20.0, 7.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0], "bins": [-22.125, -21.6429443359375, -21.160888671875, -20.6788330078125, -20.19677734375, -19.7147216796875, -19.232666015625, -18.7506103515625, -18.2685546875, -17.7864990234375, -17.304443359375, -16.8223876953125, -16.34033203125, -15.8582763671875, -15.376220703125, -14.8941650390625, -14.412109375, -13.9300537109375, -13.447998046875, -12.9659423828125, -12.48388671875, -12.0018310546875, -11.519775390625, -11.0377197265625, -10.5556640625, -10.0736083984375, -9.591552734375, -9.1094970703125, -8.62744140625, -8.1453857421875, -7.663330078125, -7.1812744140625, -6.69921875, -6.2171630859375, -5.735107421875, -5.2530517578125, -4.77099609375, -4.2889404296875, -3.806884765625, -3.3248291015625, -2.8427734375, -2.3607177734375, -1.878662109375, -1.3966064453125, -0.91455078125, -0.4324951171875, 0.049560546875, 0.5316162109375, 1.013671875, 1.4957275390625, 1.977783203125, 2.4598388671875, 2.94189453125, 3.4239501953125, 3.906005859375, 4.3880615234375, 4.8701171875, 5.3521728515625, 5.834228515625, 6.3162841796875, 6.79833984375, 7.2803955078125, 7.762451171875, 8.2445068359375, 8.7265625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 13.0, 12.0, 15.0, 18.0, 27.0, 56.0, 79.0, 129.0, 215.0, 350.0, 629.0, 845.0, 703.0, 397.0, 219.0, 126.0, 83.0, 51.0, 32.0, 25.0, 23.0, 2.0, 10.0, 5.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.298828125, -2.192291259765625, -2.08575439453125, -1.979217529296875, -1.8726806640625, -1.766143798828125, -1.65960693359375, -1.553070068359375, -1.446533203125, -1.339996337890625, -1.23345947265625, -1.126922607421875, -1.0203857421875, -0.913848876953125, -0.80731201171875, -0.700775146484375, -0.59423828125, -0.487701416015625, -0.38116455078125, -0.274627685546875, -0.1680908203125, -0.061553955078125, 0.04498291015625, 0.151519775390625, 0.258056640625, 0.364593505859375, 0.47113037109375, 0.577667236328125, 0.6842041015625, 0.790740966796875, 0.89727783203125, 1.003814697265625, 1.1103515625, 1.216888427734375, 1.32342529296875, 1.429962158203125, 1.5364990234375, 1.643035888671875, 1.74957275390625, 1.856109619140625, 1.962646484375, 2.069183349609375, 2.17572021484375, 2.282257080078125, 2.3887939453125, 2.495330810546875, 2.60186767578125, 2.708404541015625, 2.81494140625, 2.921478271484375, 3.02801513671875, 3.134552001953125, 3.2410888671875, 3.347625732421875, 3.45416259765625, 3.560699462890625, 3.667236328125, 3.773773193359375, 3.88031005859375, 3.986846923828125, 4.0933837890625, 4.199920654296875, 4.30645751953125, 4.412994384765625, 4.51953125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 10.0, 14.0, 19.0, 23.0, 40.0, 57.0, 87.0, 85.0, 119.0, 111.0, 84.0, 83.0, 78.0, 66.0, 40.0, 26.0, 16.0, 15.0, 10.0, 7.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-15.659774780273438, -15.306262969970703, -14.952751159667969, -14.599238395690918, -14.245726585388184, -13.89221477508545, -13.538702011108398, -13.185190200805664, -12.83167839050293, -12.478166580200195, -12.124654769897461, -11.77114200592041, -11.417630195617676, -11.064118385314941, -10.71060562133789, -10.357093811035156, -10.003582000732422, -9.650070190429688, -9.296558380126953, -8.943045616149902, -8.589533805847168, -8.236021995544434, -7.882509708404541, -7.528997421264648, -7.175485610961914, -6.82197380065918, -6.468461513519287, -6.1149492263793945, -5.76143741607666, -5.407925605773926, -5.054413318634033, -4.700901031494141, -4.347388744354248, -3.9938766956329346, -3.640364646911621, -3.2868525981903076, -2.933340549468994, -2.5798285007476807, -2.226316452026367, -1.8728044033050537, -1.5192923545837402, -1.1657803058624268, -0.8122682571411133, -0.4587562084197998, -0.10524415969848633, 0.24826788902282715, 0.6017799377441406, 0.9552919864654541, 1.3088040351867676, 1.662316083908081, 2.0158281326293945, 2.369340181350708, 2.7228522300720215, 3.076364278793335, 3.4298763275146484, 3.783388376235962, 4.136900424957275, 4.490412712097168, 4.843924522399902, 5.197436332702637, 5.550948619842529, 5.904460906982422, 6.257972717285156, 6.611484527587891, 6.964996814727783]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 6.0, 5.0, 7.0, 13.0, 10.0, 9.0, 21.0, 19.0, 12.0, 25.0, 24.0, 29.0, 23.0, 34.0, 30.0, 23.0, 34.0, 41.0, 40.0, 38.0, 51.0, 46.0, 52.0, 31.0, 35.0, 37.0, 36.0, 27.0, 28.0, 23.0, 27.0, 19.0, 31.0, 18.0, 21.0, 20.0, 14.0, 6.0, 13.0, 4.0, 6.0, 3.0, 0.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.379697322845459, -5.215372562408447, -5.0510478019714355, -4.886722564697266, -4.722397804260254, -4.558073043823242, -4.3937482833862305, -4.229423522949219, -4.065098762512207, -3.9007740020751953, -3.7364490032196045, -3.5721242427825928, -3.407799243927002, -3.2434744834899902, -3.0791497230529785, -2.914824962615967, -2.750499725341797, -2.586174964904785, -2.4218499660491943, -2.2575252056121826, -2.093200206756592, -1.92887544631958, -1.7645506858825684, -1.600225806236267, -1.4359009265899658, -1.2715760469436646, -1.1072511672973633, -0.9429264068603516, -0.7786015272140503, -0.614276647567749, -0.44995182752609253, -0.28562700748443604, -0.12130260467529297, 0.04302224516868591, 0.2073470950126648, 0.3716719448566437, 0.5359967947006226, 0.7003216743469238, 0.8646464943885803, 1.0289713144302368, 1.193296194076538, 1.3576210737228394, 1.5219459533691406, 1.6862707138061523, 1.8505955934524536, 2.014920473098755, 2.1792452335357666, 2.3435702323913574, 2.507894992828369, 2.672219753265381, 2.8365447521209717, 3.0008695125579834, 3.165194511413574, 3.329519271850586, 3.4938440322875977, 3.6581687927246094, 3.8224937915802, 3.986818552017212, 4.151143550872803, 4.3154683113098145, 4.479793071746826, 4.644118309020996, 4.808443069458008, 4.9727678298950195, 5.137092590332031]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 0.0, 6.0, 6.0, 7.0, 13.0, 15.0, 26.0, 43.0, 76.0, 125.0, 194.0, 300.0, 467.0, 898.0, 1537.0, 2649.0, 5274.0, 12943.0, 51575.0, 427846.0, 463352.0, 55800.0, 13374.0, 5535.0, 2823.0, 1490.0, 860.0, 508.0, 307.0, 203.0, 111.0, 75.0, 31.0, 30.0, 21.0, 11.0, 12.0, 4.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.578125, -3.481475830078125, -3.38482666015625, -3.288177490234375, -3.1915283203125, -3.094879150390625, -2.99822998046875, -2.901580810546875, -2.804931640625, -2.708282470703125, -2.61163330078125, -2.514984130859375, -2.4183349609375, -2.321685791015625, -2.22503662109375, -2.128387451171875, -2.03173828125, -1.935089111328125, -1.83843994140625, -1.741790771484375, -1.6451416015625, -1.548492431640625, -1.45184326171875, -1.355194091796875, -1.258544921875, -1.161895751953125, -1.06524658203125, -0.968597412109375, -0.8719482421875, -0.775299072265625, -0.67864990234375, -0.582000732421875, -0.4853515625, -0.388702392578125, -0.29205322265625, -0.195404052734375, -0.0987548828125, -0.002105712890625, 0.09454345703125, 0.191192626953125, 0.287841796875, 0.384490966796875, 0.48114013671875, 0.577789306640625, 0.6744384765625, 0.771087646484375, 0.86773681640625, 0.964385986328125, 1.06103515625, 1.157684326171875, 1.25433349609375, 1.350982666015625, 1.4476318359375, 1.544281005859375, 1.64093017578125, 1.737579345703125, 1.834228515625, 1.930877685546875, 2.02752685546875, 2.124176025390625, 2.2208251953125, 2.317474365234375, 2.41412353515625, 2.510772705078125, 2.607421875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 7.0, 7.0, 9.0, 11.0, 15.0, 11.0, 18.0, 19.0, 19.0, 36.0, 34.0, 34.0, 30.0, 41.0, 36.0, 48.0, 42.0, 53.0, 42.0, 56.0, 51.0, 52.0, 44.0, 28.0, 31.0, 27.0, 25.0, 28.0, 27.0, 28.0, 20.0, 14.0, 11.0, 10.0, 8.0, 8.0, 7.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.18359375, -4.05047607421875, -3.9173583984375, -3.78424072265625, -3.651123046875, -3.51800537109375, -3.3848876953125, -3.25177001953125, -3.11865234375, -2.98553466796875, -2.8524169921875, -2.71929931640625, -2.586181640625, -2.45306396484375, -2.3199462890625, -2.18682861328125, -2.0537109375, -1.92059326171875, -1.7874755859375, -1.65435791015625, -1.521240234375, -1.38812255859375, -1.2550048828125, -1.12188720703125, -0.98876953125, -0.85565185546875, -0.7225341796875, -0.58941650390625, -0.456298828125, -0.32318115234375, -0.1900634765625, -0.05694580078125, 0.076171875, 0.20928955078125, 0.3424072265625, 0.47552490234375, 0.608642578125, 0.74176025390625, 0.8748779296875, 1.00799560546875, 1.14111328125, 1.27423095703125, 1.4073486328125, 1.54046630859375, 1.673583984375, 1.80670166015625, 1.9398193359375, 2.07293701171875, 2.2060546875, 2.33917236328125, 2.4722900390625, 2.60540771484375, 2.738525390625, 2.87164306640625, 3.0047607421875, 3.13787841796875, 3.27099609375, 3.40411376953125, 3.5372314453125, 3.67034912109375, 3.803466796875, 3.93658447265625, 4.0697021484375, 4.20281982421875, 4.3359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 6.0, 8.0, 9.0, 10.0, 27.0, 33.0, 37.0, 83.0, 108.0, 192.0, 337.0, 583.0, 1196.0, 2709.0, 7100.0, 42434.0, 757920.0, 213185.0, 14773.0, 4186.0, 1734.0, 815.0, 456.0, 221.0, 127.0, 92.0, 44.0, 45.0, 25.0, 16.0, 9.0, 12.0, 8.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.7689208984375, -2.647216796875, -2.5255126953125, -2.40380859375, -2.2821044921875, -2.160400390625, -2.0386962890625, -1.9169921875, -1.7952880859375, -1.673583984375, -1.5518798828125, -1.43017578125, -1.3084716796875, -1.186767578125, -1.0650634765625, -0.943359375, -0.8216552734375, -0.699951171875, -0.5782470703125, -0.45654296875, -0.3348388671875, -0.213134765625, -0.0914306640625, 0.0302734375, 0.1519775390625, 0.273681640625, 0.3953857421875, 0.51708984375, 0.6387939453125, 0.760498046875, 0.8822021484375, 1.00390625, 1.1256103515625, 1.247314453125, 1.3690185546875, 1.49072265625, 1.6124267578125, 1.734130859375, 1.8558349609375, 1.9775390625, 2.0992431640625, 2.220947265625, 2.3426513671875, 2.46435546875, 2.5860595703125, 2.707763671875, 2.8294677734375, 2.951171875, 3.0728759765625, 3.194580078125, 3.3162841796875, 3.43798828125, 3.5596923828125, 3.681396484375, 3.8031005859375, 3.9248046875, 4.0465087890625, 4.168212890625, 4.2899169921875, 4.41162109375, 4.5333251953125, 4.655029296875, 4.7767333984375, 4.8984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 6.0, 4.0, 6.0, 7.0, 9.0, 6.0, 12.0, 16.0, 19.0, 19.0, 21.0, 26.0, 31.0, 29.0, 34.0, 32.0, 38.0, 46.0, 40.0, 52.0, 45.0, 42.0, 41.0, 42.0, 40.0, 43.0, 44.0, 34.0, 31.0, 20.0, 20.0, 21.0, 21.0, 15.0, 20.0, 20.0, 13.0, 6.0, 12.0, 4.0, 4.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3828125, -7.1285400390625, -6.874267578125, -6.6199951171875, -6.36572265625, -6.1114501953125, -5.857177734375, -5.6029052734375, -5.3486328125, -5.0943603515625, -4.840087890625, -4.5858154296875, -4.33154296875, -4.0772705078125, -3.822998046875, -3.5687255859375, -3.314453125, -3.0601806640625, -2.805908203125, -2.5516357421875, -2.29736328125, -2.0430908203125, -1.788818359375, -1.5345458984375, -1.2802734375, -1.0260009765625, -0.771728515625, -0.5174560546875, -0.26318359375, -0.0089111328125, 0.245361328125, 0.4996337890625, 0.75390625, 1.0081787109375, 1.262451171875, 1.5167236328125, 1.77099609375, 2.0252685546875, 2.279541015625, 2.5338134765625, 2.7880859375, 3.0423583984375, 3.296630859375, 3.5509033203125, 3.80517578125, 4.0594482421875, 4.313720703125, 4.5679931640625, 4.822265625, 5.0765380859375, 5.330810546875, 5.5850830078125, 5.83935546875, 6.0936279296875, 6.347900390625, 6.6021728515625, 6.8564453125, 7.1107177734375, 7.364990234375, 7.6192626953125, 7.87353515625, 8.1278076171875, 8.382080078125, 8.6363525390625, 8.890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 13.0, 8.0, 20.0, 19.0, 34.0, 54.0, 96.0, 152.0, 259.0, 402.0, 748.0, 1419.0, 2966.0, 7080.0, 34223.0, 775223.0, 202193.0, 14413.0, 4560.0, 2120.0, 1087.0, 608.0, 332.0, 190.0, 111.0, 79.0, 47.0, 26.0, 25.0, 11.0, 11.0, 4.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8662109375, -1.80926513671875, -1.7523193359375, -1.69537353515625, -1.638427734375, -1.58148193359375, -1.5245361328125, -1.46759033203125, -1.41064453125, -1.35369873046875, -1.2967529296875, -1.23980712890625, -1.182861328125, -1.12591552734375, -1.0689697265625, -1.01202392578125, -0.955078125, -0.89813232421875, -0.8411865234375, -0.78424072265625, -0.727294921875, -0.67034912109375, -0.6134033203125, -0.55645751953125, -0.49951171875, -0.44256591796875, -0.3856201171875, -0.32867431640625, -0.271728515625, -0.21478271484375, -0.1578369140625, -0.10089111328125, -0.0439453125, 0.01300048828125, 0.0699462890625, 0.12689208984375, 0.183837890625, 0.24078369140625, 0.2977294921875, 0.35467529296875, 0.41162109375, 0.46856689453125, 0.5255126953125, 0.58245849609375, 0.639404296875, 0.69635009765625, 0.7532958984375, 0.81024169921875, 0.8671875, 0.92413330078125, 0.9810791015625, 1.03802490234375, 1.094970703125, 1.15191650390625, 1.2088623046875, 1.26580810546875, 1.32275390625, 1.37969970703125, 1.4366455078125, 1.49359130859375, 1.550537109375, 1.60748291015625, 1.6644287109375, 1.72137451171875, 1.7783203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 14.0, 29.0, 66.0, 149.0, 264.0, 256.0, 111.0, 55.0, 20.0, 9.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009222030639648438, -0.0008923858404159546, -0.0008625686168670654, -0.0008327513933181763, -0.0008029341697692871, -0.000773116946220398, -0.0007432997226715088, -0.0007134824991226196, -0.0006836652755737305, -0.0006538480520248413, -0.0006240308284759521, -0.000594213604927063, -0.0005643963813781738, -0.0005345791578292847, -0.0005047619342803955, -0.00047494471073150635, -0.0004451274871826172, -0.00041531026363372803, -0.00038549304008483887, -0.0003556758165359497, -0.00032585859298706055, -0.0002960413694381714, -0.0002662241458892822, -0.00023640692234039307, -0.0002065896987915039, -0.00017677247524261475, -0.00014695525169372559, -0.00011713802814483643, -8.732080459594727e-05, -5.7503581047058105e-05, -2.7686357498168945e-05, 2.130866050720215e-06, 3.1948089599609375e-05, 6.176531314849854e-05, 9.15825366973877e-05, 0.00012139976024627686, 0.00015121698379516602, 0.00018103420734405518, 0.00021085143089294434, 0.0002406686544418335, 0.00027048587799072266, 0.0003003031015396118, 0.000330120325088501, 0.00035993754863739014, 0.0003897547721862793, 0.00041957199573516846, 0.0004493892192840576, 0.0004792064428329468, 0.0005090236663818359, 0.0005388408899307251, 0.0005686581134796143, 0.0005984753370285034, 0.0006282925605773926, 0.0006581097841262817, 0.0006879270076751709, 0.0007177442312240601, 0.0007475614547729492, 0.0007773786783218384, 0.0008071959018707275, 0.0008370131254196167, 0.0008668303489685059, 0.000896647572517395, 0.0009264647960662842, 0.0009562820196151733, 0.0009860992431640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 2.0, 6.0, 4.0, 9.0, 15.0, 15.0, 37.0, 50.0, 88.0, 130.0, 249.0, 463.0, 817.0, 1649.0, 3100.0, 7666.0, 35628.0, 691034.0, 278785.0, 18048.0, 5409.0, 2574.0, 1218.0, 665.0, 379.0, 220.0, 107.0, 64.0, 39.0, 19.0, 23.0, 7.0, 10.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.880859375, -1.819854736328125, -1.75885009765625, -1.697845458984375, -1.6368408203125, -1.575836181640625, -1.51483154296875, -1.453826904296875, -1.392822265625, -1.331817626953125, -1.27081298828125, -1.209808349609375, -1.1488037109375, -1.087799072265625, -1.02679443359375, -0.965789794921875, -0.90478515625, -0.843780517578125, -0.78277587890625, -0.721771240234375, -0.6607666015625, -0.599761962890625, -0.53875732421875, -0.477752685546875, -0.416748046875, -0.355743408203125, -0.29473876953125, -0.233734130859375, -0.1727294921875, -0.111724853515625, -0.05072021484375, 0.010284423828125, 0.0712890625, 0.132293701171875, 0.19329833984375, 0.254302978515625, 0.3153076171875, 0.376312255859375, 0.43731689453125, 0.498321533203125, 0.559326171875, 0.620330810546875, 0.68133544921875, 0.742340087890625, 0.8033447265625, 0.864349365234375, 0.92535400390625, 0.986358642578125, 1.04736328125, 1.108367919921875, 1.16937255859375, 1.230377197265625, 1.2913818359375, 1.352386474609375, 1.41339111328125, 1.474395751953125, 1.535400390625, 1.596405029296875, 1.65740966796875, 1.718414306640625, 1.7794189453125, 1.840423583984375, 1.90142822265625, 1.962432861328125, 2.0234375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 3.0, 7.0, 24.0, 69.0, 89.0, 159.0, 206.0, 182.0, 120.0, 52.0, 29.0, 13.0, 9.0, 6.0, 6.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.60986328125, -0.5927658081054688, -0.5756683349609375, -0.5585708618164062, -0.541473388671875, -0.5243759155273438, -0.5072784423828125, -0.49018096923828125, -0.47308349609375, -0.45598602294921875, -0.4388885498046875, -0.42179107666015625, -0.404693603515625, -0.38759613037109375, -0.3704986572265625, -0.35340118408203125, -0.3363037109375, -0.31920623779296875, -0.3021087646484375, -0.28501129150390625, -0.267913818359375, -0.25081634521484375, -0.2337188720703125, -0.21662139892578125, -0.19952392578125, -0.18242645263671875, -0.1653289794921875, -0.14823150634765625, -0.131134033203125, -0.11403656005859375, -0.0969390869140625, -0.07984161376953125, -0.062744140625, -0.04564666748046875, -0.0285491943359375, -0.01145172119140625, 0.005645751953125, 0.02274322509765625, 0.0398406982421875, 0.05693817138671875, 0.07403564453125, 0.09113311767578125, 0.1082305908203125, 0.12532806396484375, 0.142425537109375, 0.15952301025390625, 0.1766204833984375, 0.19371795654296875, 0.2108154296875, 0.22791290283203125, 0.2450103759765625, 0.26210784912109375, 0.279205322265625, 0.29630279541015625, 0.3134002685546875, 0.33049774169921875, 0.34759521484375, 0.36469268798828125, 0.3817901611328125, 0.39888763427734375, 0.415985107421875, 0.43308258056640625, 0.4501800537109375, 0.46727752685546875, 0.484375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 9.0, 8.0, 6.0, 19.0, 28.0, 25.0, 35.0, 44.0, 59.0, 66.0, 79.0, 83.0, 79.0, 62.0, 72.0, 51.0, 46.0, 49.0, 51.0, 23.0, 27.0, 14.0, 15.0, 8.0, 9.0, 4.0, 2.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.988307952880859, -6.818626403808594, -6.648944854736328, -6.479263782501221, -6.309582233428955, -6.1399006843566895, -5.970219612121582, -5.800538063049316, -5.630856513977051, -5.461174964904785, -5.2914934158325195, -5.121812343597412, -4.9521307945251465, -4.782449245452881, -4.612768173217773, -4.443086624145508, -4.273405075073242, -4.103723526000977, -3.93404221534729, -3.7643609046936035, -3.594679355621338, -3.4249978065490723, -3.2553164958953857, -3.085635185241699, -2.9159536361694336, -2.746272087097168, -2.5765907764434814, -2.406909465789795, -2.2372279167175293, -2.0675463676452637, -1.8978650569915771, -1.728183627128601, -1.5585026741027832, -1.3888212442398071, -1.219139814376831, -1.049458384513855, -0.8797769546508789, -0.7100955247879028, -0.5404140949249268, -0.3707326650619507, -0.2010512351989746, -0.031369805335998535, 0.13831162452697754, 0.3079930543899536, 0.4776744842529297, 0.6473559141159058, 0.8170373439788818, 0.9867187738418579, 1.156400203704834, 1.32608163356781, 1.4957630634307861, 1.6654444932937622, 1.8351259231567383, 2.004807472229004, 2.1744887828826904, 2.344170093536377, 2.5138516426086426, 2.683533191680908, 2.8532145023345947, 3.0228958129882812, 3.192577362060547, 3.3622589111328125, 3.531940221786499, 3.7016215324401855, 3.871303081512451]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 5.0, 8.0, 11.0, 11.0, 11.0, 18.0, 18.0, 23.0, 21.0, 31.0, 41.0, 43.0, 43.0, 36.0, 33.0, 48.0, 49.0, 57.0, 60.0, 48.0, 48.0, 42.0, 40.0, 42.0, 22.0, 42.0, 28.0, 20.0, 15.0, 21.0, 19.0, 12.0, 12.0, 2.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.94316291809082, -4.803643703460693, -4.664124488830566, -4.5246052742004395, -4.3850860595703125, -4.245566368103027, -4.106047630310059, -3.9665281772613525, -3.8270087242126465, -3.6874895095825195, -3.5479702949523926, -3.4084510803222656, -3.2689316272735596, -3.1294124126434326, -2.9898931980133057, -2.8503739833831787, -2.7108547687530518, -2.571335554122925, -2.431816339492798, -2.292296886444092, -2.152777671813965, -2.013258457183838, -1.873739242553711, -1.734220027923584, -1.5947006940841675, -1.4551814794540405, -1.315662145614624, -1.176142930984497, -1.0366237163543701, -0.8971043825149536, -0.7575851678848267, -0.6180658936500549, -0.4785468578338623, -0.3390275835990906, -0.19950833916664124, -0.059989094734191895, 0.07953017950057983, 0.21904945373535156, 0.3585686683654785, 0.49808794260025024, 0.637607216835022, 0.7771264910697937, 0.9166457653045654, 1.0561649799346924, 1.1956841945648193, 1.3352035284042358, 1.4747227430343628, 1.6142420768737793, 1.7537612915039062, 1.8932805061340332, 2.03279972076416, 2.172318935394287, 2.311838388442993, 2.45135760307312, 2.590876817703247, 2.730396032333374, 2.86991548538208, 3.009434700012207, 3.148953914642334, 3.288473129272461, 3.427992582321167, 3.567511796951294, 3.707031011581421, 3.846550226211548, 3.986069440841675]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 4.0, 7.0, 10.0, 18.0, 25.0, 31.0, 64.0, 81.0, 168.0, 279.0, 522.0, 1141.0, 2910.0, 9029.0, 31421.0, 132733.0, 602886.0, 203837.0, 44458.0, 12178.0, 3896.0, 1448.0, 631.0, 298.0, 162.0, 94.0, 78.0, 40.0, 28.0, 21.0, 12.0, 19.0, 7.0, 8.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.54296875, -6.36907958984375, -6.1951904296875, -6.02130126953125, -5.847412109375, -5.67352294921875, -5.4996337890625, -5.32574462890625, -5.15185546875, -4.97796630859375, -4.8040771484375, -4.63018798828125, -4.456298828125, -4.28240966796875, -4.1085205078125, -3.93463134765625, -3.7607421875, -3.58685302734375, -3.4129638671875, -3.23907470703125, -3.065185546875, -2.89129638671875, -2.7174072265625, -2.54351806640625, -2.36962890625, -2.19573974609375, -2.0218505859375, -1.84796142578125, -1.674072265625, -1.50018310546875, -1.3262939453125, -1.15240478515625, -0.978515625, -0.80462646484375, -0.6307373046875, -0.45684814453125, -0.282958984375, -0.10906982421875, 0.0648193359375, 0.23870849609375, 0.41259765625, 0.58648681640625, 0.7603759765625, 0.93426513671875, 1.108154296875, 1.28204345703125, 1.4559326171875, 1.62982177734375, 1.8037109375, 1.97760009765625, 2.1514892578125, 2.32537841796875, 2.499267578125, 2.67315673828125, 2.8470458984375, 3.02093505859375, 3.19482421875, 3.36871337890625, 3.5426025390625, 3.71649169921875, 3.890380859375, 4.06427001953125, 4.2381591796875, 4.41204833984375, 4.5859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 7.0, 9.0, 11.0, 11.0, 8.0, 13.0, 11.0, 34.0, 28.0, 31.0, 36.0, 38.0, 44.0, 46.0, 39.0, 60.0, 51.0, 54.0, 46.0, 43.0, 47.0, 54.0, 43.0, 36.0, 41.0, 29.0, 21.0, 22.0, 13.0, 15.0, 20.0, 8.0, 5.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.2265625, -8.9482421875, -8.669921875, -8.3916015625, -8.11328125, -7.8349609375, -7.556640625, -7.2783203125, -7.0, -6.7216796875, -6.443359375, -6.1650390625, -5.88671875, -5.6083984375, -5.330078125, -5.0517578125, -4.7734375, -4.4951171875, -4.216796875, -3.9384765625, -3.66015625, -3.3818359375, -3.103515625, -2.8251953125, -2.546875, -2.2685546875, -1.990234375, -1.7119140625, -1.43359375, -1.1552734375, -0.876953125, -0.5986328125, -0.3203125, -0.0419921875, 0.236328125, 0.5146484375, 0.79296875, 1.0712890625, 1.349609375, 1.6279296875, 1.90625, 2.1845703125, 2.462890625, 2.7412109375, 3.01953125, 3.2978515625, 3.576171875, 3.8544921875, 4.1328125, 4.4111328125, 4.689453125, 4.9677734375, 5.24609375, 5.5244140625, 5.802734375, 6.0810546875, 6.359375, 6.6376953125, 6.916015625, 7.1943359375, 7.47265625, 7.7509765625, 8.029296875, 8.3076171875, 8.5859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 7.0, 3.0, 2.0, 9.0, 10.0, 17.0, 15.0, 25.0, 20.0, 31.0, 46.0, 64.0, 65.0, 118.0, 339.0, 1750.0, 53697.0, 967391.0, 23045.0, 1144.0, 302.0, 144.0, 75.0, 48.0, 42.0, 25.0, 19.0, 21.0, 19.0, 11.0, 11.0, 5.0, 7.0, 10.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.734375, -15.16015625, -14.5859375, -14.01171875, -13.4375, -12.86328125, -12.2890625, -11.71484375, -11.140625, -10.56640625, -9.9921875, -9.41796875, -8.84375, -8.26953125, -7.6953125, -7.12109375, -6.546875, -5.97265625, -5.3984375, -4.82421875, -4.25, -3.67578125, -3.1015625, -2.52734375, -1.953125, -1.37890625, -0.8046875, -0.23046875, 0.34375, 0.91796875, 1.4921875, 2.06640625, 2.640625, 3.21484375, 3.7890625, 4.36328125, 4.9375, 5.51171875, 6.0859375, 6.66015625, 7.234375, 7.80859375, 8.3828125, 8.95703125, 9.53125, 10.10546875, 10.6796875, 11.25390625, 11.828125, 12.40234375, 12.9765625, 13.55078125, 14.125, 14.69921875, 15.2734375, 15.84765625, 16.421875, 16.99609375, 17.5703125, 18.14453125, 18.71875, 19.29296875, 19.8671875, 20.44140625, 21.015625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 5.0, 4.0, 16.0, 13.0, 14.0, 18.0, 23.0, 27.0, 39.0, 40.0, 32.0, 37.0, 44.0, 56.0, 57.0, 57.0, 59.0, 58.0, 52.0, 50.0, 38.0, 37.0, 40.0, 35.0, 26.0, 21.0, 20.0, 9.0, 15.0, 8.0, 11.0, 10.0, 6.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3671875, -9.033203125, -8.69921875, -8.365234375, -8.03125, -7.697265625, -7.36328125, -7.029296875, -6.6953125, -6.361328125, -6.02734375, -5.693359375, -5.359375, -5.025390625, -4.69140625, -4.357421875, -4.0234375, -3.689453125, -3.35546875, -3.021484375, -2.6875, -2.353515625, -2.01953125, -1.685546875, -1.3515625, -1.017578125, -0.68359375, -0.349609375, -0.015625, 0.318359375, 0.65234375, 0.986328125, 1.3203125, 1.654296875, 1.98828125, 2.322265625, 2.65625, 2.990234375, 3.32421875, 3.658203125, 3.9921875, 4.326171875, 4.66015625, 4.994140625, 5.328125, 5.662109375, 5.99609375, 6.330078125, 6.6640625, 6.998046875, 7.33203125, 7.666015625, 8.0, 8.333984375, 8.66796875, 9.001953125, 9.3359375, 9.669921875, 10.00390625, 10.337890625, 10.671875, 11.005859375, 11.33984375, 11.673828125, 12.0078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 18.0, 14.0, 45.0, 51.0, 93.0, 176.0, 488.0, 1933.0, 13847.0, 197246.0, 778499.0, 49447.0, 5276.0, 867.0, 253.0, 109.0, 76.0, 42.0, 29.0, 9.0, 11.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.75390625, -2.656463623046875, -2.55902099609375, -2.461578369140625, -2.3641357421875, -2.266693115234375, -2.16925048828125, -2.071807861328125, -1.974365234375, -1.876922607421875, -1.77947998046875, -1.682037353515625, -1.5845947265625, -1.487152099609375, -1.38970947265625, -1.292266845703125, -1.19482421875, -1.097381591796875, -0.99993896484375, -0.902496337890625, -0.8050537109375, -0.707611083984375, -0.61016845703125, -0.512725830078125, -0.415283203125, -0.317840576171875, -0.22039794921875, -0.122955322265625, -0.0255126953125, 0.071929931640625, 0.16937255859375, 0.266815185546875, 0.3642578125, 0.461700439453125, 0.55914306640625, 0.656585693359375, 0.7540283203125, 0.851470947265625, 0.94891357421875, 1.046356201171875, 1.143798828125, 1.241241455078125, 1.33868408203125, 1.436126708984375, 1.5335693359375, 1.631011962890625, 1.72845458984375, 1.825897216796875, 1.92333984375, 2.020782470703125, 2.11822509765625, 2.215667724609375, 2.3131103515625, 2.410552978515625, 2.50799560546875, 2.605438232421875, 2.702880859375, 2.800323486328125, 2.89776611328125, 2.995208740234375, 3.0926513671875, 3.190093994140625, 3.28753662109375, 3.384979248046875, 3.482421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 7.0, 7.0, 16.0, 18.0, 26.0, 33.0, 49.0, 53.0, 78.0, 89.0, 125.0, 112.0, 83.0, 78.0, 52.0, 34.0, 20.0, 16.0, 18.0, 14.0, 13.0, 10.0, 7.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023102760314941406, -0.00022373348474502563, -0.0002164393663406372, -0.00020914524793624878, -0.00020185112953186035, -0.00019455701112747192, -0.0001872628927230835, -0.00017996877431869507, -0.00017267465591430664, -0.0001653805375099182, -0.00015808641910552979, -0.00015079230070114136, -0.00014349818229675293, -0.0001362040638923645, -0.00012890994548797607, -0.00012161582708358765, -0.00011432170867919922, -0.00010702759027481079, -9.973347187042236e-05, -9.243935346603394e-05, -8.514523506164551e-05, -7.785111665725708e-05, -7.055699825286865e-05, -6.326287984848022e-05, -5.59687614440918e-05, -4.867464303970337e-05, -4.138052463531494e-05, -3.4086406230926514e-05, -2.6792287826538086e-05, -1.9498169422149658e-05, -1.220405101776123e-05, -4.909932613372803e-06, 2.384185791015625e-06, 9.678304195404053e-06, 1.697242259979248e-05, 2.4266541004180908e-05, 3.1560659408569336e-05, 3.8854777812957764e-05, 4.614889621734619e-05, 5.344301462173462e-05, 6.073713302612305e-05, 6.803125143051147e-05, 7.53253698348999e-05, 8.261948823928833e-05, 8.991360664367676e-05, 9.720772504806519e-05, 0.00010450184345245361, 0.00011179596185684204, 0.00011909008026123047, 0.0001263841986656189, 0.00013367831707000732, 0.00014097243547439575, 0.00014826655387878418, 0.0001555606722831726, 0.00016285479068756104, 0.00017014890909194946, 0.0001774430274963379, 0.00018473714590072632, 0.00019203126430511475, 0.00019932538270950317, 0.0002066195011138916, 0.00021391361951828003, 0.00022120773792266846, 0.00022850185632705688, 0.0002357959747314453]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 6.0, 9.0, 14.0, 26.0, 42.0, 101.0, 244.0, 747.0, 3381.0, 25801.0, 562855.0, 429341.0, 21868.0, 3051.0, 670.0, 224.0, 85.0, 44.0, 27.0, 8.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4140625, -3.303802490234375, -3.19354248046875, -3.083282470703125, -2.9730224609375, -2.862762451171875, -2.75250244140625, -2.642242431640625, -2.531982421875, -2.421722412109375, -2.31146240234375, -2.201202392578125, -2.0909423828125, -1.980682373046875, -1.87042236328125, -1.760162353515625, -1.64990234375, -1.539642333984375, -1.42938232421875, -1.319122314453125, -1.2088623046875, -1.098602294921875, -0.98834228515625, -0.878082275390625, -0.767822265625, -0.657562255859375, -0.54730224609375, -0.437042236328125, -0.3267822265625, -0.216522216796875, -0.10626220703125, 0.003997802734375, 0.1142578125, 0.224517822265625, 0.33477783203125, 0.445037841796875, 0.5552978515625, 0.665557861328125, 0.77581787109375, 0.886077880859375, 0.996337890625, 1.106597900390625, 1.21685791015625, 1.327117919921875, 1.4373779296875, 1.547637939453125, 1.65789794921875, 1.768157958984375, 1.87841796875, 1.988677978515625, 2.09893798828125, 2.209197998046875, 2.3194580078125, 2.429718017578125, 2.53997802734375, 2.650238037109375, 2.760498046875, 2.870758056640625, 2.98101806640625, 3.091278076171875, 3.2015380859375, 3.311798095703125, 3.42205810546875, 3.532318115234375, 3.642578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 7.0, 6.0, 6.0, 11.0, 12.0, 13.0, 24.0, 21.0, 24.0, 36.0, 36.0, 73.0, 87.0, 109.0, 110.0, 111.0, 63.0, 49.0, 45.0, 36.0, 22.0, 26.0, 16.0, 17.0, 8.0, 12.0, 4.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 2.0], "bins": [-1.083984375, -1.0569915771484375, -1.029998779296875, -1.0030059814453125, -0.97601318359375, -0.9490203857421875, -0.922027587890625, -0.8950347900390625, -0.8680419921875, -0.8410491943359375, -0.814056396484375, -0.7870635986328125, -0.76007080078125, -0.7330780029296875, -0.706085205078125, -0.6790924072265625, -0.652099609375, -0.6251068115234375, -0.598114013671875, -0.5711212158203125, -0.54412841796875, -0.5171356201171875, -0.490142822265625, -0.4631500244140625, -0.4361572265625, -0.4091644287109375, -0.382171630859375, -0.3551788330078125, -0.32818603515625, -0.3011932373046875, -0.274200439453125, -0.2472076416015625, -0.22021484375, -0.1932220458984375, -0.166229248046875, -0.1392364501953125, -0.11224365234375, -0.0852508544921875, -0.058258056640625, -0.0312652587890625, -0.0042724609375, 0.0227203369140625, 0.049713134765625, 0.0767059326171875, 0.10369873046875, 0.1306915283203125, 0.157684326171875, 0.1846771240234375, 0.211669921875, 0.2386627197265625, 0.265655517578125, 0.2926483154296875, 0.31964111328125, 0.3466339111328125, 0.373626708984375, 0.4006195068359375, 0.4276123046875, 0.4546051025390625, 0.481597900390625, 0.5085906982421875, 0.53558349609375, 0.5625762939453125, 0.589569091796875, 0.6165618896484375, 0.6435546875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 8.0, 8.0, 14.0, 30.0, 48.0, 77.0, 118.0, 172.0, 147.0, 141.0, 94.0, 61.0, 45.0, 20.0, 13.0, 10.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.494327545166016, -10.783188819885254, -10.072050094604492, -9.360910415649414, -8.649772644042969, -7.938633441925049, -7.227494239807129, -6.516355514526367, -5.8052167892456055, -5.094078063964844, -4.382939338684082, -3.671800136566162, -2.9606614112854004, -2.2495226860046387, -1.5383834838867188, -0.827244758605957, -0.11610603332519531, 0.595032811164856, 1.3061716556549072, 2.017310619354248, 2.7284493446350098, 3.4395880699157715, 4.150727272033691, 4.861865997314453, 5.573004722595215, 6.284143447875977, 6.995282173156738, 7.706421375274658, 8.417560577392578, 9.128698348999023, 9.839838027954102, 10.550976753234863, 11.262115478515625, 11.973254203796387, 12.684392929077148, 13.395532608032227, 14.106670379638672, 14.81781005859375, 15.528948783874512, 16.240087509155273, 16.95122528076172, 17.662364959716797, 18.373502731323242, 19.08464241027832, 19.795780181884766, 20.506919860839844, 21.218059539794922, 21.929197311401367, 22.640336990356445, 23.351476669311523, 24.06261444091797, 24.773754119873047, 25.484891891479492, 26.19603157043457, 26.907169342041016, 27.618309020996094, 28.329448699951172, 29.04058837890625, 29.751726150512695, 30.462865829467773, 31.17400360107422, 31.885143280029297, 32.596282958984375, 33.30741882324219, 34.018558502197266]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 6.0, 10.0, 8.0, 15.0, 5.0, 6.0, 16.0, 18.0, 10.0, 7.0, 16.0, 16.0, 17.0, 24.0, 21.0, 30.0, 32.0, 27.0, 36.0, 35.0, 33.0, 28.0, 39.0, 31.0, 39.0, 43.0, 45.0, 41.0, 40.0, 21.0, 34.0, 33.0, 24.0, 25.0, 25.0, 17.0, 26.0, 12.0, 18.0, 12.0, 13.0, 10.0, 10.0, 11.0, 6.0, 1.0, 9.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-12.265440940856934, -11.862866401672363, -11.460291862487793, -11.057717323303223, -10.655141830444336, -10.252567291259766, -9.849992752075195, -9.447418212890625, -9.044843673706055, -8.642269134521484, -8.239694595336914, -7.8371195793151855, -7.434545040130615, -7.031970500946045, -6.629395484924316, -6.226820945739746, -5.824246406555176, -5.4216718673706055, -5.019097328186035, -4.616522312164307, -4.213947772979736, -3.811373233795166, -3.4087984561920166, -3.006223678588867, -2.603649139404297, -2.2010746002197266, -1.7984998226165771, -1.3959251642227173, -0.9933505058288574, -0.5907759666442871, -0.1882011890411377, 0.21437358856201172, 0.616948127746582, 1.019522786140442, 1.4220974445343018, 1.8246721029281616, 2.2272467613220215, 2.629821300506592, 3.032396078109741, 3.4349708557128906, 3.837545394897461, 4.240119934082031, 4.642694473266602, 5.04526948928833, 5.4478440284729, 5.850418567657471, 6.252993583679199, 6.6555681228637695, 7.05814266204834, 7.46071720123291, 7.8632917404174805, 8.26586627960205, 8.668441772460938, 9.071016311645508, 9.473590850830078, 9.876165390014648, 10.278739929199219, 10.681314468383789, 11.08388900756836, 11.48646354675293, 11.8890380859375, 12.29161262512207, 12.694188117980957, 13.096762657165527, 13.499337196350098]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 9.0, 4.0, 13.0, 30.0, 28.0, 44.0, 83.0, 105.0, 204.0, 362.0, 567.0, 1137.0, 2397.0, 6070.0, 20252.0, 114390.0, 1618395.0, 2218780.0, 173149.0, 25777.0, 7182.0, 2596.0, 1209.0, 631.0, 325.0, 201.0, 121.0, 83.0, 40.0, 36.0, 28.0, 8.0, 14.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0703125, -8.768798828125, -8.46728515625, -8.165771484375, -7.8642578125, -7.562744140625, -7.26123046875, -6.959716796875, -6.658203125, -6.356689453125, -6.05517578125, -5.753662109375, -5.4521484375, -5.150634765625, -4.84912109375, -4.547607421875, -4.24609375, -3.944580078125, -3.64306640625, -3.341552734375, -3.0400390625, -2.738525390625, -2.43701171875, -2.135498046875, -1.833984375, -1.532470703125, -1.23095703125, -0.929443359375, -0.6279296875, -0.326416015625, -0.02490234375, 0.276611328125, 0.578125, 0.879638671875, 1.18115234375, 1.482666015625, 1.7841796875, 2.085693359375, 2.38720703125, 2.688720703125, 2.990234375, 3.291748046875, 3.59326171875, 3.894775390625, 4.1962890625, 4.497802734375, 4.79931640625, 5.100830078125, 5.40234375, 5.703857421875, 6.00537109375, 6.306884765625, 6.6083984375, 6.909912109375, 7.21142578125, 7.512939453125, 7.814453125, 8.115966796875, 8.41748046875, 8.718994140625, 9.0205078125, 9.322021484375, 9.62353515625, 9.925048828125, 10.2265625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 10.0, 17.0, 12.0, 21.0, 30.0, 35.0, 39.0, 46.0, 49.0, 41.0, 53.0, 50.0, 60.0, 63.0, 60.0, 46.0, 50.0, 63.0, 47.0, 41.0, 35.0, 24.0, 30.0, 17.0, 16.0, 8.0, 8.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.80078125, -5.62042236328125, -5.4400634765625, -5.25970458984375, -5.079345703125, -4.89898681640625, -4.7186279296875, -4.53826904296875, -4.35791015625, -4.17755126953125, -3.9971923828125, -3.81683349609375, -3.636474609375, -3.45611572265625, -3.2757568359375, -3.09539794921875, -2.9150390625, -2.73468017578125, -2.5543212890625, -2.37396240234375, -2.193603515625, -2.01324462890625, -1.8328857421875, -1.65252685546875, -1.47216796875, -1.29180908203125, -1.1114501953125, -0.93109130859375, -0.750732421875, -0.57037353515625, -0.3900146484375, -0.20965576171875, -0.029296875, 0.15106201171875, 0.3314208984375, 0.51177978515625, 0.692138671875, 0.87249755859375, 1.0528564453125, 1.23321533203125, 1.41357421875, 1.59393310546875, 1.7742919921875, 1.95465087890625, 2.135009765625, 2.31536865234375, 2.4957275390625, 2.67608642578125, 2.8564453125, 3.03680419921875, 3.2171630859375, 3.39752197265625, 3.577880859375, 3.75823974609375, 3.9385986328125, 4.11895751953125, 4.29931640625, 4.47967529296875, 4.6600341796875, 4.84039306640625, 5.020751953125, 5.20111083984375, 5.3814697265625, 5.56182861328125, 5.7421875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 6.0, 8.0, 7.0, 17.0, 21.0, 46.0, 46.0, 72.0, 164.0, 302.0, 817.0, 3070.0, 16470.0, 177310.0, 3619384.0, 346495.0, 24273.0, 4057.0, 995.0, 335.0, 166.0, 77.0, 47.0, 30.0, 16.0, 16.0, 7.0, 7.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.859375, -14.4171142578125, -13.974853515625, -13.5325927734375, -13.09033203125, -12.6480712890625, -12.205810546875, -11.7635498046875, -11.3212890625, -10.8790283203125, -10.436767578125, -9.9945068359375, -9.55224609375, -9.1099853515625, -8.667724609375, -8.2254638671875, -7.783203125, -7.3409423828125, -6.898681640625, -6.4564208984375, -6.01416015625, -5.5718994140625, -5.129638671875, -4.6873779296875, -4.2451171875, -3.8028564453125, -3.360595703125, -2.9183349609375, -2.47607421875, -2.0338134765625, -1.591552734375, -1.1492919921875, -0.70703125, -0.2647705078125, 0.177490234375, 0.6197509765625, 1.06201171875, 1.5042724609375, 1.946533203125, 2.3887939453125, 2.8310546875, 3.2733154296875, 3.715576171875, 4.1578369140625, 4.60009765625, 5.0423583984375, 5.484619140625, 5.9268798828125, 6.369140625, 6.8114013671875, 7.253662109375, 7.6959228515625, 8.13818359375, 8.5804443359375, 9.022705078125, 9.4649658203125, 9.9072265625, 10.3494873046875, 10.791748046875, 11.2340087890625, 11.67626953125, 12.1185302734375, 12.560791015625, 13.0030517578125, 13.4453125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 3.0, 6.0, 12.0, 9.0, 4.0, 9.0, 18.0, 21.0, 22.0, 39.0, 72.0, 70.0, 121.0, 160.0, 207.0, 279.0, 451.0, 476.0, 500.0, 431.0, 336.0, 200.0, 148.0, 126.0, 75.0, 88.0, 49.0, 26.0, 24.0, 22.0, 18.0, 9.0, 10.0, 8.0, 5.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.046875, -1.97119140625, -1.8955078125, -1.81982421875, -1.744140625, -1.66845703125, -1.5927734375, -1.51708984375, -1.44140625, -1.36572265625, -1.2900390625, -1.21435546875, -1.138671875, -1.06298828125, -0.9873046875, -0.91162109375, -0.8359375, -0.76025390625, -0.6845703125, -0.60888671875, -0.533203125, -0.45751953125, -0.3818359375, -0.30615234375, -0.23046875, -0.15478515625, -0.0791015625, -0.00341796875, 0.072265625, 0.14794921875, 0.2236328125, 0.29931640625, 0.375, 0.45068359375, 0.5263671875, 0.60205078125, 0.677734375, 0.75341796875, 0.8291015625, 0.90478515625, 0.98046875, 1.05615234375, 1.1318359375, 1.20751953125, 1.283203125, 1.35888671875, 1.4345703125, 1.51025390625, 1.5859375, 1.66162109375, 1.7373046875, 1.81298828125, 1.888671875, 1.96435546875, 2.0400390625, 2.11572265625, 2.19140625, 2.26708984375, 2.3427734375, 2.41845703125, 2.494140625, 2.56982421875, 2.6455078125, 2.72119140625, 2.796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 9.0, 10.0, 21.0, 20.0, 37.0, 41.0, 47.0, 49.0, 57.0, 93.0, 94.0, 90.0, 84.0, 66.0, 52.0, 53.0, 43.0, 34.0, 28.0, 23.0, 12.0, 10.0, 7.0, 3.0, 2.0, 6.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.043330192565918, -10.745776176452637, -10.448223114013672, -10.15066909790039, -9.85311508178711, -9.555561065673828, -9.258008003234863, -8.960453987121582, -8.662900924682617, -8.365346908569336, -8.067793846130371, -7.77023983001709, -7.472685813903809, -7.1751322746276855, -6.8775787353515625, -6.580024719238281, -6.282470703125, -5.984917163848877, -5.687363147735596, -5.389809608459473, -5.092255592346191, -4.794702053070068, -4.497148513793945, -4.199594497680664, -3.902040958404541, -3.604487180709839, -3.3069334030151367, -3.0093798637390137, -2.7118260860443115, -2.4142723083496094, -2.1167187690734863, -1.8191649913787842, -1.5216121673583984, -1.2240583896636963, -0.9265047311782837, -0.6289510130882263, -0.33139729499816895, -0.0338435173034668, 0.2637101411819458, 0.5612637996673584, 0.8588175773620605, 1.1563713550567627, 1.4539250135421753, 1.751478672027588, 2.04903244972229, 2.346586227416992, 2.6441397666931152, 2.9416935443878174, 3.2392473220825195, 3.5368010997772217, 3.834354877471924, 4.131908416748047, 4.429462432861328, 4.727015972137451, 5.024569511413574, 5.3221235275268555, 5.6196770668029785, 5.917230606079102, 6.214784622192383, 6.512338161468506, 6.809891700744629, 7.10744571685791, 7.404999256134033, 7.702552795410156, 8.000106811523438]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 10.0, 7.0, 8.0, 7.0, 11.0, 11.0, 18.0, 18.0, 26.0, 27.0, 25.0, 32.0, 24.0, 31.0, 37.0, 43.0, 36.0, 47.0, 44.0, 31.0, 44.0, 46.0, 30.0, 44.0, 32.0, 42.0, 32.0, 31.0, 38.0, 26.0, 26.0, 23.0, 23.0, 18.0, 9.0, 1.0, 7.0, 6.0, 3.0, 4.0, 6.0, 3.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.768219947814941, -4.596986293792725, -4.425752639770508, -4.254518985748291, -4.083285331726074, -3.9120514392852783, -3.7408177852630615, -3.5695838928222656, -3.398350238800049, -3.227116584777832, -3.0558829307556152, -2.8846492767333984, -2.7134153842926025, -2.5421817302703857, -2.370948076248169, -2.199714183807373, -2.0284807682037354, -1.8572471141815186, -1.6860133409500122, -1.5147796869277954, -1.343545913696289, -1.1723122596740723, -1.0010786056518555, -0.8298448324203491, -0.6586111783981323, -0.48737746477127075, -0.31614378094673157, -0.14491009712219238, 0.02632361650466919, 0.19755733013153076, 0.36879098415374756, 0.5400247573852539, 0.7112584114074707, 0.8824921250343323, 1.0537258386611938, 1.2249594926834106, 1.396193265914917, 1.5674269199371338, 1.7386605739593506, 1.909894347190857, 2.0811281204223633, 2.25236177444458, 2.423595428466797, 2.5948290824890137, 2.7660629749298096, 2.9372966289520264, 3.108530282974243, 3.279764175415039, 3.4509975910186768, 3.6222312450408936, 3.7934648990631104, 3.9646987915039062, 4.135932445526123, 4.30716609954834, 4.478399753570557, 4.649633407592773, 4.82086706161499, 4.992100715637207, 5.163334369659424, 5.334568023681641, 5.505801677703857, 5.677035331726074, 5.848269462585449, 6.019503116607666, 6.190736770629883]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 3.0, 15.0, 13.0, 21.0, 28.0, 57.0, 69.0, 115.0, 181.0, 310.0, 547.0, 958.0, 1735.0, 3547.0, 7443.0, 16772.0, 43866.0, 139621.0, 403482.0, 291043.0, 85992.0, 29478.0, 11919.0, 5352.0, 2792.0, 1336.0, 757.0, 445.0, 230.0, 137.0, 104.0, 54.0, 43.0, 34.0, 22.0, 12.0, 6.0, 9.0, 1.0, 6.0, 3.0, 2.0, 0.0, 1.0], "bins": [-2.22265625, -2.165374755859375, -2.10809326171875, -2.050811767578125, -1.9935302734375, -1.936248779296875, -1.87896728515625, -1.821685791015625, -1.764404296875, -1.707122802734375, -1.64984130859375, -1.592559814453125, -1.5352783203125, -1.477996826171875, -1.42071533203125, -1.363433837890625, -1.30615234375, -1.248870849609375, -1.19158935546875, -1.134307861328125, -1.0770263671875, -1.019744873046875, -0.96246337890625, -0.905181884765625, -0.847900390625, -0.790618896484375, -0.73333740234375, -0.676055908203125, -0.6187744140625, -0.561492919921875, -0.50421142578125, -0.446929931640625, -0.3896484375, -0.332366943359375, -0.27508544921875, -0.217803955078125, -0.1605224609375, -0.103240966796875, -0.04595947265625, 0.011322021484375, 0.068603515625, 0.125885009765625, 0.18316650390625, 0.240447998046875, 0.2977294921875, 0.355010986328125, 0.41229248046875, 0.469573974609375, 0.52685546875, 0.584136962890625, 0.64141845703125, 0.698699951171875, 0.7559814453125, 0.813262939453125, 0.87054443359375, 0.927825927734375, 0.985107421875, 1.042388916015625, 1.09967041015625, 1.156951904296875, 1.2142333984375, 1.271514892578125, 1.32879638671875, 1.386077880859375, 1.443359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 6.0, 6.0, 7.0, 12.0, 6.0, 8.0, 11.0, 23.0, 19.0, 21.0, 30.0, 26.0, 22.0, 35.0, 38.0, 35.0, 52.0, 27.0, 40.0, 40.0, 41.0, 50.0, 45.0, 38.0, 33.0, 37.0, 36.0, 37.0, 28.0, 31.0, 23.0, 27.0, 20.0, 17.0, 13.0, 14.0, 2.0, 8.0, 6.0, 6.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.00390625, -2.9024658203125, -2.801025390625, -2.6995849609375, -2.59814453125, -2.4967041015625, -2.395263671875, -2.2938232421875, -2.1923828125, -2.0909423828125, -1.989501953125, -1.8880615234375, -1.78662109375, -1.6851806640625, -1.583740234375, -1.4822998046875, -1.380859375, -1.2794189453125, -1.177978515625, -1.0765380859375, -0.97509765625, -0.8736572265625, -0.772216796875, -0.6707763671875, -0.5693359375, -0.4678955078125, -0.366455078125, -0.2650146484375, -0.16357421875, -0.0621337890625, 0.039306640625, 0.1407470703125, 0.2421875, 0.3436279296875, 0.445068359375, 0.5465087890625, 0.64794921875, 0.7493896484375, 0.850830078125, 0.9522705078125, 1.0537109375, 1.1551513671875, 1.256591796875, 1.3580322265625, 1.45947265625, 1.5609130859375, 1.662353515625, 1.7637939453125, 1.865234375, 1.9666748046875, 2.068115234375, 2.1695556640625, 2.27099609375, 2.3724365234375, 2.473876953125, 2.5753173828125, 2.6767578125, 2.7781982421875, 2.879638671875, 2.9810791015625, 3.08251953125, 3.1839599609375, 3.285400390625, 3.3868408203125, 3.48828125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 5.0, 5.0, 11.0, 13.0, 27.0, 30.0, 40.0, 67.0, 111.0, 170.0, 327.0, 596.0, 1266.0, 3417.0, 11485.0, 56425.0, 381888.0, 494487.0, 76938.0, 14351.0, 3941.0, 1414.0, 696.0, 338.0, 181.0, 106.0, 59.0, 49.0, 36.0, 20.0, 13.0, 13.0, 9.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1640625, -2.092132568359375, -2.02020263671875, -1.948272705078125, -1.8763427734375, -1.804412841796875, -1.73248291015625, -1.660552978515625, -1.588623046875, -1.516693115234375, -1.44476318359375, -1.372833251953125, -1.3009033203125, -1.228973388671875, -1.15704345703125, -1.085113525390625, -1.01318359375, -0.941253662109375, -0.86932373046875, -0.797393798828125, -0.7254638671875, -0.653533935546875, -0.58160400390625, -0.509674072265625, -0.437744140625, -0.365814208984375, -0.29388427734375, -0.221954345703125, -0.1500244140625, -0.078094482421875, -0.00616455078125, 0.065765380859375, 0.1376953125, 0.209625244140625, 0.28155517578125, 0.353485107421875, 0.4254150390625, 0.497344970703125, 0.56927490234375, 0.641204833984375, 0.713134765625, 0.785064697265625, 0.85699462890625, 0.928924560546875, 1.0008544921875, 1.072784423828125, 1.14471435546875, 1.216644287109375, 1.28857421875, 1.360504150390625, 1.43243408203125, 1.504364013671875, 1.5762939453125, 1.648223876953125, 1.72015380859375, 1.792083740234375, 1.864013671875, 1.935943603515625, 2.00787353515625, 2.079803466796875, 2.1517333984375, 2.223663330078125, 2.29559326171875, 2.367523193359375, 2.439453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 8.0, 8.0, 4.0, 4.0, 5.0, 15.0, 13.0, 11.0, 7.0, 14.0, 23.0, 28.0, 31.0, 33.0, 42.0, 47.0, 42.0, 51.0, 56.0, 70.0, 65.0, 46.0, 52.0, 42.0, 40.0, 36.0, 32.0, 32.0, 37.0, 19.0, 20.0, 17.0, 16.0, 18.0, 8.0, 5.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.73828125, -7.48712158203125, -7.2359619140625, -6.98480224609375, -6.733642578125, -6.48248291015625, -6.2313232421875, -5.98016357421875, -5.72900390625, -5.47784423828125, -5.2266845703125, -4.97552490234375, -4.724365234375, -4.47320556640625, -4.2220458984375, -3.97088623046875, -3.7197265625, -3.46856689453125, -3.2174072265625, -2.96624755859375, -2.715087890625, -2.46392822265625, -2.2127685546875, -1.96160888671875, -1.71044921875, -1.45928955078125, -1.2081298828125, -0.95697021484375, -0.705810546875, -0.45465087890625, -0.2034912109375, 0.04766845703125, 0.298828125, 0.54998779296875, 0.8011474609375, 1.05230712890625, 1.303466796875, 1.55462646484375, 1.8057861328125, 2.05694580078125, 2.30810546875, 2.55926513671875, 2.8104248046875, 3.06158447265625, 3.312744140625, 3.56390380859375, 3.8150634765625, 4.06622314453125, 4.3173828125, 4.56854248046875, 4.8197021484375, 5.07086181640625, 5.322021484375, 5.57318115234375, 5.8243408203125, 6.07550048828125, 6.32666015625, 6.57781982421875, 6.8289794921875, 7.08013916015625, 7.331298828125, 7.58245849609375, 7.8336181640625, 8.08477783203125, 8.3359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 18.0, 22.0, 22.0, 46.0, 65.0, 113.0, 165.0, 285.0, 506.0, 936.0, 1919.0, 4086.0, 10404.0, 30321.0, 112541.0, 454095.0, 323419.0, 74038.0, 21347.0, 7634.0, 3225.0, 1461.0, 758.0, 417.0, 249.0, 177.0, 93.0, 58.0, 46.0, 27.0, 23.0, 9.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.986328125, -0.9588165283203125, -0.931304931640625, -0.9037933349609375, -0.87628173828125, -0.8487701416015625, -0.821258544921875, -0.7937469482421875, -0.7662353515625, -0.7387237548828125, -0.711212158203125, -0.6837005615234375, -0.65618896484375, -0.6286773681640625, -0.601165771484375, -0.5736541748046875, -0.546142578125, -0.5186309814453125, -0.491119384765625, -0.4636077880859375, -0.43609619140625, -0.4085845947265625, -0.381072998046875, -0.3535614013671875, -0.3260498046875, -0.2985382080078125, -0.271026611328125, -0.2435150146484375, -0.21600341796875, -0.1884918212890625, -0.160980224609375, -0.1334686279296875, -0.10595703125, -0.0784454345703125, -0.050933837890625, -0.0234222412109375, 0.00408935546875, 0.0316009521484375, 0.059112548828125, 0.0866241455078125, 0.1141357421875, 0.1416473388671875, 0.169158935546875, 0.1966705322265625, 0.22418212890625, 0.2516937255859375, 0.279205322265625, 0.3067169189453125, 0.334228515625, 0.3617401123046875, 0.389251708984375, 0.4167633056640625, 0.44427490234375, 0.4717864990234375, 0.499298095703125, 0.5268096923828125, 0.5543212890625, 0.5818328857421875, 0.609344482421875, 0.6368560791015625, 0.66436767578125, 0.6918792724609375, 0.719390869140625, 0.7469024658203125, 0.7744140625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 5.0, 8.0, 11.0, 19.0, 19.0, 29.0, 39.0, 43.0, 59.0, 96.0, 103.0, 128.0, 108.0, 89.0, 54.0, 40.0, 40.0, 30.0, 19.0, 20.0, 11.0, 8.0, 3.0, 5.0, 0.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0005736351013183594, -0.000559099018573761, -0.0005445629358291626, -0.0005300268530845642, -0.0005154907703399658, -0.0005009546875953674, -0.00048641860485076904, -0.00047188252210617065, -0.00045734643936157227, -0.0004428103566169739, -0.0004282742738723755, -0.0004137381911277771, -0.0003992021083831787, -0.0003846660256385803, -0.00037012994289398193, -0.00035559386014938354, -0.00034105777740478516, -0.00032652169466018677, -0.0003119856119155884, -0.00029744952917099, -0.0002829134464263916, -0.0002683773636817932, -0.0002538412809371948, -0.00023930519819259644, -0.00022476911544799805, -0.00021023303270339966, -0.00019569694995880127, -0.00018116086721420288, -0.0001666247844696045, -0.0001520887017250061, -0.00013755261898040771, -0.00012301653623580933, -0.00010848045349121094, -9.394437074661255e-05, -7.940828800201416e-05, -6.487220525741577e-05, -5.033612251281738e-05, -3.5800039768218994e-05, -2.1263957023620605e-05, -6.727874279022217e-06, 7.808208465576172e-06, 2.234429121017456e-05, 3.688037395477295e-05, 5.141645669937134e-05, 6.595253944396973e-05, 8.048862218856812e-05, 9.50247049331665e-05, 0.00010956078767776489, 0.00012409687042236328, 0.00013863295316696167, 0.00015316903591156006, 0.00016770511865615845, 0.00018224120140075684, 0.00019677728414535522, 0.0002113133668899536, 0.000225849449634552, 0.0002403855323791504, 0.0002549216151237488, 0.00026945769786834717, 0.00028399378061294556, 0.00029852986335754395, 0.00031306594610214233, 0.0003276020288467407, 0.0003421381115913391, 0.0003566741943359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 12.0, 19.0, 17.0, 35.0, 42.0, 50.0, 98.0, 158.0, 262.0, 414.0, 699.0, 1208.0, 2141.0, 3831.0, 7078.0, 13691.0, 27463.0, 58475.0, 138618.0, 304934.0, 271944.0, 116939.0, 50114.0, 23779.0, 12064.0, 6368.0, 3406.0, 1904.0, 1066.0, 646.0, 389.0, 244.0, 156.0, 90.0, 70.0, 39.0, 26.0, 24.0, 10.0, 9.0, 4.0, 8.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.61962890625, -0.599578857421875, -0.57952880859375, -0.559478759765625, -0.5394287109375, -0.519378662109375, -0.49932861328125, -0.479278564453125, -0.459228515625, -0.439178466796875, -0.41912841796875, -0.399078369140625, -0.3790283203125, -0.358978271484375, -0.33892822265625, -0.318878173828125, -0.298828125, -0.278778076171875, -0.25872802734375, -0.238677978515625, -0.2186279296875, -0.198577880859375, -0.17852783203125, -0.158477783203125, -0.138427734375, -0.118377685546875, -0.09832763671875, -0.078277587890625, -0.0582275390625, -0.038177490234375, -0.01812744140625, 0.001922607421875, 0.02197265625, 0.042022705078125, 0.06207275390625, 0.082122802734375, 0.1021728515625, 0.122222900390625, 0.14227294921875, 0.162322998046875, 0.182373046875, 0.202423095703125, 0.22247314453125, 0.242523193359375, 0.2625732421875, 0.282623291015625, 0.30267333984375, 0.322723388671875, 0.3427734375, 0.362823486328125, 0.38287353515625, 0.402923583984375, 0.4229736328125, 0.443023681640625, 0.46307373046875, 0.483123779296875, 0.503173828125, 0.523223876953125, 0.54327392578125, 0.563323974609375, 0.5833740234375, 0.603424072265625, 0.62347412109375, 0.643524169921875, 0.66357421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 4.0, 2.0, 6.0, 3.0, 7.0, 9.0, 6.0, 13.0, 8.0, 19.0, 24.0, 27.0, 32.0, 36.0, 40.0, 55.0, 58.0, 71.0, 71.0, 69.0, 73.0, 54.0, 73.0, 49.0, 30.0, 37.0, 19.0, 19.0, 14.0, 19.0, 11.0, 10.0, 5.0, 3.0, 5.0, 3.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.184326171875, -0.17853927612304688, -0.17275238037109375, -0.16696548461914062, -0.1611785888671875, -0.15539169311523438, -0.14960479736328125, -0.14381790161132812, -0.138031005859375, -0.13224411010742188, -0.12645721435546875, -0.12067031860351562, -0.1148834228515625, -0.10909652709960938, -0.10330963134765625, -0.09752273559570312, -0.09173583984375, -0.08594894409179688, -0.08016204833984375, -0.07437515258789062, -0.0685882568359375, -0.06280136108398438, -0.05701446533203125, -0.051227569580078125, -0.045440673828125, -0.039653778076171875, -0.03386688232421875, -0.028079986572265625, -0.0222930908203125, -0.016506195068359375, -0.01071929931640625, -0.004932403564453125, 0.0008544921875, 0.006641387939453125, 0.01242828369140625, 0.018215179443359375, 0.0240020751953125, 0.029788970947265625, 0.03557586669921875, 0.041362762451171875, 0.047149658203125, 0.052936553955078125, 0.05872344970703125, 0.06451034545898438, 0.0702972412109375, 0.07608413696289062, 0.08187103271484375, 0.08765792846679688, 0.09344482421875, 0.09923171997070312, 0.10501861572265625, 0.11080551147460938, 0.1165924072265625, 0.12237930297851562, 0.12816619873046875, 0.13395309448242188, 0.139739990234375, 0.14552688598632812, 0.15131378173828125, 0.15710067749023438, 0.1628875732421875, 0.16867446899414062, 0.17446136474609375, 0.18024826049804688, 0.18603515625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 13.0, 10.0, 13.0, 18.0, 15.0, 15.0, 34.0, 47.0, 53.0, 51.0, 55.0, 81.0, 81.0, 81.0, 71.0, 56.0, 52.0, 52.0, 43.0, 38.0, 38.0, 14.0, 18.0, 11.0, 10.0, 6.0, 3.0, 5.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-6.147309303283691, -5.9977803230285645, -5.8482513427734375, -5.6987223625183105, -5.549193382263184, -5.399663925170898, -5.2501349449157715, -5.1006059646606445, -4.951076984405518, -4.801548004150391, -4.652019023895264, -4.502490043640137, -4.352960586547852, -4.203431606292725, -4.053902626037598, -3.9043736457824707, -3.7548446655273438, -3.605315685272217, -3.45578670501709, -3.306257486343384, -3.156728506088257, -3.00719952583313, -2.857670307159424, -2.708141326904297, -2.55861234664917, -2.409083366394043, -2.259554386138916, -2.11002516746521, -1.960496187210083, -1.810967206954956, -1.6614381074905396, -1.511909008026123, -1.3623805046081543, -1.2128515243530273, -1.0633224248886108, -0.9137933850288391, -0.7642643451690674, -0.6147353053092957, -0.4652062654495239, -0.3156771659851074, -0.16614818572998047, -0.01661914587020874, 0.132909893989563, 0.2824389338493347, 0.43196797370910645, 0.5814970135688782, 0.7310260534286499, 0.8805551528930664, 1.0300841331481934, 1.1796131134033203, 1.3291422128677368, 1.4786713123321533, 1.6282002925872803, 1.7777292728424072, 1.9272583723068237, 2.0767874717712402, 2.226316452026367, 2.375845432281494, 2.525374412536621, 2.674903631210327, 2.824432611465454, 2.973961591720581, 3.123490810394287, 3.273019790649414, 3.422548770904541]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 9.0, 12.0, 4.0, 11.0, 18.0, 13.0, 29.0, 18.0, 34.0, 33.0, 29.0, 40.0, 37.0, 36.0, 55.0, 48.0, 49.0, 49.0, 48.0, 49.0, 51.0, 38.0, 38.0, 27.0, 35.0, 38.0, 37.0, 26.0, 24.0, 13.0, 11.0, 6.0, 11.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1414794921875, -3.027379035949707, -2.913278579711914, -2.799178123474121, -2.685077667236328, -2.570977210998535, -2.456876754760742, -2.342776298522949, -2.2286758422851562, -2.1145753860473633, -2.0004749298095703, -1.8863744735717773, -1.7722740173339844, -1.6581735610961914, -1.5440729856491089, -1.429972529411316, -1.3158719539642334, -1.2017714977264404, -1.0876710414886475, -0.9735705256462097, -0.8594700694084167, -0.7453696131706238, -0.631269097328186, -0.5171686410903931, -0.4030681848526001, -0.28896772861480713, -0.17486724257469177, -0.060766756534576416, 0.05333369970321655, 0.16743415594100952, 0.28153467178344727, 0.39563512802124023, 0.5097355842590332, 0.6238360404968262, 0.7379364967346191, 0.8520370125770569, 0.9661374688148499, 1.080237865447998, 1.1943384408950806, 1.3084388971328735, 1.4225393533706665, 1.5366398096084595, 1.6507402658462524, 1.764840841293335, 1.878941297531128, 1.993041753768921, 2.107142210006714, 2.221242666244507, 2.3353431224823, 2.4494435787200928, 2.5635440349578857, 2.6776444911956787, 2.7917449474334717, 2.9058454036712646, 3.0199460983276367, 3.1340465545654297, 3.2481470108032227, 3.3622474670410156, 3.4763479232788086, 3.5904483795166016, 3.7045488357543945, 3.8186492919921875, 3.9327497482299805, 4.046850204467773, 4.160950660705566]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 2.0, 9.0, 12.0, 22.0, 40.0, 56.0, 106.0, 182.0, 364.0, 905.0, 2425.0, 8018.0, 29229.0, 125563.0, 567568.0, 245083.0, 49814.0, 12992.0, 3755.0, 1309.0, 531.0, 270.0, 114.0, 84.0, 39.0, 24.0, 16.0, 10.0, 7.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-10.0859375, -9.8551025390625, -9.624267578125, -9.3934326171875, -9.16259765625, -8.9317626953125, -8.700927734375, -8.4700927734375, -8.2392578125, -8.0084228515625, -7.777587890625, -7.5467529296875, -7.31591796875, -7.0850830078125, -6.854248046875, -6.6234130859375, -6.392578125, -6.1617431640625, -5.930908203125, -5.7000732421875, -5.46923828125, -5.2384033203125, -5.007568359375, -4.7767333984375, -4.5458984375, -4.3150634765625, -4.084228515625, -3.8533935546875, -3.62255859375, -3.3917236328125, -3.160888671875, -2.9300537109375, -2.69921875, -2.4683837890625, -2.237548828125, -2.0067138671875, -1.77587890625, -1.5450439453125, -1.314208984375, -1.0833740234375, -0.8525390625, -0.6217041015625, -0.390869140625, -0.1600341796875, 0.07080078125, 0.3016357421875, 0.532470703125, 0.7633056640625, 0.994140625, 1.2249755859375, 1.455810546875, 1.6866455078125, 1.91748046875, 2.1483154296875, 2.379150390625, 2.6099853515625, 2.8408203125, 3.0716552734375, 3.302490234375, 3.5333251953125, 3.76416015625, 3.9949951171875, 4.225830078125, 4.4566650390625, 4.6875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 9.0, 9.0, 12.0, 20.0, 19.0, 25.0, 28.0, 21.0, 20.0, 39.0, 32.0, 34.0, 35.0, 49.0, 59.0, 57.0, 42.0, 46.0, 53.0, 49.0, 53.0, 42.0, 35.0, 27.0, 35.0, 26.0, 31.0, 17.0, 15.0, 9.0, 13.0, 7.0, 4.0, 6.0, 6.0, 3.0, 1.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.39453125, -7.15264892578125, -6.9107666015625, -6.66888427734375, -6.427001953125, -6.18511962890625, -5.9432373046875, -5.70135498046875, -5.45947265625, -5.21759033203125, -4.9757080078125, -4.73382568359375, -4.491943359375, -4.25006103515625, -4.0081787109375, -3.76629638671875, -3.5244140625, -3.28253173828125, -3.0406494140625, -2.79876708984375, -2.556884765625, -2.31500244140625, -2.0731201171875, -1.83123779296875, -1.58935546875, -1.34747314453125, -1.1055908203125, -0.86370849609375, -0.621826171875, -0.37994384765625, -0.1380615234375, 0.10382080078125, 0.345703125, 0.58758544921875, 0.8294677734375, 1.07135009765625, 1.313232421875, 1.55511474609375, 1.7969970703125, 2.03887939453125, 2.28076171875, 2.52264404296875, 2.7645263671875, 3.00640869140625, 3.248291015625, 3.49017333984375, 3.7320556640625, 3.97393798828125, 4.2158203125, 4.45770263671875, 4.6995849609375, 4.94146728515625, 5.183349609375, 5.42523193359375, 5.6671142578125, 5.90899658203125, 6.15087890625, 6.39276123046875, 6.6346435546875, 6.87652587890625, 7.118408203125, 7.36029052734375, 7.6021728515625, 7.84405517578125, 8.0859375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 10.0, 7.0, 15.0, 22.0, 27.0, 52.0, 67.0, 139.0, 315.0, 808.0, 3521.0, 21999.0, 197268.0, 713207.0, 95888.0, 11910.0, 2158.0, 560.0, 254.0, 107.0, 81.0, 53.0, 35.0, 16.0, 12.0, 7.0, 5.0, 5.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.859375, -9.5545654296875, -9.249755859375, -8.9449462890625, -8.64013671875, -8.3353271484375, -8.030517578125, -7.7257080078125, -7.4208984375, -7.1160888671875, -6.811279296875, -6.5064697265625, -6.20166015625, -5.8968505859375, -5.592041015625, -5.2872314453125, -4.982421875, -4.6776123046875, -4.372802734375, -4.0679931640625, -3.76318359375, -3.4583740234375, -3.153564453125, -2.8487548828125, -2.5439453125, -2.2391357421875, -1.934326171875, -1.6295166015625, -1.32470703125, -1.0198974609375, -0.715087890625, -0.4102783203125, -0.10546875, 0.1993408203125, 0.504150390625, 0.8089599609375, 1.11376953125, 1.4185791015625, 1.723388671875, 2.0281982421875, 2.3330078125, 2.6378173828125, 2.942626953125, 3.2474365234375, 3.55224609375, 3.8570556640625, 4.161865234375, 4.4666748046875, 4.771484375, 5.0762939453125, 5.381103515625, 5.6859130859375, 5.99072265625, 6.2955322265625, 6.600341796875, 6.9051513671875, 7.2099609375, 7.5147705078125, 7.819580078125, 8.1243896484375, 8.42919921875, 8.7340087890625, 9.038818359375, 9.3436279296875, 9.6484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 7.0, 3.0, 3.0, 5.0, 10.0, 7.0, 7.0, 11.0, 17.0, 20.0, 14.0, 26.0, 25.0, 27.0, 36.0, 51.0, 45.0, 46.0, 42.0, 57.0, 56.0, 51.0, 48.0, 49.0, 38.0, 51.0, 33.0, 38.0, 38.0, 20.0, 18.0, 25.0, 15.0, 5.0, 15.0, 13.0, 12.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 7.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.8828125, -8.6182861328125, -8.353759765625, -8.0892333984375, -7.82470703125, -7.5601806640625, -7.295654296875, -7.0311279296875, -6.7666015625, -6.5020751953125, -6.237548828125, -5.9730224609375, -5.70849609375, -5.4439697265625, -5.179443359375, -4.9149169921875, -4.650390625, -4.3858642578125, -4.121337890625, -3.8568115234375, -3.59228515625, -3.3277587890625, -3.063232421875, -2.7987060546875, -2.5341796875, -2.2696533203125, -2.005126953125, -1.7406005859375, -1.47607421875, -1.2115478515625, -0.947021484375, -0.6824951171875, -0.41796875, -0.1534423828125, 0.111083984375, 0.3756103515625, 0.64013671875, 0.9046630859375, 1.169189453125, 1.4337158203125, 1.6982421875, 1.9627685546875, 2.227294921875, 2.4918212890625, 2.75634765625, 3.0208740234375, 3.285400390625, 3.5499267578125, 3.814453125, 4.0789794921875, 4.343505859375, 4.6080322265625, 4.87255859375, 5.1370849609375, 5.401611328125, 5.6661376953125, 5.9306640625, 6.1951904296875, 6.459716796875, 6.7242431640625, 6.98876953125, 7.2532958984375, 7.517822265625, 7.7823486328125, 8.046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 4.0, 8.0, 4.0, 7.0, 8.0, 18.0, 19.0, 14.0, 32.0, 37.0, 74.0, 91.0, 181.0, 325.0, 614.0, 1290.0, 2950.0, 6953.0, 18706.0, 58429.0, 236936.0, 519584.0, 141358.0, 38378.0, 12954.0, 5156.0, 2143.0, 1019.0, 531.0, 259.0, 151.0, 104.0, 67.0, 35.0, 34.0, 28.0, 16.0, 17.0, 5.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.380859375, -1.333770751953125, -1.28668212890625, -1.239593505859375, -1.1925048828125, -1.145416259765625, -1.09832763671875, -1.051239013671875, -1.004150390625, -0.957061767578125, -0.90997314453125, -0.862884521484375, -0.8157958984375, -0.768707275390625, -0.72161865234375, -0.674530029296875, -0.62744140625, -0.580352783203125, -0.53326416015625, -0.486175537109375, -0.4390869140625, -0.391998291015625, -0.34490966796875, -0.297821044921875, -0.250732421875, -0.203643798828125, -0.15655517578125, -0.109466552734375, -0.0623779296875, -0.015289306640625, 0.03179931640625, 0.078887939453125, 0.1259765625, 0.173065185546875, 0.22015380859375, 0.267242431640625, 0.3143310546875, 0.361419677734375, 0.40850830078125, 0.455596923828125, 0.502685546875, 0.549774169921875, 0.59686279296875, 0.643951416015625, 0.6910400390625, 0.738128662109375, 0.78521728515625, 0.832305908203125, 0.87939453125, 0.926483154296875, 0.97357177734375, 1.020660400390625, 1.0677490234375, 1.114837646484375, 1.16192626953125, 1.209014892578125, 1.256103515625, 1.303192138671875, 1.35028076171875, 1.397369384765625, 1.4444580078125, 1.491546630859375, 1.53863525390625, 1.585723876953125, 1.6328125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 10.0, 13.0, 11.0, 19.0, 17.0, 21.0, 37.0, 42.0, 43.0, 86.0, 94.0, 157.0, 102.0, 79.0, 63.0, 47.0, 43.0, 28.0, 18.0, 20.0, 8.0, 7.0, 5.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00039315223693847656, -0.00038371607661247253, -0.0003742799162864685, -0.0003648437559604645, -0.00035540759563446045, -0.0003459714353084564, -0.0003365352749824524, -0.00032709911465644836, -0.00031766295433044434, -0.0003082267940044403, -0.0002987906336784363, -0.00028935447335243225, -0.0002799183130264282, -0.0002704821527004242, -0.00026104599237442017, -0.00025160983204841614, -0.0002421736717224121, -0.00023273751139640808, -0.00022330135107040405, -0.00021386519074440002, -0.000204429030418396, -0.00019499287009239197, -0.00018555670976638794, -0.0001761205494403839, -0.00016668438911437988, -0.00015724822878837585, -0.00014781206846237183, -0.0001383759081363678, -0.00012893974781036377, -0.00011950358748435974, -0.00011006742715835571, -0.00010063126683235168, -9.119510650634766e-05, -8.175894618034363e-05, -7.23227858543396e-05, -6.288662552833557e-05, -5.345046520233154e-05, -4.4014304876327515e-05, -3.4578144550323486e-05, -2.5141984224319458e-05, -1.570582389831543e-05, -6.269663572311401e-06, 3.166496753692627e-06, 1.2602657079696655e-05, 2.2038817405700684e-05, 3.147497773170471e-05, 4.091113805770874e-05, 5.034729838371277e-05, 5.97834587097168e-05, 6.921961903572083e-05, 7.865577936172485e-05, 8.809193968772888e-05, 9.752810001373291e-05, 0.00010696426033973694, 0.00011640042066574097, 0.000125836580991745, 0.00013527274131774902, 0.00014470890164375305, 0.00015414506196975708, 0.0001635812222957611, 0.00017301738262176514, 0.00018245354294776917, 0.0001918897032737732, 0.00020132586359977722, 0.00021076202392578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 11.0, 10.0, 11.0, 26.0, 36.0, 61.0, 139.0, 213.0, 414.0, 876.0, 1906.0, 4423.0, 11017.0, 32182.0, 127593.0, 492744.0, 280834.0, 64512.0, 18755.0, 7179.0, 2938.0, 1313.0, 619.0, 338.0, 165.0, 79.0, 63.0, 22.0, 19.0, 13.0, 11.0, 6.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7138671875, -1.659912109375, -1.60595703125, -1.552001953125, -1.498046875, -1.444091796875, -1.39013671875, -1.336181640625, -1.2822265625, -1.228271484375, -1.17431640625, -1.120361328125, -1.06640625, -1.012451171875, -0.95849609375, -0.904541015625, -0.8505859375, -0.796630859375, -0.74267578125, -0.688720703125, -0.634765625, -0.580810546875, -0.52685546875, -0.472900390625, -0.4189453125, -0.364990234375, -0.31103515625, -0.257080078125, -0.203125, -0.149169921875, -0.09521484375, -0.041259765625, 0.0126953125, 0.066650390625, 0.12060546875, 0.174560546875, 0.228515625, 0.282470703125, 0.33642578125, 0.390380859375, 0.4443359375, 0.498291015625, 0.55224609375, 0.606201171875, 0.66015625, 0.714111328125, 0.76806640625, 0.822021484375, 0.8759765625, 0.929931640625, 0.98388671875, 1.037841796875, 1.091796875, 1.145751953125, 1.19970703125, 1.253662109375, 1.3076171875, 1.361572265625, 1.41552734375, 1.469482421875, 1.5234375, 1.577392578125, 1.63134765625, 1.685302734375, 1.7392578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 1.0, 6.0, 4.0, 8.0, 12.0, 10.0, 16.0, 18.0, 21.0, 27.0, 27.0, 36.0, 54.0, 52.0, 65.0, 80.0, 91.0, 95.0, 62.0, 61.0, 43.0, 29.0, 42.0, 28.0, 21.0, 20.0, 16.0, 6.0, 7.0, 5.0, 8.0, 5.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.74365234375, -0.7202911376953125, -0.696929931640625, -0.6735687255859375, -0.65020751953125, -0.6268463134765625, -0.603485107421875, -0.5801239013671875, -0.5567626953125, -0.5334014892578125, -0.510040283203125, -0.4866790771484375, -0.46331787109375, -0.4399566650390625, -0.416595458984375, -0.3932342529296875, -0.369873046875, -0.3465118408203125, -0.323150634765625, -0.2997894287109375, -0.27642822265625, -0.2530670166015625, -0.229705810546875, -0.2063446044921875, -0.1829833984375, -0.1596221923828125, -0.136260986328125, -0.1128997802734375, -0.08953857421875, -0.0661773681640625, -0.042816162109375, -0.0194549560546875, 0.00390625, 0.0272674560546875, 0.050628662109375, 0.0739898681640625, 0.09735107421875, 0.1207122802734375, 0.144073486328125, 0.1674346923828125, 0.1907958984375, 0.2141571044921875, 0.237518310546875, 0.2608795166015625, 0.28424072265625, 0.3076019287109375, 0.330963134765625, 0.3543243408203125, 0.377685546875, 0.4010467529296875, 0.424407958984375, 0.4477691650390625, 0.47113037109375, 0.4944915771484375, 0.517852783203125, 0.5412139892578125, 0.5645751953125, 0.5879364013671875, 0.611297607421875, 0.6346588134765625, 0.65802001953125, 0.6813812255859375, 0.704742431640625, 0.7281036376953125, 0.75146484375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 14.0, 50.0, 120.0, 199.0, 273.0, 177.0, 98.0, 44.0, 17.0, 8.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.93746566772461, -15.840030670166016, -14.742594718933105, -13.645158767700195, -12.547723770141602, -11.450288772583008, -10.352852821350098, -9.255416870117188, -8.157981872558594, -7.060546398162842, -5.96311092376709, -4.865675449371338, -3.768239974975586, -2.670804500579834, -1.573369026184082, -0.4759335517883301, 0.6215019226074219, 1.7189373970031738, 2.816372871398926, 3.9138083457946777, 5.01124382019043, 6.108679294586182, 7.206114768981934, 8.303550720214844, 9.400985717773438, 10.498420715332031, 11.595856666564941, 12.693292617797852, 13.790727615356445, 14.888162612915039, 15.98559856414795, 17.08303451538086, 18.180469512939453, 19.277904510498047, 20.37533950805664, 21.472776412963867, 22.57021141052246, 23.667646408081055, 24.76508331298828, 25.862518310546875, 26.95995330810547, 28.057388305664062, 29.154823303222656, 30.252260208129883, 31.349695205688477, 32.4471321105957, 33.5445671081543, 34.64200210571289, 35.739437103271484, 36.83687210083008, 37.93430709838867, 39.031742095947266, 40.129180908203125, 41.22661590576172, 42.32405090332031, 43.421485900878906, 44.5189208984375, 45.616355895996094, 46.71379089355469, 47.81122589111328, 48.908660888671875, 50.006099700927734, 51.10353469848633, 52.20096969604492, 53.298404693603516]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 8.0, 8.0, 6.0, 6.0, 12.0, 14.0, 13.0, 6.0, 16.0, 14.0, 26.0, 22.0, 25.0, 30.0, 29.0, 48.0, 35.0, 47.0, 45.0, 42.0, 35.0, 50.0, 51.0, 51.0, 54.0, 35.0, 33.0, 33.0, 34.0, 24.0, 27.0, 29.0, 18.0, 13.0, 13.0, 9.0, 17.0, 7.0, 6.0, 8.0, 3.0, 5.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.889911651611328, -11.467150688171387, -11.044390678405762, -10.62162971496582, -10.198869705200195, -9.776108741760254, -9.353347778320312, -8.930587768554688, -8.507827758789062, -8.085066795349121, -7.662306785583496, -7.239545822143555, -6.81678581237793, -6.394024848937988, -5.971264362335205, -5.548503875732422, -5.1257429122924805, -4.702982425689697, -4.280221939086914, -3.8574612140655518, -3.4347007274627686, -3.0119402408599854, -2.589179515838623, -2.16641902923584, -1.7436585426330566, -1.3208980560302734, -0.8981374502182007, -0.47537684440612793, -0.05261635780334473, 0.3701441287994385, 0.7929048538208008, 1.215665340423584, 1.6384258270263672, 2.0611863136291504, 2.4839468002319336, 2.906707525253296, 3.329468011856079, 3.7522284984588623, 4.174989223480225, 4.597749710083008, 5.020510196685791, 5.443270683288574, 5.866031169891357, 6.288791656494141, 6.711552619934082, 7.134312629699707, 7.557073593139648, 7.979834079742432, 8.402594566345215, 8.825355529785156, 9.248115539550781, 9.670876502990723, 10.093636512756348, 10.516397476196289, 10.939157485961914, 11.361918449401855, 11.784679412841797, 12.207440376281738, 12.630200386047363, 13.052961349487305, 13.47572135925293, 13.898482322692871, 14.321243286132812, 14.744003295898438, 15.166763305664062]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 1.0, 7.0, 6.0, 9.0, 4.0, 7.0, 24.0, 29.0, 31.0, 35.0, 55.0, 67.0, 103.0, 163.0, 243.0, 467.0, 806.0, 1824.0, 4148.0, 11402.0, 41803.0, 303825.0, 2725775.0, 985536.0, 86759.0, 19189.0, 6420.0, 2634.0, 1190.0, 611.0, 339.0, 240.0, 140.0, 84.0, 78.0, 53.0, 45.0, 35.0, 24.0, 18.0, 13.0, 10.0, 9.0, 5.0, 7.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-8.65625, -8.3917236328125, -8.127197265625, -7.8626708984375, -7.59814453125, -7.3336181640625, -7.069091796875, -6.8045654296875, -6.5400390625, -6.2755126953125, -6.010986328125, -5.7464599609375, -5.48193359375, -5.2174072265625, -4.952880859375, -4.6883544921875, -4.423828125, -4.1593017578125, -3.894775390625, -3.6302490234375, -3.36572265625, -3.1011962890625, -2.836669921875, -2.5721435546875, -2.3076171875, -2.0430908203125, -1.778564453125, -1.5140380859375, -1.24951171875, -0.9849853515625, -0.720458984375, -0.4559326171875, -0.19140625, 0.0731201171875, 0.337646484375, 0.6021728515625, 0.86669921875, 1.1312255859375, 1.395751953125, 1.6602783203125, 1.9248046875, 2.1893310546875, 2.453857421875, 2.7183837890625, 2.98291015625, 3.2474365234375, 3.511962890625, 3.7764892578125, 4.041015625, 4.3055419921875, 4.570068359375, 4.8345947265625, 5.09912109375, 5.3636474609375, 5.628173828125, 5.8927001953125, 6.1572265625, 6.4217529296875, 6.686279296875, 6.9508056640625, 7.21533203125, 7.4798583984375, 7.744384765625, 8.0089111328125, 8.2734375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 5.0, 10.0, 8.0, 17.0, 14.0, 19.0, 17.0, 24.0, 19.0, 29.0, 29.0, 36.0, 44.0, 37.0, 39.0, 53.0, 54.0, 52.0, 57.0, 35.0, 34.0, 44.0, 44.0, 33.0, 41.0, 27.0, 24.0, 32.0, 27.0, 25.0, 10.0, 10.0, 10.0, 6.0, 7.0, 6.0, 2.0, 6.0, 2.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.236328125, -3.12359619140625, -3.0108642578125, -2.89813232421875, -2.785400390625, -2.67266845703125, -2.5599365234375, -2.44720458984375, -2.33447265625, -2.22174072265625, -2.1090087890625, -1.99627685546875, -1.883544921875, -1.77081298828125, -1.6580810546875, -1.54534912109375, -1.4326171875, -1.31988525390625, -1.2071533203125, -1.09442138671875, -0.981689453125, -0.86895751953125, -0.7562255859375, -0.64349365234375, -0.53076171875, -0.41802978515625, -0.3052978515625, -0.19256591796875, -0.079833984375, 0.03289794921875, 0.1456298828125, 0.25836181640625, 0.37109375, 0.48382568359375, 0.5965576171875, 0.70928955078125, 0.822021484375, 0.93475341796875, 1.0474853515625, 1.16021728515625, 1.27294921875, 1.38568115234375, 1.4984130859375, 1.61114501953125, 1.723876953125, 1.83660888671875, 1.9493408203125, 2.06207275390625, 2.1748046875, 2.28753662109375, 2.4002685546875, 2.51300048828125, 2.625732421875, 2.73846435546875, 2.8511962890625, 2.96392822265625, 3.07666015625, 3.18939208984375, 3.3021240234375, 3.41485595703125, 3.527587890625, 3.64031982421875, 3.7530517578125, 3.86578369140625, 3.978515625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 6.0, 8.0, 5.0, 14.0, 5.0, 24.0, 23.0, 32.0, 39.0, 47.0, 98.0, 150.0, 261.0, 559.0, 1253.0, 3421.0, 11540.0, 48002.0, 314302.0, 2934529.0, 770415.0, 83217.0, 17926.0, 5082.0, 1740.0, 682.0, 319.0, 190.0, 88.0, 87.0, 49.0, 43.0, 25.0, 26.0, 13.0, 12.0, 13.0, 7.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.7421875, -7.48974609375, -7.2373046875, -6.98486328125, -6.732421875, -6.47998046875, -6.2275390625, -5.97509765625, -5.72265625, -5.47021484375, -5.2177734375, -4.96533203125, -4.712890625, -4.46044921875, -4.2080078125, -3.95556640625, -3.703125, -3.45068359375, -3.1982421875, -2.94580078125, -2.693359375, -2.44091796875, -2.1884765625, -1.93603515625, -1.68359375, -1.43115234375, -1.1787109375, -0.92626953125, -0.673828125, -0.42138671875, -0.1689453125, 0.08349609375, 0.3359375, 0.58837890625, 0.8408203125, 1.09326171875, 1.345703125, 1.59814453125, 1.8505859375, 2.10302734375, 2.35546875, 2.60791015625, 2.8603515625, 3.11279296875, 3.365234375, 3.61767578125, 3.8701171875, 4.12255859375, 4.375, 4.62744140625, 4.8798828125, 5.13232421875, 5.384765625, 5.63720703125, 5.8896484375, 6.14208984375, 6.39453125, 6.64697265625, 6.8994140625, 7.15185546875, 7.404296875, 7.65673828125, 7.9091796875, 8.16162109375, 8.4140625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 8.0, 8.0, 10.0, 12.0, 21.0, 23.0, 24.0, 34.0, 51.0, 35.0, 60.0, 86.0, 109.0, 151.0, 227.0, 276.0, 338.0, 428.0, 419.0, 382.0, 320.0, 270.0, 168.0, 163.0, 93.0, 83.0, 75.0, 44.0, 20.0, 37.0, 21.0, 22.0, 11.0, 7.0, 7.0, 7.0, 3.0, 10.0, 2.0, 4.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.951171875, -1.888824462890625, -1.82647705078125, -1.764129638671875, -1.7017822265625, -1.639434814453125, -1.57708740234375, -1.514739990234375, -1.452392578125, -1.390045166015625, -1.32769775390625, -1.265350341796875, -1.2030029296875, -1.140655517578125, -1.07830810546875, -1.015960693359375, -0.95361328125, -0.891265869140625, -0.82891845703125, -0.766571044921875, -0.7042236328125, -0.641876220703125, -0.57952880859375, -0.517181396484375, -0.454833984375, -0.392486572265625, -0.33013916015625, -0.267791748046875, -0.2054443359375, -0.143096923828125, -0.08074951171875, -0.018402099609375, 0.0439453125, 0.106292724609375, 0.16864013671875, 0.230987548828125, 0.2933349609375, 0.355682373046875, 0.41802978515625, 0.480377197265625, 0.542724609375, 0.605072021484375, 0.66741943359375, 0.729766845703125, 0.7921142578125, 0.854461669921875, 0.91680908203125, 0.979156494140625, 1.04150390625, 1.103851318359375, 1.16619873046875, 1.228546142578125, 1.2908935546875, 1.353240966796875, 1.41558837890625, 1.477935791015625, 1.540283203125, 1.602630615234375, 1.66497802734375, 1.727325439453125, 1.7896728515625, 1.852020263671875, 1.91436767578125, 1.976715087890625, 2.0390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 6.0, 5.0, 9.0, 3.0, 10.0, 12.0, 10.0, 17.0, 16.0, 24.0, 28.0, 40.0, 44.0, 44.0, 42.0, 67.0, 43.0, 53.0, 50.0, 52.0, 45.0, 61.0, 48.0, 41.0, 36.0, 29.0, 18.0, 30.0, 20.0, 21.0, 18.0, 16.0, 12.0, 10.0, 6.0, 6.0, 1.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.964389801025391, -5.785422325134277, -5.606454849243164, -5.427487850189209, -5.248520374298096, -5.069552898406982, -4.890585422515869, -4.711618423461914, -4.532650947570801, -4.3536834716796875, -4.174715995788574, -3.99574875831604, -3.816781520843506, -3.6378140449523926, -3.4588465690612793, -3.279879331588745, -3.100911855697632, -2.9219443798065186, -2.7429771423339844, -2.564009666442871, -2.385042428970337, -2.2060749530792236, -2.0271077156066895, -1.8481402397155762, -1.6691728830337524, -1.4902055263519287, -1.311238169670105, -1.1322708129882812, -0.9533033967018127, -0.774336040019989, -0.5953686237335205, -0.4164012670516968, -0.23743391036987305, -0.05846653878688812, 0.1205008327960968, 0.2994682192802429, 0.47843557596206665, 0.6574029326438904, 0.8363703489303589, 1.0153377056121826, 1.1943050622940063, 1.37327241897583, 1.5522397756576538, 1.7312071323394775, 1.9101746082305908, 2.089141845703125, 2.2681093215942383, 2.4470767974853516, 2.6260440349578857, 2.805011510848999, 2.983978748321533, 3.1629462242126465, 3.3419134616851807, 3.520880937576294, 3.699848175048828, 3.8788156509399414, 4.057783126831055, 4.236750602722168, 4.415718078613281, 4.594685077667236, 4.77365255355835, 4.952620029449463, 5.131587505340576, 5.310554504394531, 5.4895219802856445]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 5.0, 1.0, 5.0, 10.0, 6.0, 17.0, 12.0, 13.0, 25.0, 18.0, 19.0, 20.0, 33.0, 24.0, 32.0, 24.0, 30.0, 40.0, 39.0, 37.0, 41.0, 47.0, 52.0, 40.0, 33.0, 43.0, 42.0, 32.0, 31.0, 20.0, 30.0, 25.0, 26.0, 24.0, 15.0, 19.0, 20.0, 16.0, 11.0, 9.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.539618968963623, -4.399634838104248, -4.259650707244873, -4.119666576385498, -3.979682445526123, -3.839698314666748, -3.699714422225952, -3.559730291366577, -3.419746160507202, -3.279762029647827, -3.139777898788452, -2.999793767929077, -2.8598098754882812, -2.7198257446289062, -2.5798416137695312, -2.4398574829101562, -2.2998733520507812, -2.1598892211914062, -2.0199050903320312, -1.8799210786819458, -1.7399369478225708, -1.5999528169631958, -1.4599688053131104, -1.3199846744537354, -1.1800005435943604, -1.0400164127349854, -0.9000323414802551, -0.7600482702255249, -0.6200641393661499, -0.4800800085067749, -0.3400959372520447, -0.20011186599731445, -0.06012773513793945, 0.07985636591911316, 0.21984046697616577, 0.3598245680332184, 0.499808669090271, 0.639792799949646, 0.7797768712043762, 0.9197609424591064, 1.0597450733184814, 1.1997292041778564, 1.3397133350372314, 1.479697346687317, 1.619681477546692, 1.759665608406067, 1.8996496200561523, 2.0396337509155273, 2.1796178817749023, 2.3196020126342773, 2.4595861434936523, 2.5995702743530273, 2.7395544052124023, 2.8795385360717773, 3.0195224285125732, 3.1595065593719482, 3.2994906902313232, 3.4394748210906982, 3.5794589519500732, 3.7194430828094482, 3.859426975250244, 3.999411106109619, 4.139395236968994, 4.279379367828369, 4.419363498687744]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 3.0, 12.0, 13.0, 16.0, 11.0, 30.0, 46.0, 65.0, 105.0, 206.0, 330.0, 534.0, 911.0, 1569.0, 2572.0, 4225.0, 7941.0, 28675.0, 288489.0, 600814.0, 85374.0, 12833.0, 5564.0, 3301.0, 1919.0, 1228.0, 685.0, 411.0, 248.0, 144.0, 87.0, 56.0, 45.0, 32.0, 16.0, 11.0, 9.0, 9.0, 4.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9189453125, -1.8575286865234375, -1.796112060546875, -1.7346954345703125, -1.67327880859375, -1.6118621826171875, -1.550445556640625, -1.4890289306640625, -1.4276123046875, -1.3661956787109375, -1.304779052734375, -1.2433624267578125, -1.18194580078125, -1.1205291748046875, -1.059112548828125, -0.9976959228515625, -0.936279296875, -0.8748626708984375, -0.813446044921875, -0.7520294189453125, -0.69061279296875, -0.6291961669921875, -0.567779541015625, -0.5063629150390625, -0.4449462890625, -0.3835296630859375, -0.322113037109375, -0.2606964111328125, -0.19927978515625, -0.1378631591796875, -0.076446533203125, -0.0150299072265625, 0.04638671875, 0.1078033447265625, 0.169219970703125, 0.2306365966796875, 0.29205322265625, 0.3534698486328125, 0.414886474609375, 0.4763031005859375, 0.5377197265625, 0.5991363525390625, 0.660552978515625, 0.7219696044921875, 0.78338623046875, 0.8448028564453125, 0.906219482421875, 0.9676361083984375, 1.029052734375, 1.0904693603515625, 1.151885986328125, 1.2133026123046875, 1.27471923828125, 1.3361358642578125, 1.397552490234375, 1.4589691162109375, 1.5203857421875, 1.5818023681640625, 1.643218994140625, 1.7046356201171875, 1.76605224609375, 1.8274688720703125, 1.888885498046875, 1.9503021240234375, 2.01171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 2.0, 5.0, 9.0, 9.0, 14.0, 20.0, 13.0, 24.0, 26.0, 19.0, 28.0, 32.0, 36.0, 49.0, 33.0, 37.0, 52.0, 42.0, 49.0, 51.0, 48.0, 39.0, 40.0, 44.0, 41.0, 23.0, 44.0, 26.0, 22.0, 22.0, 18.0, 14.0, 11.0, 13.0, 9.0, 5.0, 8.0, 7.0, 4.0, 7.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.302734375, -3.201812744140625, -3.10089111328125, -2.999969482421875, -2.8990478515625, -2.798126220703125, -2.69720458984375, -2.596282958984375, -2.495361328125, -2.394439697265625, -2.29351806640625, -2.192596435546875, -2.0916748046875, -1.990753173828125, -1.88983154296875, -1.788909912109375, -1.68798828125, -1.587066650390625, -1.48614501953125, -1.385223388671875, -1.2843017578125, -1.183380126953125, -1.08245849609375, -0.981536865234375, -0.880615234375, -0.779693603515625, -0.67877197265625, -0.577850341796875, -0.4769287109375, -0.376007080078125, -0.27508544921875, -0.174163818359375, -0.0732421875, 0.027679443359375, 0.12860107421875, 0.229522705078125, 0.3304443359375, 0.431365966796875, 0.53228759765625, 0.633209228515625, 0.734130859375, 0.835052490234375, 0.93597412109375, 1.036895751953125, 1.1378173828125, 1.238739013671875, 1.33966064453125, 1.440582275390625, 1.54150390625, 1.642425537109375, 1.74334716796875, 1.844268798828125, 1.9451904296875, 2.046112060546875, 2.14703369140625, 2.247955322265625, 2.348876953125, 2.449798583984375, 2.55072021484375, 2.651641845703125, 2.7525634765625, 2.853485107421875, 2.95440673828125, 3.055328369140625, 3.15625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 7.0, 8.0, 8.0, 19.0, 30.0, 52.0, 63.0, 100.0, 187.0, 340.0, 522.0, 1151.0, 2401.0, 5574.0, 19220.0, 290957.0, 665335.0, 47723.0, 8433.0, 3215.0, 1506.0, 726.0, 379.0, 214.0, 113.0, 87.0, 51.0, 41.0, 21.0, 12.0, 17.0, 9.0, 10.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.150390625, -2.079193115234375, -2.00799560546875, -1.936798095703125, -1.8656005859375, -1.794403076171875, -1.72320556640625, -1.652008056640625, -1.580810546875, -1.509613037109375, -1.43841552734375, -1.367218017578125, -1.2960205078125, -1.224822998046875, -1.15362548828125, -1.082427978515625, -1.01123046875, -0.940032958984375, -0.86883544921875, -0.797637939453125, -0.7264404296875, -0.655242919921875, -0.58404541015625, -0.512847900390625, -0.441650390625, -0.370452880859375, -0.29925537109375, -0.228057861328125, -0.1568603515625, -0.085662841796875, -0.01446533203125, 0.056732177734375, 0.1279296875, 0.199127197265625, 0.27032470703125, 0.341522216796875, 0.4127197265625, 0.483917236328125, 0.55511474609375, 0.626312255859375, 0.697509765625, 0.768707275390625, 0.83990478515625, 0.911102294921875, 0.9822998046875, 1.053497314453125, 1.12469482421875, 1.195892333984375, 1.26708984375, 1.338287353515625, 1.40948486328125, 1.480682373046875, 1.5518798828125, 1.623077392578125, 1.69427490234375, 1.765472412109375, 1.836669921875, 1.907867431640625, 1.97906494140625, 2.050262451171875, 2.1214599609375, 2.192657470703125, 2.26385498046875, 2.335052490234375, 2.40625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 5.0, 3.0, 6.0, 16.0, 9.0, 17.0, 12.0, 18.0, 23.0, 28.0, 21.0, 29.0, 39.0, 37.0, 43.0, 31.0, 43.0, 56.0, 50.0, 55.0, 52.0, 38.0, 40.0, 52.0, 38.0, 28.0, 18.0, 29.0, 28.0, 27.0, 14.0, 18.0, 17.0, 10.0, 6.0, 11.0, 5.0, 4.0, 6.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4609375, -6.223388671875, -5.98583984375, -5.748291015625, -5.5107421875, -5.273193359375, -5.03564453125, -4.798095703125, -4.560546875, -4.322998046875, -4.08544921875, -3.847900390625, -3.6103515625, -3.372802734375, -3.13525390625, -2.897705078125, -2.66015625, -2.422607421875, -2.18505859375, -1.947509765625, -1.7099609375, -1.472412109375, -1.23486328125, -0.997314453125, -0.759765625, -0.522216796875, -0.28466796875, -0.047119140625, 0.1904296875, 0.427978515625, 0.66552734375, 0.903076171875, 1.140625, 1.378173828125, 1.61572265625, 1.853271484375, 2.0908203125, 2.328369140625, 2.56591796875, 2.803466796875, 3.041015625, 3.278564453125, 3.51611328125, 3.753662109375, 3.9912109375, 4.228759765625, 4.46630859375, 4.703857421875, 4.94140625, 5.178955078125, 5.41650390625, 5.654052734375, 5.8916015625, 6.129150390625, 6.36669921875, 6.604248046875, 6.841796875, 7.079345703125, 7.31689453125, 7.554443359375, 7.7919921875, 8.029541015625, 8.26708984375, 8.504638671875, 8.7421875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 12.0, 8.0, 18.0, 29.0, 36.0, 60.0, 122.0, 173.0, 281.0, 473.0, 922.0, 1872.0, 4006.0, 9505.0, 34418.0, 415449.0, 520931.0, 41391.0, 10496.0, 4179.0, 1983.0, 919.0, 504.0, 306.0, 179.0, 114.0, 49.0, 43.0, 31.0, 15.0, 7.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0029296875, -0.9671783447265625, -0.931427001953125, -0.8956756591796875, -0.85992431640625, -0.8241729736328125, -0.788421630859375, -0.7526702880859375, -0.7169189453125, -0.6811676025390625, -0.645416259765625, -0.6096649169921875, -0.57391357421875, -0.5381622314453125, -0.502410888671875, -0.4666595458984375, -0.430908203125, -0.3951568603515625, -0.359405517578125, -0.3236541748046875, -0.28790283203125, -0.2521514892578125, -0.216400146484375, -0.1806488037109375, -0.1448974609375, -0.1091461181640625, -0.073394775390625, -0.0376434326171875, -0.00189208984375, 0.0338592529296875, 0.069610595703125, 0.1053619384765625, 0.14111328125, 0.1768646240234375, 0.212615966796875, 0.2483673095703125, 0.28411865234375, 0.3198699951171875, 0.355621337890625, 0.3913726806640625, 0.4271240234375, 0.4628753662109375, 0.498626708984375, 0.5343780517578125, 0.57012939453125, 0.6058807373046875, 0.641632080078125, 0.6773834228515625, 0.713134765625, 0.7488861083984375, 0.784637451171875, 0.8203887939453125, 0.85614013671875, 0.8918914794921875, 0.927642822265625, 0.9633941650390625, 0.9991455078125, 1.0348968505859375, 1.070648193359375, 1.1063995361328125, 1.14215087890625, 1.1779022216796875, 1.213653564453125, 1.2494049072265625, 1.28515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 0.0, 3.0, 5.0, 7.0, 11.0, 33.0, 42.0, 92.0, 118.0, 169.0, 159.0, 150.0, 74.0, 58.0, 24.0, 17.0, 8.0, 11.0, 1.0, 6.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0006890296936035156, -0.000671830028295517, -0.0006546303629875183, -0.0006374306976795197, -0.000620231032371521, -0.0006030313670635223, -0.0005858317017555237, -0.000568632036447525, -0.0005514323711395264, -0.0005342327058315277, -0.000517033040523529, -0.0004998333752155304, -0.00048263370990753174, -0.0004654340445995331, -0.0004482343792915344, -0.00043103471398353577, -0.0004138350486755371, -0.00039663538336753845, -0.0003794357180595398, -0.00036223605275154114, -0.0003450363874435425, -0.0003278367221355438, -0.00031063705682754517, -0.0002934373915195465, -0.00027623772621154785, -0.0002590380609035492, -0.00024183839559555054, -0.00022463873028755188, -0.00020743906497955322, -0.00019023939967155457, -0.0001730397343635559, -0.00015584006905555725, -0.0001386404037475586, -0.00012144073843955994, -0.00010424107313156128, -8.704140782356262e-05, -6.984174251556396e-05, -5.264207720756531e-05, -3.544241189956665e-05, -1.8242746591567993e-05, -1.043081283569336e-06, 1.615658402442932e-05, 3.335624933242798e-05, 5.0555914640426636e-05, 6.775557994842529e-05, 8.495524525642395e-05, 0.00010215491056442261, 0.00011935457587242126, 0.00013655424118041992, 0.00015375390648841858, 0.00017095357179641724, 0.0001881532371044159, 0.00020535290241241455, 0.0002225525677204132, 0.00023975223302841187, 0.0002569518983364105, 0.0002741515636444092, 0.00029135122895240784, 0.0003085508942604065, 0.00032575055956840515, 0.0003429502248764038, 0.00036014989018440247, 0.0003773495554924011, 0.0003945492208003998, 0.00041174888610839844]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 10.0, 12.0, 15.0, 12.0, 42.0, 44.0, 74.0, 99.0, 129.0, 214.0, 333.0, 490.0, 799.0, 1097.0, 1874.0, 2935.0, 5062.0, 9154.0, 21253.0, 70114.0, 279811.0, 447559.0, 140734.0, 36866.0, 13415.0, 6437.0, 3596.0, 2187.0, 1351.0, 939.0, 627.0, 394.0, 273.0, 187.0, 119.0, 96.0, 47.0, 48.0, 35.0, 19.0, 19.0, 8.0, 10.0, 5.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.7333984375, -0.7125930786132812, -0.6917877197265625, -0.6709823608398438, -0.650177001953125, -0.6293716430664062, -0.6085662841796875, -0.5877609252929688, -0.56695556640625, -0.5461502075195312, -0.5253448486328125, -0.5045394897460938, -0.483734130859375, -0.46292877197265625, -0.4421234130859375, -0.42131805419921875, -0.4005126953125, -0.37970733642578125, -0.3589019775390625, -0.33809661865234375, -0.317291259765625, -0.29648590087890625, -0.2756805419921875, -0.25487518310546875, -0.23406982421875, -0.21326446533203125, -0.1924591064453125, -0.17165374755859375, -0.150848388671875, -0.13004302978515625, -0.1092376708984375, -0.08843231201171875, -0.067626953125, -0.04682159423828125, -0.0260162353515625, -0.00521087646484375, 0.015594482421875, 0.03639984130859375, 0.0572052001953125, 0.07801055908203125, 0.09881591796875, 0.11962127685546875, 0.1404266357421875, 0.16123199462890625, 0.182037353515625, 0.20284271240234375, 0.2236480712890625, 0.24445343017578125, 0.2652587890625, 0.28606414794921875, 0.3068695068359375, 0.32767486572265625, 0.348480224609375, 0.36928558349609375, 0.3900909423828125, 0.41089630126953125, 0.43170166015625, 0.45250701904296875, 0.4733123779296875, 0.49411773681640625, 0.514923095703125, 0.5357284545898438, 0.5565338134765625, 0.5773391723632812, 0.59814453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 13.0, 12.0, 21.0, 28.0, 55.0, 80.0, 113.0, 127.0, 147.0, 111.0, 91.0, 66.0, 39.0, 31.0, 17.0, 8.0, 10.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.297119140625, -0.2878990173339844, -0.27867889404296875, -0.2694587707519531, -0.2602386474609375, -0.2510185241699219, -0.24179840087890625, -0.23257827758789062, -0.223358154296875, -0.21413803100585938, -0.20491790771484375, -0.19569778442382812, -0.1864776611328125, -0.17725753784179688, -0.16803741455078125, -0.15881729125976562, -0.14959716796875, -0.14037704467773438, -0.13115692138671875, -0.12193679809570312, -0.1127166748046875, -0.10349655151367188, -0.09427642822265625, -0.08505630493164062, -0.075836181640625, -0.06661605834960938, -0.05739593505859375, -0.048175811767578125, -0.0389556884765625, -0.029735565185546875, -0.02051544189453125, -0.011295318603515625, -0.0020751953125, 0.007144927978515625, 0.01636505126953125, 0.025585174560546875, 0.0348052978515625, 0.044025421142578125, 0.05324554443359375, 0.062465667724609375, 0.071685791015625, 0.08090591430664062, 0.09012603759765625, 0.09934616088867188, 0.1085662841796875, 0.11778640747070312, 0.12700653076171875, 0.13622665405273438, 0.14544677734375, 0.15466690063476562, 0.16388702392578125, 0.17310714721679688, 0.1823272705078125, 0.19154739379882812, 0.20076751708984375, 0.20998764038085938, 0.219207763671875, 0.22842788696289062, 0.23764801025390625, 0.24686813354492188, 0.2560882568359375, 0.2653083801269531, 0.27452850341796875, 0.2837486267089844, 0.29296875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 4.0, 5.0, 12.0, 12.0, 3.0, 15.0, 21.0, 23.0, 26.0, 27.0, 39.0, 46.0, 43.0, 39.0, 44.0, 44.0, 47.0, 51.0, 42.0, 51.0, 55.0, 44.0, 33.0, 34.0, 34.0, 35.0, 20.0, 27.0, 16.0, 20.0, 13.0, 11.0, 15.0, 10.0, 6.0, 5.0, 2.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.048722982406616, -2.9492123126983643, -2.8497016429901123, -2.7501909732818604, -2.6506800651550293, -2.5511693954467773, -2.4516587257385254, -2.3521480560302734, -2.2526373863220215, -2.1531267166137695, -2.0536160469055176, -1.954105257987976, -1.8545945882797241, -1.7550839185714722, -1.6555731296539307, -1.5560624599456787, -1.4565517902374268, -1.3570411205291748, -1.2575304508209229, -1.1580196619033813, -1.0585089921951294, -0.9589983224868774, -0.8594875931739807, -0.759976863861084, -0.660466194152832, -0.5609555244445801, -0.46144479513168335, -0.361934095621109, -0.26242339611053467, -0.16291269659996033, -0.06340199708938599, 0.03610873222351074, 0.1356196403503418, 0.23513033986091614, 0.3346410393714905, 0.4341517388820648, 0.5336624383926392, 0.6331731081008911, 0.7326838374137878, 0.8321945667266846, 0.9317052364349365, 1.0312159061431885, 1.1307265758514404, 1.230237364768982, 1.3297480344772339, 1.4292587041854858, 1.5287694931030273, 1.6282801628112793, 1.7277908325195312, 1.8273015022277832, 1.9268121719360352, 2.026322841644287, 2.125833511352539, 2.22534441947937, 2.324855089187622, 2.424365758895874, 2.523876428604126, 2.623387098312378, 2.72289776802063, 2.822408437728882, 2.921919345855713, 3.021430015563965, 3.120940685272217, 3.2204513549804688, 3.3199620246887207]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 7.0, 10.0, 8.0, 6.0, 12.0, 26.0, 25.0, 18.0, 22.0, 27.0, 21.0, 37.0, 39.0, 31.0, 38.0, 36.0, 40.0, 47.0, 34.0, 45.0, 46.0, 49.0, 37.0, 38.0, 33.0, 38.0, 25.0, 26.0, 23.0, 24.0, 28.0, 21.0, 17.0, 15.0, 11.0, 6.0, 5.0, 8.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0627079010009766, -2.9714515209198, -2.880195140838623, -2.7889387607574463, -2.6976823806762695, -2.606426239013672, -2.515169858932495, -2.4239134788513184, -2.3326570987701416, -2.241400718688965, -2.150144338607788, -2.0588879585266113, -1.9676316976547241, -1.8763753175735474, -1.7851190567016602, -1.6938626766204834, -1.6026062965393066, -1.5113499164581299, -1.4200935363769531, -1.328837275505066, -1.2375808954238892, -1.1463245153427124, -1.0550682544708252, -0.9638118743896484, -0.8725554943084717, -0.7812991142272949, -0.6900427937507629, -0.598786473274231, -0.5075300931930542, -0.41627374291419983, -0.32501739263534546, -0.23376107215881348, -0.14250493049621582, -0.05124858021736145, 0.04000777006149292, 0.1312641203403473, 0.22252047061920166, 0.31377682089805603, 0.4050331711769104, 0.4962894916534424, 0.5875458717346191, 0.6788022518157959, 0.7700585722923279, 0.8613148927688599, 0.9525712728500366, 1.0438276529312134, 1.1350839138031006, 1.2263402938842773, 1.317596673965454, 1.4088530540466309, 1.5001094341278076, 1.5913656949996948, 1.6826220750808716, 1.7738784551620483, 1.8651347160339355, 1.9563910961151123, 2.047647476196289, 2.138903856277466, 2.2301602363586426, 2.3214166164398193, 2.412672996520996, 2.5039291381835938, 2.5951855182647705, 2.6864418983459473, 2.777698278427124]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 7.0, 4.0, 12.0, 9.0, 19.0, 16.0, 27.0, 38.0, 50.0, 79.0, 115.0, 192.0, 342.0, 614.0, 1000.0, 1969.0, 3720.0, 7264.0, 14708.0, 32174.0, 75117.0, 189601.0, 369991.0, 205276.0, 80068.0, 34199.0, 15817.0, 7664.0, 3870.0, 1919.0, 1093.0, 581.0, 392.0, 205.0, 134.0, 65.0, 54.0, 43.0, 22.0, 23.0, 13.0, 18.0, 8.0, 9.0, 5.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-4.83203125, -4.68353271484375, -4.5350341796875, -4.38653564453125, -4.238037109375, -4.08953857421875, -3.9410400390625, -3.79254150390625, -3.64404296875, -3.49554443359375, -3.3470458984375, -3.19854736328125, -3.050048828125, -2.90155029296875, -2.7530517578125, -2.60455322265625, -2.4560546875, -2.30755615234375, -2.1590576171875, -2.01055908203125, -1.862060546875, -1.71356201171875, -1.5650634765625, -1.41656494140625, -1.26806640625, -1.11956787109375, -0.9710693359375, -0.82257080078125, -0.674072265625, -0.52557373046875, -0.3770751953125, -0.22857666015625, -0.080078125, 0.06842041015625, 0.2169189453125, 0.36541748046875, 0.513916015625, 0.66241455078125, 0.8109130859375, 0.95941162109375, 1.10791015625, 1.25640869140625, 1.4049072265625, 1.55340576171875, 1.701904296875, 1.85040283203125, 1.9989013671875, 2.14739990234375, 2.2958984375, 2.44439697265625, 2.5928955078125, 2.74139404296875, 2.889892578125, 3.03839111328125, 3.1868896484375, 3.33538818359375, 3.48388671875, 3.63238525390625, 3.7808837890625, 3.92938232421875, 4.077880859375, 4.22637939453125, 4.3748779296875, 4.52337646484375, 4.671875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 6.0, 11.0, 7.0, 6.0, 19.0, 14.0, 19.0, 18.0, 29.0, 24.0, 20.0, 28.0, 28.0, 40.0, 33.0, 37.0, 36.0, 42.0, 40.0, 49.0, 48.0, 40.0, 36.0, 42.0, 36.0, 29.0, 20.0, 37.0, 29.0, 29.0, 21.0, 24.0, 13.0, 20.0, 14.0, 11.0, 10.0, 9.0, 9.0, 1.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.93359375, -4.77789306640625, -4.6221923828125, -4.46649169921875, -4.310791015625, -4.15509033203125, -3.9993896484375, -3.84368896484375, -3.68798828125, -3.53228759765625, -3.3765869140625, -3.22088623046875, -3.065185546875, -2.90948486328125, -2.7537841796875, -2.59808349609375, -2.4423828125, -2.28668212890625, -2.1309814453125, -1.97528076171875, -1.819580078125, -1.66387939453125, -1.5081787109375, -1.35247802734375, -1.19677734375, -1.04107666015625, -0.8853759765625, -0.72967529296875, -0.573974609375, -0.41827392578125, -0.2625732421875, -0.10687255859375, 0.048828125, 0.20452880859375, 0.3602294921875, 0.51593017578125, 0.671630859375, 0.82733154296875, 0.9830322265625, 1.13873291015625, 1.29443359375, 1.45013427734375, 1.6058349609375, 1.76153564453125, 1.917236328125, 2.07293701171875, 2.2286376953125, 2.38433837890625, 2.5400390625, 2.69573974609375, 2.8514404296875, 3.00714111328125, 3.162841796875, 3.31854248046875, 3.4742431640625, 3.62994384765625, 3.78564453125, 3.94134521484375, 4.0970458984375, 4.25274658203125, 4.408447265625, 4.56414794921875, 4.7198486328125, 4.87554931640625, 5.03125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 2.0, 5.0, 9.0, 2.0, 14.0, 23.0, 28.0, 39.0, 37.0, 42.0, 57.0, 108.0, 132.0, 195.0, 318.0, 502.0, 912.0, 1722.0, 3270.0, 6538.0, 13852.0, 30645.0, 74466.0, 189426.0, 364446.0, 213667.0, 83304.0, 34274.0, 15188.0, 7322.0, 3522.0, 1874.0, 992.0, 562.0, 317.0, 192.0, 143.0, 79.0, 78.0, 58.0, 38.0, 30.0, 32.0, 23.0, 21.0, 20.0, 6.0, 9.0, 3.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0], "bins": [-4.85546875, -4.7108154296875, -4.566162109375, -4.4215087890625, -4.27685546875, -4.1322021484375, -3.987548828125, -3.8428955078125, -3.6982421875, -3.5535888671875, -3.408935546875, -3.2642822265625, -3.11962890625, -2.9749755859375, -2.830322265625, -2.6856689453125, -2.541015625, -2.3963623046875, -2.251708984375, -2.1070556640625, -1.96240234375, -1.8177490234375, -1.673095703125, -1.5284423828125, -1.3837890625, -1.2391357421875, -1.094482421875, -0.9498291015625, -0.80517578125, -0.6605224609375, -0.515869140625, -0.3712158203125, -0.2265625, -0.0819091796875, 0.062744140625, 0.2073974609375, 0.35205078125, 0.4967041015625, 0.641357421875, 0.7860107421875, 0.9306640625, 1.0753173828125, 1.219970703125, 1.3646240234375, 1.50927734375, 1.6539306640625, 1.798583984375, 1.9432373046875, 2.087890625, 2.2325439453125, 2.377197265625, 2.5218505859375, 2.66650390625, 2.8111572265625, 2.955810546875, 3.1004638671875, 3.2451171875, 3.3897705078125, 3.534423828125, 3.6790771484375, 3.82373046875, 3.9683837890625, 4.113037109375, 4.2576904296875, 4.40234375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 2.0, 4.0, 7.0, 4.0, 12.0, 19.0, 8.0, 14.0, 21.0, 17.0, 29.0, 25.0, 34.0, 35.0, 30.0, 43.0, 45.0, 40.0, 48.0, 52.0, 43.0, 42.0, 37.0, 41.0, 42.0, 28.0, 25.0, 25.0, 27.0, 23.0, 33.0, 26.0, 13.0, 13.0, 16.0, 12.0, 9.0, 13.0, 10.0, 6.0, 3.0, 7.0, 2.0, 2.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4921875, -5.31634521484375, -5.1405029296875, -4.96466064453125, -4.788818359375, -4.61297607421875, -4.4371337890625, -4.26129150390625, -4.08544921875, -3.90960693359375, -3.7337646484375, -3.55792236328125, -3.382080078125, -3.20623779296875, -3.0303955078125, -2.85455322265625, -2.6787109375, -2.50286865234375, -2.3270263671875, -2.15118408203125, -1.975341796875, -1.79949951171875, -1.6236572265625, -1.44781494140625, -1.27197265625, -1.09613037109375, -0.9202880859375, -0.74444580078125, -0.568603515625, -0.39276123046875, -0.2169189453125, -0.04107666015625, 0.134765625, 0.31060791015625, 0.4864501953125, 0.66229248046875, 0.838134765625, 1.01397705078125, 1.1898193359375, 1.36566162109375, 1.54150390625, 1.71734619140625, 1.8931884765625, 2.06903076171875, 2.244873046875, 2.42071533203125, 2.5965576171875, 2.77239990234375, 2.9482421875, 3.12408447265625, 3.2999267578125, 3.47576904296875, 3.651611328125, 3.82745361328125, 4.0032958984375, 4.17913818359375, 4.35498046875, 4.53082275390625, 4.7066650390625, 4.88250732421875, 5.058349609375, 5.23419189453125, 5.4100341796875, 5.58587646484375, 5.76171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 9.0, 7.0, 8.0, 23.0, 19.0, 55.0, 71.0, 81.0, 127.0, 221.0, 377.0, 582.0, 901.0, 1582.0, 2594.0, 4948.0, 9537.0, 19655.0, 40587.0, 83670.0, 170865.0, 299157.0, 208100.0, 105029.0, 50100.0, 24515.0, 11826.0, 6080.0, 3197.0, 1798.0, 1056.0, 661.0, 390.0, 272.0, 150.0, 99.0, 53.0, 52.0, 27.0, 27.0, 13.0, 15.0, 11.0, 8.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.0234375, -0.995513916015625, -0.96759033203125, -0.939666748046875, -0.9117431640625, -0.883819580078125, -0.85589599609375, -0.827972412109375, -0.800048828125, -0.772125244140625, -0.74420166015625, -0.716278076171875, -0.6883544921875, -0.660430908203125, -0.63250732421875, -0.604583740234375, -0.57666015625, -0.548736572265625, -0.52081298828125, -0.492889404296875, -0.4649658203125, -0.437042236328125, -0.40911865234375, -0.381195068359375, -0.353271484375, -0.325347900390625, -0.29742431640625, -0.269500732421875, -0.2415771484375, -0.213653564453125, -0.18572998046875, -0.157806396484375, -0.1298828125, -0.101959228515625, -0.07403564453125, -0.046112060546875, -0.0181884765625, 0.009735107421875, 0.03765869140625, 0.065582275390625, 0.093505859375, 0.121429443359375, 0.14935302734375, 0.177276611328125, 0.2052001953125, 0.233123779296875, 0.26104736328125, 0.288970947265625, 0.31689453125, 0.344818115234375, 0.37274169921875, 0.400665283203125, 0.4285888671875, 0.456512451171875, 0.48443603515625, 0.512359619140625, 0.540283203125, 0.568206787109375, 0.59613037109375, 0.624053955078125, 0.6519775390625, 0.679901123046875, 0.70782470703125, 0.735748291015625, 0.763671875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 12.0, 10.0, 16.0, 18.0, 25.0, 27.0, 25.0, 50.0, 56.0, 65.0, 84.0, 85.0, 104.0, 85.0, 55.0, 68.0, 44.0, 30.0, 26.0, 25.0, 12.0, 11.0, 14.0, 13.0, 9.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.000308990478515625, -0.0003004148602485657, -0.00029183924198150635, -0.000283263623714447, -0.0002746880054473877, -0.00026611238718032837, -0.00025753676891326904, -0.0002489611506462097, -0.0002403855323791504, -0.00023180991411209106, -0.00022323429584503174, -0.0002146586775779724, -0.00020608305931091309, -0.00019750744104385376, -0.00018893182277679443, -0.0001803562045097351, -0.00017178058624267578, -0.00016320496797561646, -0.00015462934970855713, -0.0001460537314414978, -0.00013747811317443848, -0.00012890249490737915, -0.00012032687664031982, -0.0001117512583732605, -0.00010317564010620117, -9.460002183914185e-05, -8.602440357208252e-05, -7.74487853050232e-05, -6.887316703796387e-05, -6.029754877090454e-05, -5.1721930503845215e-05, -4.314631223678589e-05, -3.457069396972656e-05, -2.5995075702667236e-05, -1.741945743560791e-05, -8.843839168548584e-06, -2.682209014892578e-07, 8.307397365570068e-06, 1.6883015632629395e-05, 2.545863389968872e-05, 3.403425216674805e-05, 4.260987043380737e-05, 5.11854887008667e-05, 5.9761106967926025e-05, 6.833672523498535e-05, 7.691234350204468e-05, 8.5487961769104e-05, 9.406358003616333e-05, 0.00010263919830322266, 0.00011121481657028198, 0.00011979043483734131, 0.00012836605310440063, 0.00013694167137145996, 0.0001455172896385193, 0.0001540929079055786, 0.00016266852617263794, 0.00017124414443969727, 0.0001798197627067566, 0.00018839538097381592, 0.00019697099924087524, 0.00020554661750793457, 0.0002141222357749939, 0.00022269785404205322, 0.00023127347230911255, 0.00023984909057617188]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 14.0, 17.0, 19.0, 26.0, 35.0, 67.0, 94.0, 130.0, 211.0, 261.0, 371.0, 617.0, 896.0, 1334.0, 2191.0, 3743.0, 6558.0, 12356.0, 25114.0, 57456.0, 135502.0, 310804.0, 273081.0, 118207.0, 50540.0, 22466.0, 11032.0, 6008.0, 3467.0, 2039.0, 1276.0, 814.0, 564.0, 364.0, 290.0, 172.0, 133.0, 87.0, 66.0, 35.0, 32.0, 20.0, 18.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1845703125, -1.1474609375, -1.1103515625, -1.0732421875, -1.0361328125, -0.9990234375, -0.9619140625, -0.9248046875, -0.8876953125, -0.8505859375, -0.8134765625, -0.7763671875, -0.7392578125, -0.7021484375, -0.6650390625, -0.6279296875, -0.5908203125, -0.5537109375, -0.5166015625, -0.4794921875, -0.4423828125, -0.4052734375, -0.3681640625, -0.3310546875, -0.2939453125, -0.2568359375, -0.2197265625, -0.1826171875, -0.1455078125, -0.1083984375, -0.0712890625, -0.0341796875, 0.0029296875, 0.0400390625, 0.0771484375, 0.1142578125, 0.1513671875, 0.1884765625, 0.2255859375, 0.2626953125, 0.2998046875, 0.3369140625, 0.3740234375, 0.4111328125, 0.4482421875, 0.4853515625, 0.5224609375, 0.5595703125, 0.5966796875, 0.6337890625, 0.6708984375, 0.7080078125, 0.7451171875, 0.7822265625, 0.8193359375, 0.8564453125, 0.8935546875, 0.9306640625, 0.9677734375, 1.0048828125, 1.0419921875, 1.0791015625, 1.1162109375, 1.1533203125, 1.1904296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 7.0, 7.0, 11.0, 9.0, 17.0, 31.0, 38.0, 55.0, 57.0, 85.0, 94.0, 112.0, 108.0, 80.0, 84.0, 56.0, 34.0, 31.0, 22.0, 19.0, 12.0, 10.0, 6.0, 3.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.19140625, -1.1590805053710938, -1.1267547607421875, -1.0944290161132812, -1.062103271484375, -1.0297775268554688, -0.9974517822265625, -0.9651260375976562, -0.93280029296875, -0.9004745483398438, -0.8681488037109375, -0.8358230590820312, -0.803497314453125, -0.7711715698242188, -0.7388458251953125, -0.7065200805664062, -0.6741943359375, -0.6418685913085938, -0.6095428466796875, -0.5772171020507812, -0.544891357421875, -0.5125656127929688, -0.4802398681640625, -0.44791412353515625, -0.41558837890625, -0.38326263427734375, -0.3509368896484375, -0.31861114501953125, -0.286285400390625, -0.25395965576171875, -0.2216339111328125, -0.18930816650390625, -0.156982421875, -0.12465667724609375, -0.0923309326171875, -0.06000518798828125, -0.027679443359375, 0.00464630126953125, 0.0369720458984375, 0.06929779052734375, 0.10162353515625, 0.13394927978515625, 0.1662750244140625, 0.19860076904296875, 0.230926513671875, 0.26325225830078125, 0.2955780029296875, 0.32790374755859375, 0.3602294921875, 0.39255523681640625, 0.4248809814453125, 0.45720672607421875, 0.489532470703125, 0.5218582153320312, 0.5541839599609375, 0.5865097045898438, 0.61883544921875, 0.6511611938476562, 0.6834869384765625, 0.7158126831054688, 0.748138427734375, 0.7804641723632812, 0.8127899169921875, 0.8451156616210938, 0.87744140625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 16.0, 19.0, 31.0, 45.0, 62.0, 115.0, 111.0, 129.0, 132.0, 90.0, 89.0, 65.0, 38.0, 22.0, 16.0, 6.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.564505577087402, -8.078540802001953, -7.5925750732421875, -7.10660982131958, -6.620644569396973, -6.134679317474365, -5.648714065551758, -5.16274881362915, -4.676783561706543, -4.1908183097839355, -3.704853057861328, -3.2188878059387207, -2.7329225540161133, -2.246957302093506, -1.7609920501708984, -1.275026798248291, -0.7890615463256836, -0.30309629440307617, 0.18286895751953125, 0.6688342094421387, 1.154799461364746, 1.6407647132873535, 2.126729965209961, 2.6126952171325684, 3.098660469055176, 3.584625720977783, 4.070590972900391, 4.556556224822998, 5.0425214767456055, 5.528486728668213, 6.01445198059082, 6.500417232513428, 6.986383438110352, 7.472348690032959, 7.958313941955566, 8.444278717041016, 8.930244445800781, 9.416210174560547, 9.902174949645996, 10.388139724731445, 10.874105453491211, 11.360071182250977, 11.846035957336426, 12.332000732421875, 12.81796646118164, 13.303932189941406, 13.789896965026855, 14.275861740112305, 14.76182746887207, 15.247793197631836, 15.733757972717285, 16.219722747802734, 16.7056884765625, 17.191654205322266, 17.67761993408203, 18.163583755493164, 18.64954948425293, 19.135515213012695, 19.621479034423828, 20.107444763183594, 20.59341049194336, 21.079376220703125, 21.56534194946289, 22.051305770874023, 22.53727149963379]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 9.0, 9.0, 13.0, 17.0, 13.0, 16.0, 21.0, 22.0, 25.0, 20.0, 28.0, 27.0, 33.0, 41.0, 25.0, 30.0, 40.0, 40.0, 52.0, 56.0, 37.0, 38.0, 32.0, 47.0, 30.0, 37.0, 31.0, 15.0, 21.0, 24.0, 23.0, 20.0, 17.0, 11.0, 16.0, 10.0, 13.0, 8.0, 8.0, 4.0, 7.0, 5.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.538307189941406, -9.251288414001465, -8.96427059173584, -8.677251815795898, -8.390233993530273, -8.103215217590332, -7.816196918487549, -7.529178619384766, -7.242160320281982, -6.955142021179199, -6.668123722076416, -6.381105422973633, -6.094086647033691, -5.807068824768066, -5.520050048828125, -5.233031749725342, -4.946013450622559, -4.658995151519775, -4.371976852416992, -4.084958553314209, -3.7979400157928467, -3.5109217166900635, -3.223903179168701, -2.936884880065918, -2.6498665809631348, -2.3628482818603516, -2.0758299827575684, -1.788811445236206, -1.5017931461334229, -1.2147748470306396, -0.9277564287185669, -0.6407380104064941, -0.35372066497802734, -0.06670230627059937, 0.2203160524368286, 0.5073344111442566, 0.7943527698516846, 1.0813710689544678, 1.3683894872665405, 1.6554079055786133, 1.9424262046813965, 2.2294445037841797, 2.516462802886963, 2.803481340408325, 3.0904996395111084, 3.3775179386138916, 3.664536476135254, 3.951554775238037, 4.23857307434082, 4.5255913734436035, 4.812609672546387, 5.09962797164917, 5.386646270751953, 5.6736650466918945, 5.960683345794678, 6.247701644897461, 6.534719944000244, 6.821738243103027, 7.1087565422058105, 7.395774841308594, 7.682793617248535, 7.96981143951416, 8.256830215454102, 8.543848037719727, 8.830866813659668]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 8.0, 11.0, 5.0, 9.0, 14.0, 20.0, 26.0, 37.0, 61.0, 62.0, 89.0, 137.0, 131.0, 189.0, 260.0, 366.0, 486.0, 685.0, 863.0, 1247.0, 1745.0, 1036708.0, 2033.0, 1467.0, 1016.0, 735.0, 520.0, 443.0, 313.0, 220.0, 156.0, 133.0, 84.0, 80.0, 49.0, 50.0, 38.0, 28.0, 16.0, 16.0, 11.0, 7.0, 10.0, 3.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.248028755187988, -12.816913604736328, -12.385797500610352, -11.954682350158691, -11.523567199707031, -11.092451095581055, -10.661335945129395, -10.230220794677734, -9.799105644226074, -9.367990493774414, -8.936874389648438, -8.505759239196777, -8.074644088745117, -7.643528461456299, -7.2124128341674805, -6.78129768371582, -6.350182056427002, -5.919066429138184, -5.487951278686523, -5.056835651397705, -4.625720500946045, -4.194604873657227, -3.7634894847869873, -3.332374095916748, -2.901258707046509, -2.4701433181762695, -2.0390279293060303, -1.6079124212265015, -1.1767970323562622, -0.7456815242767334, -0.31456613540649414, 0.11654925346374512, 0.5476646423339844, 0.9787800312042236, 1.409895420074463, 1.8410109281539917, 2.2721261978149414, 2.7032418251037598, 3.134357213973999, 3.5654726028442383, 3.9965879917144775, 4.427703380584717, 4.858819007873535, 5.289934158325195, 5.721049785614014, 6.152165412902832, 6.583280563354492, 7.014395713806152, 7.445511341094971, 7.876626968383789, 8.30774211883545, 8.73885726928711, 9.169973373413086, 9.601088523864746, 10.032203674316406, 10.463319778442383, 10.894434928894043, 11.325550079345703, 11.75666618347168, 12.18778133392334, 12.618896484375, 13.050012588500977, 13.481127738952637, 13.912242889404297, 14.343358039855957]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 16.0, 35.0, 57.0, 148.0, 525.0, 1923.0, 6834.0, 38246.0, 51407236.0, 11557.0, 3333.0, 963.0, 270.0, 89.0, 38.0, 15.0, 12.0, 13.0, 7.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-93.48684692382812, -91.15953826904297, -88.83222961425781, -86.50492095947266, -84.1776123046875, -81.85030364990234, -79.52299499511719, -77.19568634033203, -74.86837768554688, -72.54106903076172, -70.21376037597656, -67.8864517211914, -65.55914306640625, -63.231834411621094, -60.90452575683594, -58.57721710205078, -56.249908447265625, -53.92259979248047, -51.59529113769531, -49.267982482910156, -46.940673828125, -44.613365173339844, -42.28605651855469, -39.95874786376953, -37.631439208984375, -35.30413055419922, -32.97682189941406, -30.649513244628906, -28.32220458984375, -25.994895935058594, -23.667587280273438, -21.34027862548828, -19.01297378540039, -16.685665130615234, -14.358356475830078, -12.031047821044922, -9.703739166259766, -7.376430511474609, -5.049121856689453, -2.721813201904297, -0.3945045471191406, 1.9328041076660156, 4.260112762451172, 6.587421417236328, 8.914730072021484, 11.24203872680664, 13.569347381591797, 15.896656036376953, 18.22396469116211, 20.551273345947266, 22.878582000732422, 25.205890655517578, 27.533199310302734, 29.86050796508789, 32.18781661987305, 34.5151252746582, 36.84243392944336, 39.169742584228516, 41.49705123901367, 43.82435989379883, 46.151668548583984, 48.47897720336914, 50.8062858581543, 53.13359451293945, 55.46090316772461]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 6.0, 12.0, 11.0, 24.0, 49.0, 74.0, 102.0, 159.0, 258.0, 441.0, 672.0, 1154.0, 1964.0, 3234.0, 5262.0, 9172.0, 15631.0, 27541.0, 49529.0, 88868.0, 154457.0, 251955.0, 388539.0, 1047927.0, 2866719.0, 554290.0, 327462.0, 208564.0, 123830.0, 70157.0, 39335.0, 22662.0, 12818.0, 7344.0, 4528.0, 2659.0, 1568.0, 936.0, 578.0, 348.0, 207.0, 144.0, 64.0, 57.0, 44.0, 29.0, 17.0, 12.0, 10.0, 9.0, 4.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.41015625, -4.2542724609375, -4.098388671875, -3.9425048828125, -3.78662109375, -3.6307373046875, -3.474853515625, -3.3189697265625, -3.1630859375, -3.0072021484375, -2.851318359375, -2.6954345703125, -2.53955078125, -2.3836669921875, -2.227783203125, -2.0718994140625, -1.916015625, -1.7601318359375, -1.604248046875, -1.4483642578125, -1.29248046875, -1.1365966796875, -0.980712890625, -0.8248291015625, -0.6689453125, -0.5130615234375, -0.357177734375, -0.2012939453125, -0.04541015625, 0.1104736328125, 0.266357421875, 0.4222412109375, 0.578125, 0.7340087890625, 0.889892578125, 1.0457763671875, 1.20166015625, 1.3575439453125, 1.513427734375, 1.6693115234375, 1.8251953125, 1.9810791015625, 2.136962890625, 2.2928466796875, 2.44873046875, 2.6046142578125, 2.760498046875, 2.9163818359375, 3.072265625, 3.2281494140625, 3.384033203125, 3.5399169921875, 3.69580078125, 3.8516845703125, 4.007568359375, 4.1634521484375, 4.3193359375, 4.4752197265625, 4.631103515625, 4.7869873046875, 4.94287109375, 5.0987548828125, 5.254638671875, 5.4105224609375, 5.56640625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 7.0, 5.0, 5.0, 18.0, 15.0, 16.0, 14.0, 28.0, 26.0, 30.0, 33.0, 25.0, 36.0, 52.0, 49.0, 55.0, 86.0, 674.0, 403.0, 57.0, 52.0, 41.0, 37.0, 53.0, 28.0, 32.0, 31.0, 30.0, 17.0, 21.0, 8.0, 14.0, 9.0, 5.0, 8.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-46.40625, -44.99462890625, -43.5830078125, -42.17138671875, -40.759765625, -39.34814453125, -37.9365234375, -36.52490234375, -35.11328125, -33.70166015625, -32.2900390625, -30.87841796875, -29.466796875, -28.05517578125, -26.6435546875, -25.23193359375, -23.8203125, -22.40869140625, -20.9970703125, -19.58544921875, -18.173828125, -16.76220703125, -15.3505859375, -13.93896484375, -12.52734375, -11.11572265625, -9.7041015625, -8.29248046875, -6.880859375, -5.46923828125, -4.0576171875, -2.64599609375, -1.234375, 0.17724609375, 1.5888671875, 3.00048828125, 4.412109375, 5.82373046875, 7.2353515625, 8.64697265625, 10.05859375, 11.47021484375, 12.8818359375, 14.29345703125, 15.705078125, 17.11669921875, 18.5283203125, 19.93994140625, 21.3515625, 22.76318359375, 24.1748046875, 25.58642578125, 26.998046875, 28.40966796875, 29.8212890625, 31.23291015625, 32.64453125, 34.05615234375, 35.4677734375, 36.87939453125, 38.291015625, 39.70263671875, 41.1142578125, 42.52587890625, 43.9375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 8.0, 16.0, 30.0, 38.0, 77.0, 135.0, 215.0, 370.0, 667.0, 1180.0, 1853.0, 3122.0, 5230.0, 8705.0, 14055.0, 22708.0, 35078.0, 53523.0, 79651.0, 113122.0, 152972.0, 198529.0, 245391.0, 323296.0, 1361015.0, 2200672.0, 435124.0, 261388.0, 215382.0, 168580.0, 126789.0, 90131.0, 62233.0, 40753.0, 26481.0, 16809.0, 10445.0, 6354.0, 3863.0, 2286.0, 1304.0, 760.0, 443.0, 277.0, 159.0, 87.0, 51.0, 33.0, 19.0, 18.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.357421875, -2.28179931640625, -2.2061767578125, -2.13055419921875, -2.054931640625, -1.97930908203125, -1.9036865234375, -1.82806396484375, -1.75244140625, -1.67681884765625, -1.6011962890625, -1.52557373046875, -1.449951171875, -1.37432861328125, -1.2987060546875, -1.22308349609375, -1.1474609375, -1.07183837890625, -0.9962158203125, -0.92059326171875, -0.844970703125, -0.76934814453125, -0.6937255859375, -0.61810302734375, -0.54248046875, -0.46685791015625, -0.3912353515625, -0.31561279296875, -0.239990234375, -0.16436767578125, -0.0887451171875, -0.01312255859375, 0.0625, 0.13812255859375, 0.2137451171875, 0.28936767578125, 0.364990234375, 0.44061279296875, 0.5162353515625, 0.59185791015625, 0.66748046875, 0.74310302734375, 0.8187255859375, 0.89434814453125, 0.969970703125, 1.04559326171875, 1.1212158203125, 1.19683837890625, 1.2724609375, 1.34808349609375, 1.4237060546875, 1.49932861328125, 1.574951171875, 1.65057373046875, 1.7261962890625, 1.80181884765625, 1.87744140625, 1.95306396484375, 2.0286865234375, 2.10430908203125, 2.179931640625, 2.25555419921875, 2.3311767578125, 2.40679931640625, 2.482421875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 6.0, 5.0, 18.0, 12.0, 13.0, 25.0, 27.0, 27.0, 30.0, 28.0, 19.0, 35.0, 32.0, 40.0, 36.0, 36.0, 55.0, 298.0, 705.0, 122.0, 34.0, 51.0, 38.0, 35.0, 31.0, 28.0, 34.0, 19.0, 35.0, 26.0, 16.0, 19.0, 13.0, 14.0, 14.0, 8.0, 6.0, 11.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.1875, -23.333251953125, -22.47900390625, -21.624755859375, -20.7705078125, -19.916259765625, -19.06201171875, -18.207763671875, -17.353515625, -16.499267578125, -15.64501953125, -14.790771484375, -13.9365234375, -13.082275390625, -12.22802734375, -11.373779296875, -10.51953125, -9.665283203125, -8.81103515625, -7.956787109375, -7.1025390625, -6.248291015625, -5.39404296875, -4.539794921875, -3.685546875, -2.831298828125, -1.97705078125, -1.122802734375, -0.2685546875, 0.585693359375, 1.43994140625, 2.294189453125, 3.1484375, 4.002685546875, 4.85693359375, 5.711181640625, 6.5654296875, 7.419677734375, 8.27392578125, 9.128173828125, 9.982421875, 10.836669921875, 11.69091796875, 12.545166015625, 13.3994140625, 14.253662109375, 15.10791015625, 15.962158203125, 16.81640625, 17.670654296875, 18.52490234375, 19.379150390625, 20.2333984375, 21.087646484375, 21.94189453125, 22.796142578125, 23.650390625, 24.504638671875, 25.35888671875, 26.213134765625, 27.0673828125, 27.921630859375, 28.77587890625, 29.630126953125, 30.484375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 10.0, 16.0, 19.0, 31.0, 42.0, 68.0, 118.0, 143.0, 193.0, 256.0, 379.0, 550.0, 698.0, 1127.0, 1909.0, 3667.0, 7583.0, 17847.0, 43728.0, 108343.0, 247757.0, 486353.0, 2739731.0, 1785927.0, 451278.0, 226506.0, 96888.0, 38834.0, 15835.0, 6875.0, 3370.0, 1902.0, 1164.0, 748.0, 459.0, 331.0, 223.0, 161.0, 101.0, 65.0, 56.0, 47.0, 38.0, 22.0, 7.0, 4.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.36328125, -5.200439453125, -5.03759765625, -4.874755859375, -4.7119140625, -4.549072265625, -4.38623046875, -4.223388671875, -4.060546875, -3.897705078125, -3.73486328125, -3.572021484375, -3.4091796875, -3.246337890625, -3.08349609375, -2.920654296875, -2.7578125, -2.594970703125, -2.43212890625, -2.269287109375, -2.1064453125, -1.943603515625, -1.78076171875, -1.617919921875, -1.455078125, -1.292236328125, -1.12939453125, -0.966552734375, -0.8037109375, -0.640869140625, -0.47802734375, -0.315185546875, -0.15234375, 0.010498046875, 0.17333984375, 0.336181640625, 0.4990234375, 0.661865234375, 0.82470703125, 0.987548828125, 1.150390625, 1.313232421875, 1.47607421875, 1.638916015625, 1.8017578125, 1.964599609375, 2.12744140625, 2.290283203125, 2.453125, 2.615966796875, 2.77880859375, 2.941650390625, 3.1044921875, 3.267333984375, 3.43017578125, 3.593017578125, 3.755859375, 3.918701171875, 4.08154296875, 4.244384765625, 4.4072265625, 4.570068359375, 4.73291015625, 4.895751953125, 5.05859375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 6.0, 3.0, 10.0, 10.0, 16.0, 12.0, 14.0, 17.0, 23.0, 26.0, 17.0, 28.0, 34.0, 44.0, 43.0, 28.0, 32.0, 32.0, 45.0, 312.0, 734.0, 94.0, 43.0, 33.0, 44.0, 26.0, 27.0, 34.0, 22.0, 33.0, 26.0, 24.0, 27.0, 9.0, 14.0, 17.0, 10.0, 11.0, 7.0, 10.0, 9.0, 2.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.859375, -23.09619140625, -22.3330078125, -21.56982421875, -20.806640625, -20.04345703125, -19.2802734375, -18.51708984375, -17.75390625, -16.99072265625, -16.2275390625, -15.46435546875, -14.701171875, -13.93798828125, -13.1748046875, -12.41162109375, -11.6484375, -10.88525390625, -10.1220703125, -9.35888671875, -8.595703125, -7.83251953125, -7.0693359375, -6.30615234375, -5.54296875, -4.77978515625, -4.0166015625, -3.25341796875, -2.490234375, -1.72705078125, -0.9638671875, -0.20068359375, 0.5625, 1.32568359375, 2.0888671875, 2.85205078125, 3.615234375, 4.37841796875, 5.1416015625, 5.90478515625, 6.66796875, 7.43115234375, 8.1943359375, 8.95751953125, 9.720703125, 10.48388671875, 11.2470703125, 12.01025390625, 12.7734375, 13.53662109375, 14.2998046875, 15.06298828125, 15.826171875, 16.58935546875, 17.3525390625, 18.11572265625, 18.87890625, 19.64208984375, 20.4052734375, 21.16845703125, 21.931640625, 22.69482421875, 23.4580078125, 24.22119140625, 24.984375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 10.0, 21.0, 61.0, 136.0, 252.0, 272.0, 137.0, 54.0, 24.0, 17.0, 6.0, 2.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-165.81585693359375, -162.36253356933594, -158.90919494628906, -155.45587158203125, -152.00253295898438, -148.54920959472656, -145.0958709716797, -141.64254760742188, -138.189208984375, -134.7358856201172, -131.2825469970703, -127.82921600341797, -124.37588500976562, -120.92256164550781, -117.46922302246094, -114.01589965820312, -110.56257629394531, -107.10924530029297, -103.65591430664062, -100.20258331298828, -96.74925231933594, -93.29592895507812, -89.84259033203125, -86.38926696777344, -82.93592834472656, -79.48259735107422, -76.02926635742188, -72.57593536376953, -69.12260437011719, -65.66928100585938, -62.215946197509766, -58.76261901855469, -55.30929183959961, -51.855960845947266, -48.40262985229492, -44.949302673339844, -41.4959716796875, -38.042640686035156, -34.58930969238281, -31.1359806060791, -27.682649612426758, -24.229318618774414, -20.775989532470703, -17.32265853881836, -13.869328498840332, -10.415998458862305, -6.962667465209961, -3.50933837890625, -0.05600738525390625, 3.3973228931427, 6.850653171539307, 10.303983688354492, 13.75731372833252, 17.210643768310547, 20.66397476196289, 24.1173038482666, 27.570634841918945, 31.02396583557129, 34.477294921875, 37.930625915527344, 41.38395690917969, 44.83728790283203, 48.290618896484375, 51.74394607543945, 55.1972770690918]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 9.0, 12.0, 13.0, 15.0, 17.0, 17.0, 24.0, 27.0, 23.0, 37.0, 40.0, 45.0, 43.0, 44.0, 46.0, 62.0, 48.0, 47.0, 44.0, 47.0, 52.0, 47.0, 40.0, 33.0, 35.0, 24.0, 20.0, 11.0, 12.0, 16.0, 13.0, 7.0, 6.0, 9.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-72.0421371459961, -69.897216796875, -67.7522964477539, -65.60737609863281, -63.46245574951172, -61.317535400390625, -59.172611236572266, -57.02769088745117, -54.88277053833008, -52.737850189208984, -50.59292984008789, -48.4480094909668, -46.30308532714844, -44.158164978027344, -42.01324462890625, -39.868324279785156, -37.72340393066406, -35.57848358154297, -33.433563232421875, -31.28864097595215, -29.143720626831055, -26.99880027770996, -24.853878021240234, -22.70895767211914, -20.564037322998047, -18.419116973876953, -16.27419662475586, -14.129274368286133, -11.984354019165039, -9.839433670043945, -7.694512367248535, -5.549591064453125, -3.4046783447265625, -1.2597575187683105, 0.8851633071899414, 3.0300841331481934, 5.175004959106445, 7.319925308227539, 9.46484661102295, 11.60976791381836, 13.754688262939453, 15.899608612060547, 18.04452896118164, 20.189451217651367, 22.33437156677246, 24.479291915893555, 26.62421417236328, 28.769134521484375, 30.91405487060547, 33.05897521972656, 35.203895568847656, 37.34881591796875, 39.493736267089844, 41.63865661621094, 43.7835807800293, 45.92850112915039, 48.073421478271484, 50.21834182739258, 52.36326217651367, 54.508182525634766, 56.653106689453125, 58.79802703857422, 60.94294738769531, 63.087867736816406, 65.2327880859375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 6.0, 5.0, 7.0, 9.0, 17.0, 14.0, 29.0, 22.0, 31.0, 47.0, 96.0, 154.0, 284.0, 639.0, 1375.0, 3827.0, 11416.0, 59508.0, 2433863.0, 1624079.0, 43747.0, 9492.0, 3171.0, 1248.0, 549.0, 246.0, 135.0, 85.0, 37.0, 35.0, 33.0, 17.0, 19.0, 9.0, 9.0, 5.0, 2.0, 6.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5439453125, -1.49237060546875, -1.4407958984375, -1.38922119140625, -1.337646484375, -1.28607177734375, -1.2344970703125, -1.18292236328125, -1.13134765625, -1.07977294921875, -1.0281982421875, -0.97662353515625, -0.925048828125, -0.87347412109375, -0.8218994140625, -0.77032470703125, -0.71875, -0.66717529296875, -0.6156005859375, -0.56402587890625, -0.512451171875, -0.46087646484375, -0.4093017578125, -0.35772705078125, -0.30615234375, -0.25457763671875, -0.2030029296875, -0.15142822265625, -0.099853515625, -0.04827880859375, 0.0032958984375, 0.05487060546875, 0.1064453125, 0.15802001953125, 0.2095947265625, 0.26116943359375, 0.312744140625, 0.36431884765625, 0.4158935546875, 0.46746826171875, 0.51904296875, 0.57061767578125, 0.6221923828125, 0.67376708984375, 0.725341796875, 0.77691650390625, 0.8284912109375, 0.88006591796875, 0.931640625, 0.98321533203125, 1.0347900390625, 1.08636474609375, 1.137939453125, 1.18951416015625, 1.2410888671875, 1.29266357421875, 1.34423828125, 1.39581298828125, 1.4473876953125, 1.49896240234375, 1.550537109375, 1.60211181640625, 1.6536865234375, 1.70526123046875, 1.7568359375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 2.0, 5.0, 12.0, 14.0, 15.0, 19.0, 18.0, 21.0, 27.0, 33.0, 44.0, 57.0, 51.0, 54.0, 66.0, 79.0, 86.0, 85.0, 52.0, 54.0, 45.0, 25.0, 33.0, 22.0, 20.0, 13.0, 8.0, 17.0, 4.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5400390625, -0.51953125, -0.4990234375, -0.478515625, -0.4580078125, -0.4375, -0.4169921875, -0.396484375, -0.3759765625, -0.35546875, -0.3349609375, -0.314453125, -0.2939453125, -0.2734375, -0.2529296875, -0.232421875, -0.2119140625, -0.19140625, -0.1708984375, -0.150390625, -0.1298828125, -0.109375, -0.0888671875, -0.068359375, -0.0478515625, -0.02734375, -0.0068359375, 0.013671875, 0.0341796875, 0.0546875, 0.0751953125, 0.095703125, 0.1162109375, 0.13671875, 0.1572265625, 0.177734375, 0.1982421875, 0.21875, 0.2392578125, 0.259765625, 0.2802734375, 0.30078125, 0.3212890625, 0.341796875, 0.3623046875, 0.3828125, 0.4033203125, 0.423828125, 0.4443359375, 0.46484375, 0.4853515625, 0.505859375, 0.5263671875, 0.546875, 0.5673828125, 0.587890625, 0.6083984375, 0.62890625, 0.6494140625, 0.669921875, 0.6904296875, 0.7109375, 0.7314453125, 0.751953125, 0.7724609375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 7.0, 5.0, 8.0, 4.0, 14.0, 15.0, 39.0, 33.0, 77.0, 98.0, 154.0, 287.0, 626.0, 2188.0, 16135.0, 811051.0, 3319755.0, 38217.0, 3877.0, 853.0, 315.0, 171.0, 126.0, 86.0, 41.0, 32.0, 20.0, 11.0, 4.0, 6.0, 5.0, 6.0, 2.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6611328125, -1.6060638427734375, -1.550994873046875, -1.4959259033203125, -1.44085693359375, -1.3857879638671875, -1.330718994140625, -1.2756500244140625, -1.2205810546875, -1.1655120849609375, -1.110443115234375, -1.0553741455078125, -1.00030517578125, -0.9452362060546875, -0.890167236328125, -0.8350982666015625, -0.780029296875, -0.7249603271484375, -0.669891357421875, -0.6148223876953125, -0.55975341796875, -0.5046844482421875, -0.449615478515625, -0.3945465087890625, -0.3394775390625, -0.2844085693359375, -0.229339599609375, -0.1742706298828125, -0.11920166015625, -0.0641326904296875, -0.009063720703125, 0.0460052490234375, 0.10107421875, 0.1561431884765625, 0.211212158203125, 0.2662811279296875, 0.32135009765625, 0.3764190673828125, 0.431488037109375, 0.4865570068359375, 0.5416259765625, 0.5966949462890625, 0.651763916015625, 0.7068328857421875, 0.76190185546875, 0.8169708251953125, 0.872039794921875, 0.9271087646484375, 0.982177734375, 1.0372467041015625, 1.092315673828125, 1.1473846435546875, 1.20245361328125, 1.2575225830078125, 1.312591552734375, 1.3676605224609375, 1.4227294921875, 1.4777984619140625, 1.532867431640625, 1.5879364013671875, 1.64300537109375, 1.6980743408203125, 1.753143310546875, 1.8082122802734375, 1.86328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 7.0, 7.0, 8.0, 10.0, 21.0, 26.0, 29.0, 79.0, 148.0, 314.0, 680.0, 1057.0, 835.0, 421.0, 192.0, 83.0, 52.0, 32.0, 24.0, 8.0, 9.0, 5.0, 3.0, 9.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.95458984375, -0.9224472045898438, -0.8903045654296875, -0.8581619262695312, -0.826019287109375, -0.7938766479492188, -0.7617340087890625, -0.7295913696289062, -0.69744873046875, -0.6653060913085938, -0.6331634521484375, -0.6010208129882812, -0.568878173828125, -0.5367355346679688, -0.5045928955078125, -0.47245025634765625, -0.4403076171875, -0.40816497802734375, -0.3760223388671875, -0.34387969970703125, -0.311737060546875, -0.27959442138671875, -0.2474517822265625, -0.21530914306640625, -0.18316650390625, -0.15102386474609375, -0.1188812255859375, -0.08673858642578125, -0.054595947265625, -0.02245330810546875, 0.0096893310546875, 0.04183197021484375, 0.073974609375, 0.10611724853515625, 0.1382598876953125, 0.17040252685546875, 0.202545166015625, 0.23468780517578125, 0.2668304443359375, 0.29897308349609375, 0.33111572265625, 0.36325836181640625, 0.3954010009765625, 0.42754364013671875, 0.459686279296875, 0.49182891845703125, 0.5239715576171875, 0.5561141967773438, 0.5882568359375, 0.6203994750976562, 0.6525421142578125, 0.6846847534179688, 0.716827392578125, 0.7489700317382812, 0.7811126708984375, 0.8132553100585938, 0.84539794921875, 0.8775405883789062, 0.9096832275390625, 0.9418258666992188, 0.973968505859375, 1.0061111450195312, 1.0382537841796875, 1.0703964233398438, 1.1025390625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 14.0, 38.0, 123.0, 284.0, 331.0, 143.0, 46.0, 10.0, 6.0, 6.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.77174711227417, -3.5238101482391357, -3.2758731842041016, -3.0279359817504883, -2.779999017715454, -2.53206205368042, -2.2841248512268066, -2.0361878871917725, -1.7882509231567383, -1.540313959121704, -1.2923768758773804, -1.0444397926330566, -0.7965028285980225, -0.5485658645629883, -0.30062878131866455, -0.05269169807434082, 0.19524526596069336, 0.4431822896003723, 0.6911193132400513, 0.9390563368797302, 1.1869933605194092, 1.4349303245544434, 1.682867407798767, 1.9308044910430908, 2.178741455078125, 2.426678419113159, 2.6746153831481934, 2.9225525856018066, 3.170489549636841, 3.418426513671875, 3.6663637161254883, 3.9143006801605225, 4.162238121032715, 4.410175323486328, 4.658112049102783, 4.9060492515563965, 5.153985977172852, 5.401923179626465, 5.649860382080078, 5.897797584533691, 6.1457343101501465, 6.39367151260376, 6.641608238220215, 6.889545440673828, 7.137482643127441, 7.3854193687438965, 7.63335657119751, 7.881293296813965, 8.129230499267578, 8.377167701721191, 8.625104904174805, 8.873041152954102, 9.120978355407715, 9.368915557861328, 9.616852760314941, 9.864789962768555, 10.112726211547852, 10.360663414001465, 10.608600616455078, 10.856536865234375, 11.104474067687988, 11.352411270141602, 11.600348472595215, 11.848285675048828, 12.096222877502441]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 4.0, 13.0, 3.0, 18.0, 24.0, 18.0, 30.0, 25.0, 35.0, 39.0, 38.0, 53.0, 44.0, 55.0, 46.0, 41.0, 62.0, 52.0, 53.0, 47.0, 45.0, 46.0, 19.0, 33.0, 31.0, 28.0, 24.0, 12.0, 7.0, 9.0, 8.0, 11.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.0332794189453125, -1.9716863632202148, -1.9100933074951172, -1.8485002517700195, -1.7869071960449219, -1.7253141403198242, -1.6637210845947266, -1.6021279096603394, -1.5405348539352417, -1.478941798210144, -1.4173487424850464, -1.3557556867599487, -1.294162631034851, -1.2325694561004639, -1.1709764003753662, -1.1093833446502686, -1.047790288925171, -0.9861972332000732, -0.9246041774749756, -0.8630111217498779, -0.8014180064201355, -0.7398249506950378, -0.6782318949699402, -0.6166387796401978, -0.5550458431243896, -0.493452787399292, -0.43185970187187195, -0.3702666461467743, -0.30867356061935425, -0.2470805048942566, -0.18548744916915894, -0.12389436364173889, -0.06230127811431885, -0.000708211213350296, 0.060884855687618256, 0.12247791886329651, 0.18407098948955536, 0.2456640601158142, 0.30725711584091187, 0.3688502013683319, 0.43044325709342957, 0.4920363128185272, 0.5536293983459473, 0.6152224540710449, 0.6768155097961426, 0.7384085655212402, 0.8000016212463379, 0.8615947365760803, 0.923187792301178, 0.9847808480262756, 1.046373963356018, 1.1079670190811157, 1.1695600748062134, 1.231153130531311, 1.2927461862564087, 1.3543392419815063, 1.415932297706604, 1.4775253534317017, 1.5391184091567993, 1.600711464881897, 1.6623045206069946, 1.7238976955413818, 1.7854907512664795, 1.8470838069915771, 1.9086768627166748]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 5.0, 6.0, 7.0, 10.0, 18.0, 22.0, 24.0, 42.0, 44.0, 71.0, 109.0, 153.0, 208.0, 332.0, 481.0, 794.0, 1310.0, 2571.0, 4991.0, 12471.0, 72448.0, 748501.0, 171086.0, 19209.0, 6313.0, 3033.0, 1591.0, 968.0, 572.0, 358.0, 250.0, 169.0, 119.0, 83.0, 47.0, 31.0, 23.0, 24.0, 11.0, 14.0, 10.0, 10.0, 6.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.625, -1.571990966796875, -1.51898193359375, -1.465972900390625, -1.4129638671875, -1.359954833984375, -1.30694580078125, -1.253936767578125, -1.200927734375, -1.147918701171875, -1.09490966796875, -1.041900634765625, -0.9888916015625, -0.935882568359375, -0.88287353515625, -0.829864501953125, -0.77685546875, -0.723846435546875, -0.67083740234375, -0.617828369140625, -0.5648193359375, -0.511810302734375, -0.45880126953125, -0.405792236328125, -0.352783203125, -0.299774169921875, -0.24676513671875, -0.193756103515625, -0.1407470703125, -0.087738037109375, -0.03472900390625, 0.018280029296875, 0.0712890625, 0.124298095703125, 0.17730712890625, 0.230316162109375, 0.2833251953125, 0.336334228515625, 0.38934326171875, 0.442352294921875, 0.495361328125, 0.548370361328125, 0.60137939453125, 0.654388427734375, 0.7073974609375, 0.760406494140625, 0.81341552734375, 0.866424560546875, 0.91943359375, 0.972442626953125, 1.02545166015625, 1.078460693359375, 1.1314697265625, 1.184478759765625, 1.23748779296875, 1.290496826171875, 1.343505859375, 1.396514892578125, 1.44952392578125, 1.502532958984375, 1.5555419921875, 1.608551025390625, 1.66156005859375, 1.714569091796875, 1.767578125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 5.0, 3.0, 6.0, 9.0, 13.0, 19.0, 17.0, 21.0, 29.0, 27.0, 31.0, 50.0, 46.0, 53.0, 57.0, 70.0, 79.0, 86.0, 76.0, 65.0, 44.0, 48.0, 29.0, 25.0, 25.0, 12.0, 14.0, 16.0, 7.0, 8.0, 1.0, 4.0, 4.0, 2.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57763671875, -0.55718994140625, -0.5367431640625, -0.51629638671875, -0.495849609375, -0.47540283203125, -0.4549560546875, -0.43450927734375, -0.4140625, -0.39361572265625, -0.3731689453125, -0.35272216796875, -0.332275390625, -0.31182861328125, -0.2913818359375, -0.27093505859375, -0.25048828125, -0.23004150390625, -0.2095947265625, -0.18914794921875, -0.168701171875, -0.14825439453125, -0.1278076171875, -0.10736083984375, -0.0869140625, -0.06646728515625, -0.0460205078125, -0.02557373046875, -0.005126953125, 0.01531982421875, 0.0357666015625, 0.05621337890625, 0.07666015625, 0.09710693359375, 0.1175537109375, 0.13800048828125, 0.158447265625, 0.17889404296875, 0.1993408203125, 0.21978759765625, 0.240234375, 0.26068115234375, 0.2811279296875, 0.30157470703125, 0.322021484375, 0.34246826171875, 0.3629150390625, 0.38336181640625, 0.40380859375, 0.42425537109375, 0.4447021484375, 0.46514892578125, 0.485595703125, 0.50604248046875, 0.5264892578125, 0.54693603515625, 0.5673828125, 0.58782958984375, 0.6082763671875, 0.62872314453125, 0.649169921875, 0.66961669921875, 0.6900634765625, 0.71051025390625, 0.73095703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 8.0, 3.0, 10.0, 5.0, 12.0, 25.0, 25.0, 28.0, 33.0, 44.0, 64.0, 85.0, 141.0, 333.0, 1389.0, 11422.0, 142652.0, 669040.0, 204272.0, 16253.0, 1812.0, 349.0, 154.0, 113.0, 77.0, 40.0, 40.0, 28.0, 18.0, 17.0, 12.0, 9.0, 9.0, 3.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.080078125, -1.0469207763671875, -1.013763427734375, -0.9806060791015625, -0.94744873046875, -0.9142913818359375, -0.881134033203125, -0.8479766845703125, -0.8148193359375, -0.7816619873046875, -0.748504638671875, -0.7153472900390625, -0.68218994140625, -0.6490325927734375, -0.615875244140625, -0.5827178955078125, -0.549560546875, -0.5164031982421875, -0.483245849609375, -0.4500885009765625, -0.41693115234375, -0.3837738037109375, -0.350616455078125, -0.3174591064453125, -0.2843017578125, -0.2511444091796875, -0.217987060546875, -0.1848297119140625, -0.15167236328125, -0.1185150146484375, -0.085357666015625, -0.0522003173828125, -0.01904296875, 0.0141143798828125, 0.047271728515625, 0.0804290771484375, 0.11358642578125, 0.1467437744140625, 0.179901123046875, 0.2130584716796875, 0.2462158203125, 0.2793731689453125, 0.312530517578125, 0.3456878662109375, 0.37884521484375, 0.4120025634765625, 0.445159912109375, 0.4783172607421875, 0.511474609375, 0.5446319580078125, 0.577789306640625, 0.6109466552734375, 0.64410400390625, 0.6772613525390625, 0.710418701171875, 0.7435760498046875, 0.7767333984375, 0.8098907470703125, 0.843048095703125, 0.8762054443359375, 0.90936279296875, 0.9425201416015625, 0.975677490234375, 1.0088348388671875, 1.0419921875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 7.0, 3.0, 7.0, 6.0, 8.0, 9.0, 10.0, 10.0, 17.0, 15.0, 29.0, 19.0, 19.0, 36.0, 31.0, 41.0, 28.0, 37.0, 52.0, 47.0, 47.0, 41.0, 55.0, 38.0, 40.0, 37.0, 38.0, 28.0, 49.0, 23.0, 28.0, 15.0, 20.0, 24.0, 15.0, 14.0, 13.0, 10.0, 13.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.1220703125, -1.0874176025390625, -1.052764892578125, -1.0181121826171875, -0.98345947265625, -0.9488067626953125, -0.914154052734375, -0.8795013427734375, -0.8448486328125, -0.8101959228515625, -0.775543212890625, -0.7408905029296875, -0.70623779296875, -0.6715850830078125, -0.636932373046875, -0.6022796630859375, -0.567626953125, -0.5329742431640625, -0.498321533203125, -0.4636688232421875, -0.42901611328125, -0.3943634033203125, -0.359710693359375, -0.3250579833984375, -0.2904052734375, -0.2557525634765625, -0.221099853515625, -0.1864471435546875, -0.15179443359375, -0.1171417236328125, -0.082489013671875, -0.0478363037109375, -0.01318359375, 0.0214691162109375, 0.056121826171875, 0.0907745361328125, 0.12542724609375, 0.1600799560546875, 0.194732666015625, 0.2293853759765625, 0.2640380859375, 0.2986907958984375, 0.333343505859375, 0.3679962158203125, 0.40264892578125, 0.4373016357421875, 0.471954345703125, 0.5066070556640625, 0.541259765625, 0.5759124755859375, 0.610565185546875, 0.6452178955078125, 0.67987060546875, 0.7145233154296875, 0.749176025390625, 0.7838287353515625, 0.8184814453125, 0.8531341552734375, 0.887786865234375, 0.9224395751953125, 0.95709228515625, 0.9917449951171875, 1.026397705078125, 1.0610504150390625, 1.095703125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 6.0, 6.0, 12.0, 19.0, 20.0, 31.0, 42.0, 62.0, 98.0, 180.0, 255.0, 626.0, 1563.0, 5336.0, 21574.0, 124429.0, 527119.0, 302261.0, 49694.0, 10301.0, 2920.0, 984.0, 438.0, 222.0, 137.0, 78.0, 41.0, 24.0, 26.0, 17.0, 14.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267333984375, -0.2594127655029297, -0.2514915466308594, -0.24357032775878906, -0.23564910888671875, -0.22772789001464844, -0.21980667114257812, -0.2118854522705078, -0.2039642333984375, -0.1960430145263672, -0.18812179565429688, -0.18020057678222656, -0.17227935791015625, -0.16435813903808594, -0.15643692016601562, -0.1485157012939453, -0.140594482421875, -0.1326732635498047, -0.12475204467773438, -0.11683082580566406, -0.10890960693359375, -0.10098838806152344, -0.09306716918945312, -0.08514595031738281, -0.0772247314453125, -0.06930351257324219, -0.061382293701171875, -0.05346107482910156, -0.04553985595703125, -0.03761863708496094, -0.029697418212890625, -0.021776199340820312, -0.01385498046875, -0.0059337615966796875, 0.001987457275390625, 0.009908676147460938, 0.01782989501953125, 0.025751113891601562, 0.033672332763671875, 0.04159355163574219, 0.0495147705078125, 0.05743598937988281, 0.06535720825195312, 0.07327842712402344, 0.08119964599609375, 0.08912086486816406, 0.09704208374023438, 0.10496330261230469, 0.112884521484375, 0.12080574035644531, 0.12872695922851562, 0.13664817810058594, 0.14456939697265625, 0.15249061584472656, 0.16041183471679688, 0.1683330535888672, 0.1762542724609375, 0.1841754913330078, 0.19209671020507812, 0.20001792907714844, 0.20793914794921875, 0.21586036682128906, 0.22378158569335938, 0.2317028045654297, 0.2396240234375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 8.0, 7.0, 9.0, 14.0, 16.0, 34.0, 31.0, 50.0, 57.0, 87.0, 81.0, 109.0, 90.0, 102.0, 65.0, 66.0, 57.0, 34.0, 26.0, 11.0, 17.0, 11.0, 7.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.996755599975586e-05, -1.933891326189041e-05, -1.8710270524024963e-05, -1.8081627786159515e-05, -1.7452985048294067e-05, -1.682434231042862e-05, -1.619569957256317e-05, -1.5567056834697723e-05, -1.4938414096832275e-05, -1.4309771358966827e-05, -1.368112862110138e-05, -1.3052485883235931e-05, -1.2423843145370483e-05, -1.1795200407505035e-05, -1.1166557669639587e-05, -1.053791493177414e-05, -9.909272193908691e-06, -9.280629456043243e-06, -8.651986718177795e-06, -8.023343980312347e-06, -7.394701242446899e-06, -6.766058504581451e-06, -6.137415766716003e-06, -5.508773028850555e-06, -4.880130290985107e-06, -4.2514875531196594e-06, -3.6228448152542114e-06, -2.9942020773887634e-06, -2.3655593395233154e-06, -1.7369166016578674e-06, -1.1082738637924194e-06, -4.796311259269714e-07, 1.4901161193847656e-07, 7.776543498039246e-07, 1.4062970876693726e-06, 2.0349398255348206e-06, 2.6635825634002686e-06, 3.2922253012657166e-06, 3.9208680391311646e-06, 4.5495107769966125e-06, 5.1781535148620605e-06, 5.8067962527275085e-06, 6.4354389905929565e-06, 7.0640817284584045e-06, 7.692724466323853e-06, 8.3213672041893e-06, 8.950009942054749e-06, 9.578652679920197e-06, 1.0207295417785645e-05, 1.0835938155651093e-05, 1.146458089351654e-05, 1.2093223631381989e-05, 1.2721866369247437e-05, 1.3350509107112885e-05, 1.3979151844978333e-05, 1.460779458284378e-05, 1.5236437320709229e-05, 1.5865080058574677e-05, 1.6493722796440125e-05, 1.7122365534305573e-05, 1.775100827217102e-05, 1.837965101003647e-05, 1.9008293747901917e-05, 1.9636936485767365e-05, 2.0265579223632812e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 11.0, 20.0, 25.0, 42.0, 71.0, 121.0, 250.0, 523.0, 1133.0, 2648.0, 7645.0, 36110.0, 297016.0, 583167.0, 97408.0, 14957.0, 4227.0, 1649.0, 751.0, 351.0, 189.0, 101.0, 50.0, 38.0, 15.0, 8.0, 9.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2496337890625, -0.2393360137939453, -0.22903823852539062, -0.21874046325683594, -0.20844268798828125, -0.19814491271972656, -0.18784713745117188, -0.1775493621826172, -0.1672515869140625, -0.1569538116455078, -0.14665603637695312, -0.13635826110839844, -0.12606048583984375, -0.11576271057128906, -0.10546493530273438, -0.09516716003417969, -0.084869384765625, -0.07457160949707031, -0.06427383422851562, -0.05397605895996094, -0.04367828369140625, -0.03338050842285156, -0.023082733154296875, -0.012784957885742188, -0.0024871826171875, 0.0078105926513671875, 0.018108367919921875, 0.028406143188476562, 0.03870391845703125, 0.04900169372558594, 0.059299468994140625, 0.06959724426269531, 0.07989501953125, 0.09019279479980469, 0.10049057006835938, 0.11078834533691406, 0.12108612060546875, 0.13138389587402344, 0.14168167114257812, 0.1519794464111328, 0.1622772216796875, 0.1725749969482422, 0.18287277221679688, 0.19317054748535156, 0.20346832275390625, 0.21376609802246094, 0.22406387329101562, 0.2343616485595703, 0.244659423828125, 0.2549571990966797, 0.2652549743652344, 0.27555274963378906, 0.28585052490234375, 0.29614830017089844, 0.3064460754394531, 0.3167438507080078, 0.3270416259765625, 0.3373394012451172, 0.3476371765136719, 0.35793495178222656, 0.36823272705078125, 0.37853050231933594, 0.3888282775878906, 0.3991260528564453, 0.409423828125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 10.0, 10.0, 9.0, 16.0, 26.0, 25.0, 33.0, 45.0, 64.0, 60.0, 72.0, 90.0, 81.0, 72.0, 75.0, 71.0, 50.0, 52.0, 31.0, 26.0, 21.0, 17.0, 13.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26123046875, -0.2540321350097656, -0.24683380126953125, -0.23963546752929688, -0.2324371337890625, -0.22523880004882812, -0.21804046630859375, -0.21084213256835938, -0.203643798828125, -0.19644546508789062, -0.18924713134765625, -0.18204879760742188, -0.1748504638671875, -0.16765213012695312, -0.16045379638671875, -0.15325546264648438, -0.14605712890625, -0.13885879516601562, -0.13166046142578125, -0.12446212768554688, -0.1172637939453125, -0.11006546020507812, -0.10286712646484375, -0.09566879272460938, -0.088470458984375, -0.08127212524414062, -0.07407379150390625, -0.06687545776367188, -0.0596771240234375, -0.052478790283203125, -0.04528045654296875, -0.038082122802734375, -0.0308837890625, -0.023685455322265625, -0.01648712158203125, -0.009288787841796875, -0.0020904541015625, 0.005107879638671875, 0.01230621337890625, 0.019504547119140625, 0.026702880859375, 0.033901214599609375, 0.04109954833984375, 0.048297882080078125, 0.0554962158203125, 0.06269454956054688, 0.06989288330078125, 0.07709121704101562, 0.08428955078125, 0.09148788452148438, 0.09868621826171875, 0.10588455200195312, 0.1130828857421875, 0.12028121948242188, 0.12747955322265625, 0.13467788696289062, 0.141876220703125, 0.14907455444335938, 0.15627288818359375, 0.16347122192382812, 0.1706695556640625, 0.17786788940429688, 0.18506622314453125, 0.19226455688476562, 0.199462890625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 5.0, 8.0, 10.0, 20.0, 35.0, 74.0, 153.0, 197.0, 178.0, 147.0, 77.0, 56.0, 29.0, 3.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.540344476699829, -2.373117446899414, -2.20589017868042, -2.038662910461426, -1.8714358806610107, -1.7042087316513062, -1.5369815826416016, -1.369754433631897, -1.2025272846221924, -1.0353001356124878, -0.8680729866027832, -0.7008458375930786, -0.533618688583374, -0.36639153957366943, -0.19916439056396484, -0.031937241554260254, 0.13528990745544434, 0.3025170564651489, 0.4697442054748535, 0.6369713544845581, 0.8041985034942627, 0.9714256525039673, 1.1386528015136719, 1.3058799505233765, 1.473107099533081, 1.6403342485427856, 1.8075613975524902, 1.9747885465621948, 2.1420156955718994, 2.3092427253723145, 2.4764699935913086, 2.6436972618103027, 2.810924530029297, 2.978151798248291, 3.145378828048706, 3.312605857849121, 3.4798331260681152, 3.6470603942871094, 3.8142874240875244, 3.9815144538879395, 4.148741722106934, 4.315968990325928, 4.483196258544922, 4.650423049926758, 4.817650318145752, 4.984877586364746, 5.152104377746582, 5.319331645965576, 5.48655891418457, 5.6537861824035645, 5.821013450622559, 5.9882402420043945, 6.155467510223389, 6.322694778442383, 6.489921569824219, 6.657148838043213, 6.824376106262207, 6.991603374481201, 7.158830642700195, 7.326057434082031, 7.493284702301025, 7.6605119705200195, 7.8277387619018555, 7.99496603012085, 8.162193298339844]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 11.0, 9.0, 9.0, 15.0, 16.0, 14.0, 16.0, 30.0, 26.0, 31.0, 38.0, 33.0, 52.0, 51.0, 49.0, 40.0, 56.0, 45.0, 51.0, 47.0, 37.0, 38.0, 35.0, 54.0, 39.0, 30.0, 23.0, 21.0, 22.0, 16.0, 14.0, 9.0, 11.0, 3.0, 3.0, 0.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.675540924072266, -6.467463493347168, -6.259385585784912, -6.051307678222656, -5.843230247497559, -5.635152816772461, -5.427074909210205, -5.218997001647949, -5.010919570922852, -4.802842140197754, -4.594764232635498, -4.386686325073242, -4.1786088943481445, -3.9705312252044678, -3.762453556060791, -3.5543758869171143, -3.3462982177734375, -3.1382205486297607, -2.930142879486084, -2.7220652103424072, -2.5139875411987305, -2.3059098720550537, -2.097832202911377, -1.8897545337677002, -1.6816768646240234, -1.4735991954803467, -1.26552152633667, -1.0574438571929932, -0.8493661880493164, -0.6412885189056396, -0.4332108497619629, -0.22513318061828613, -0.017055034637451172, 0.19102263450622559, 0.39910030364990234, 0.6071779727935791, 0.8152556419372559, 1.0233333110809326, 1.2314109802246094, 1.4394886493682861, 1.647566318511963, 1.8556439876556396, 2.0637216567993164, 2.271799325942993, 2.47987699508667, 2.6879546642303467, 2.8960323333740234, 3.1041100025177, 3.312187671661377, 3.5202653408050537, 3.7283430099487305, 3.9364206790924072, 4.144498348236084, 4.35257625579834, 4.5606536865234375, 4.768731117248535, 4.976809024810791, 5.184886932373047, 5.3929643630981445, 5.601041793823242, 5.809119701385498, 6.017197608947754, 6.225275039672852, 6.433352470397949, 6.641430377960205]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 7.0, 7.0, 4.0, 4.0, 9.0, 11.0, 7.0, 11.0, 19.0, 17.0, 20.0, 31.0, 36.0, 69.0, 81.0, 167.0, 456.0, 1379.0, 11321.0, 1551596.0, 2611007.0, 15213.0, 1772.0, 484.0, 197.0, 89.0, 58.0, 40.0, 35.0, 30.0, 19.0, 18.0, 19.0, 6.0, 7.0, 8.0, 6.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-3.46484375, -3.363067626953125, -3.26129150390625, -3.159515380859375, -3.0577392578125, -2.955963134765625, -2.85418701171875, -2.752410888671875, -2.650634765625, -2.548858642578125, -2.44708251953125, -2.345306396484375, -2.2435302734375, -2.141754150390625, -2.03997802734375, -1.938201904296875, -1.83642578125, -1.734649658203125, -1.63287353515625, -1.531097412109375, -1.4293212890625, -1.327545166015625, -1.22576904296875, -1.123992919921875, -1.022216796875, -0.920440673828125, -0.81866455078125, -0.716888427734375, -0.6151123046875, -0.513336181640625, -0.41156005859375, -0.309783935546875, -0.2080078125, -0.106231689453125, -0.00445556640625, 0.097320556640625, 0.1990966796875, 0.300872802734375, 0.40264892578125, 0.504425048828125, 0.606201171875, 0.707977294921875, 0.80975341796875, 0.911529541015625, 1.0133056640625, 1.115081787109375, 1.21685791015625, 1.318634033203125, 1.42041015625, 1.522186279296875, 1.62396240234375, 1.725738525390625, 1.8275146484375, 1.929290771484375, 2.03106689453125, 2.132843017578125, 2.234619140625, 2.336395263671875, 2.43817138671875, 2.539947509765625, 2.6417236328125, 2.743499755859375, 2.84527587890625, 2.947052001953125, 3.048828125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 7.0, 7.0, 12.0, 8.0, 10.0, 13.0, 14.0, 15.0, 21.0, 35.0, 26.0, 36.0, 35.0, 58.0, 65.0, 57.0, 63.0, 61.0, 60.0, 49.0, 55.0, 47.0, 40.0, 43.0, 25.0, 22.0, 25.0, 26.0, 13.0, 10.0, 8.0, 6.0, 10.0, 4.0, 7.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.552734375, -0.5361328125, -0.51953125, -0.5029296875, -0.486328125, -0.4697265625, -0.453125, -0.4365234375, -0.419921875, -0.4033203125, -0.38671875, -0.3701171875, -0.353515625, -0.3369140625, -0.3203125, -0.3037109375, -0.287109375, -0.2705078125, -0.25390625, -0.2373046875, -0.220703125, -0.2041015625, -0.1875, -0.1708984375, -0.154296875, -0.1376953125, -0.12109375, -0.1044921875, -0.087890625, -0.0712890625, -0.0546875, -0.0380859375, -0.021484375, -0.0048828125, 0.01171875, 0.0283203125, 0.044921875, 0.0615234375, 0.078125, 0.0947265625, 0.111328125, 0.1279296875, 0.14453125, 0.1611328125, 0.177734375, 0.1943359375, 0.2109375, 0.2275390625, 0.244140625, 0.2607421875, 0.27734375, 0.2939453125, 0.310546875, 0.3271484375, 0.34375, 0.3603515625, 0.376953125, 0.3935546875, 0.41015625, 0.4267578125, 0.443359375, 0.4599609375, 0.4765625, 0.4931640625, 0.509765625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 12.0, 16.0, 29.0, 55.0, 110.0, 256.0, 593.0, 1660.0, 5860.0, 24051.0, 120100.0, 650178.0, 2232700.0, 936656.0, 176280.0, 34324.0, 7890.0, 2199.0, 718.0, 285.0, 141.0, 54.0, 35.0, 19.0, 14.0, 10.0, 5.0, 3.0, 3.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1708984375, -1.1370697021484375, -1.103240966796875, -1.0694122314453125, -1.03558349609375, -1.0017547607421875, -0.967926025390625, -0.9340972900390625, -0.9002685546875, -0.8664398193359375, -0.832611083984375, -0.7987823486328125, -0.76495361328125, -0.7311248779296875, -0.697296142578125, -0.6634674072265625, -0.629638671875, -0.5958099365234375, -0.561981201171875, -0.5281524658203125, -0.49432373046875, -0.4604949951171875, -0.426666259765625, -0.3928375244140625, -0.3590087890625, -0.3251800537109375, -0.291351318359375, -0.2575225830078125, -0.22369384765625, -0.1898651123046875, -0.156036376953125, -0.1222076416015625, -0.08837890625, -0.0545501708984375, -0.020721435546875, 0.0131072998046875, 0.04693603515625, 0.0807647705078125, 0.114593505859375, 0.1484222412109375, 0.1822509765625, 0.2160797119140625, 0.249908447265625, 0.2837371826171875, 0.31756591796875, 0.3513946533203125, 0.385223388671875, 0.4190521240234375, 0.452880859375, 0.4867095947265625, 0.520538330078125, 0.5543670654296875, 0.58819580078125, 0.6220245361328125, 0.655853271484375, 0.6896820068359375, 0.7235107421875, 0.7573394775390625, 0.791168212890625, 0.8249969482421875, 0.85882568359375, 0.8926544189453125, 0.926483154296875, 0.9603118896484375, 0.994140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 3.0, 7.0, 7.0, 7.0, 10.0, 17.0, 28.0, 35.0, 46.0, 49.0, 75.0, 85.0, 144.0, 166.0, 208.0, 271.0, 355.0, 419.0, 397.0, 422.0, 304.0, 239.0, 203.0, 138.0, 116.0, 74.0, 66.0, 52.0, 35.0, 19.0, 20.0, 22.0, 7.0, 13.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5078125, -0.4925956726074219, -0.47737884521484375, -0.4621620178222656, -0.4469451904296875, -0.4317283630371094, -0.41651153564453125, -0.4012947082519531, -0.386077880859375, -0.3708610534667969, -0.35564422607421875, -0.3404273986816406, -0.3252105712890625, -0.3099937438964844, -0.29477691650390625, -0.2795600891113281, -0.26434326171875, -0.24912643432617188, -0.23390960693359375, -0.21869277954101562, -0.2034759521484375, -0.18825912475585938, -0.17304229736328125, -0.15782546997070312, -0.142608642578125, -0.12739181518554688, -0.11217498779296875, -0.09695816040039062, -0.0817413330078125, -0.06652450561523438, -0.05130767822265625, -0.036090850830078125, -0.0208740234375, -0.005657196044921875, 0.00955963134765625, 0.024776458740234375, 0.0399932861328125, 0.055210113525390625, 0.07042694091796875, 0.08564376831054688, 0.100860595703125, 0.11607742309570312, 0.13129425048828125, 0.14651107788085938, 0.1617279052734375, 0.17694473266601562, 0.19216156005859375, 0.20737838745117188, 0.22259521484375, 0.23781204223632812, 0.25302886962890625, 0.2682456970214844, 0.2834625244140625, 0.2986793518066406, 0.31389617919921875, 0.3291130065917969, 0.344329833984375, 0.3595466613769531, 0.37476348876953125, 0.3899803161621094, 0.4051971435546875, 0.4204139709472656, 0.43563079833984375, 0.4508476257324219, 0.466064453125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 17.0, 19.0, 54.0, 93.0, 140.0, 173.0, 194.0, 140.0, 93.0, 35.0, 22.0, 10.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.714191436767578, -6.575214385986328, -6.436237812042236, -6.297260761260986, -6.158283710479736, -6.0193071365356445, -5.8803300857543945, -5.7413530349731445, -5.6023759841918945, -5.4633989334106445, -5.324422359466553, -5.185445308685303, -5.046468257904053, -4.907491683959961, -4.768514633178711, -4.629537582397461, -4.490561008453369, -4.351583957672119, -4.212607383728027, -4.073630332946777, -3.9346532821655273, -3.7956764698028564, -3.6566996574401855, -3.5177226066589355, -3.3787457942962646, -3.2397689819335938, -3.1007919311523438, -2.961815118789673, -2.822838306427002, -2.683861255645752, -2.544884443283081, -2.40590763092041, -2.26693058013916, -2.1279537677764893, -1.9889767169952393, -1.8499999046325684, -1.711022973060608, -1.5720460414886475, -1.4330692291259766, -1.2940922975540161, -1.1551153659820557, -1.0161384344100952, -0.8771615624427795, -0.7381846904754639, -0.5992077589035034, -0.46023082733154297, -0.3212539553642273, -0.18227708339691162, -0.04330015182495117, 0.09567674994468689, 0.23465365171432495, 0.373630553483963, 0.5126074552536011, 0.6515843868255615, 0.7905612587928772, 0.9295381307601929, 1.0685150623321533, 1.2074919939041138, 1.3464689254760742, 1.4854457378387451, 1.6244226694107056, 1.763399600982666, 1.902376413345337, 2.041353225708008, 2.180330276489258]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 7.0, 14.0, 13.0, 15.0, 13.0, 27.0, 30.0, 27.0, 34.0, 40.0, 41.0, 39.0, 42.0, 38.0, 37.0, 51.0, 60.0, 66.0, 47.0, 44.0, 43.0, 41.0, 34.0, 38.0, 27.0, 18.0, 18.0, 17.0, 18.0, 18.0, 10.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7768627405166626, -1.7180747985839844, -1.6592869758605957, -1.600499153137207, -1.5417112112045288, -1.4829232692718506, -1.424135446548462, -1.3653476238250732, -1.306559681892395, -1.2477717399597168, -1.1889839172363281, -1.1301960945129395, -1.0714081525802612, -1.012620210647583, -0.9538323879241943, -0.8950445055961609, -0.8362566232681274, -0.777468740940094, -0.7186808586120605, -0.6598929762840271, -0.6011050939559937, -0.5423172116279602, -0.48352932929992676, -0.4247414469718933, -0.36595356464385986, -0.3071656823158264, -0.24837779998779297, -0.18958991765975952, -0.13080203533172607, -0.07201415300369263, -0.01322627067565918, 0.04556161165237427, 0.10434961318969727, 0.1631374955177307, 0.22192537784576416, 0.2807132601737976, 0.33950114250183105, 0.3982890248298645, 0.45707690715789795, 0.5158647894859314, 0.5746526718139648, 0.6334405541419983, 0.6922284364700317, 0.7510163187980652, 0.8098042011260986, 0.8685920834541321, 0.9273799657821655, 0.986167848110199, 1.0449557304382324, 1.103743553161621, 1.1625314950942993, 1.2213194370269775, 1.2801072597503662, 1.3388950824737549, 1.397683024406433, 1.4564709663391113, 1.5152587890625, 1.5740466117858887, 1.632834553718567, 1.6916224956512451, 1.7504103183746338, 1.8091981410980225, 1.8679860830307007, 1.926774024963379, 1.9855618476867676]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 13.0, 25.0, 16.0, 42.0, 44.0, 67.0, 102.0, 209.0, 334.0, 535.0, 1067.0, 2037.0, 4410.0, 10007.0, 24547.0, 61742.0, 154305.0, 301618.0, 272747.0, 128081.0, 49966.0, 20225.0, 8711.0, 3757.0, 1810.0, 901.0, 462.0, 256.0, 186.0, 113.0, 72.0, 44.0, 28.0, 20.0, 15.0, 11.0, 8.0, 5.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7724609375, -0.7489776611328125, -0.725494384765625, -0.7020111083984375, -0.67852783203125, -0.6550445556640625, -0.631561279296875, -0.6080780029296875, -0.5845947265625, -0.5611114501953125, -0.537628173828125, -0.5141448974609375, -0.49066162109375, -0.4671783447265625, -0.443695068359375, -0.4202117919921875, -0.396728515625, -0.3732452392578125, -0.349761962890625, -0.3262786865234375, -0.30279541015625, -0.2793121337890625, -0.255828857421875, -0.2323455810546875, -0.2088623046875, -0.1853790283203125, -0.161895751953125, -0.1384124755859375, -0.11492919921875, -0.0914459228515625, -0.067962646484375, -0.0444793701171875, -0.02099609375, 0.0024871826171875, 0.025970458984375, 0.0494537353515625, 0.07293701171875, 0.0964202880859375, 0.119903564453125, 0.1433868408203125, 0.1668701171875, 0.1903533935546875, 0.213836669921875, 0.2373199462890625, 0.26080322265625, 0.2842864990234375, 0.307769775390625, 0.3312530517578125, 0.354736328125, 0.3782196044921875, 0.401702880859375, 0.4251861572265625, 0.44866943359375, 0.4721527099609375, 0.495635986328125, 0.5191192626953125, 0.5426025390625, 0.5660858154296875, 0.589569091796875, 0.6130523681640625, 0.63653564453125, 0.6600189208984375, 0.683502197265625, 0.7069854736328125, 0.73046875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 12.0, 10.0, 6.0, 13.0, 16.0, 11.0, 10.0, 22.0, 26.0, 26.0, 40.0, 34.0, 61.0, 47.0, 63.0, 62.0, 62.0, 61.0, 51.0, 72.0, 45.0, 43.0, 40.0, 30.0, 33.0, 33.0, 27.0, 15.0, 2.0, 9.0, 8.0, 5.0, 1.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53564453125, -0.5181808471679688, -0.5007171630859375, -0.48325347900390625, -0.465789794921875, -0.44832611083984375, -0.4308624267578125, -0.41339874267578125, -0.39593505859375, -0.37847137451171875, -0.3610076904296875, -0.34354400634765625, -0.326080322265625, -0.30861663818359375, -0.2911529541015625, -0.27368927001953125, -0.2562255859375, -0.23876190185546875, -0.2212982177734375, -0.20383453369140625, -0.186370849609375, -0.16890716552734375, -0.1514434814453125, -0.13397979736328125, -0.11651611328125, -0.09905242919921875, -0.0815887451171875, -0.06412506103515625, -0.046661376953125, -0.02919769287109375, -0.0117340087890625, 0.00572967529296875, 0.023193359375, 0.04065704345703125, 0.0581207275390625, 0.07558441162109375, 0.093048095703125, 0.11051177978515625, 0.1279754638671875, 0.14543914794921875, 0.16290283203125, 0.18036651611328125, 0.1978302001953125, 0.21529388427734375, 0.232757568359375, 0.25022125244140625, 0.2676849365234375, 0.28514862060546875, 0.3026123046875, 0.32007598876953125, 0.3375396728515625, 0.35500335693359375, 0.372467041015625, 0.38993072509765625, 0.4073944091796875, 0.42485809326171875, 0.44232177734375, 0.45978546142578125, 0.4772491455078125, 0.49471282958984375, 0.512176513671875, 0.5296401977539062, 0.5471038818359375, 0.5645675659179688, 0.58203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 3.0, 2.0, 9.0, 12.0, 9.0, 12.0, 21.0, 14.0, 17.0, 23.0, 29.0, 25.0, 40.0, 35.0, 52.0, 84.0, 169.0, 720.0, 13636.0, 695690.0, 331426.0, 5576.0, 447.0, 138.0, 77.0, 51.0, 43.0, 41.0, 21.0, 27.0, 18.0, 20.0, 17.0, 10.0, 11.0, 4.0, 7.0, 4.0, 4.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.3125, -4.195556640625, -4.07861328125, -3.961669921875, -3.8447265625, -3.727783203125, -3.61083984375, -3.493896484375, -3.376953125, -3.260009765625, -3.14306640625, -3.026123046875, -2.9091796875, -2.792236328125, -2.67529296875, -2.558349609375, -2.44140625, -2.324462890625, -2.20751953125, -2.090576171875, -1.9736328125, -1.856689453125, -1.73974609375, -1.622802734375, -1.505859375, -1.388916015625, -1.27197265625, -1.155029296875, -1.0380859375, -0.921142578125, -0.80419921875, -0.687255859375, -0.5703125, -0.453369140625, -0.33642578125, -0.219482421875, -0.1025390625, 0.014404296875, 0.13134765625, 0.248291015625, 0.365234375, 0.482177734375, 0.59912109375, 0.716064453125, 0.8330078125, 0.949951171875, 1.06689453125, 1.183837890625, 1.30078125, 1.417724609375, 1.53466796875, 1.651611328125, 1.7685546875, 1.885498046875, 2.00244140625, 2.119384765625, 2.236328125, 2.353271484375, 2.47021484375, 2.587158203125, 2.7041015625, 2.821044921875, 2.93798828125, 3.054931640625, 3.171875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 6.0, 7.0, 8.0, 11.0, 9.0, 8.0, 17.0, 14.0, 18.0, 21.0, 25.0, 23.0, 30.0, 30.0, 28.0, 40.0, 41.0, 43.0, 37.0, 41.0, 37.0, 43.0, 51.0, 44.0, 52.0, 40.0, 29.0, 35.0, 21.0, 29.0, 28.0, 23.0, 16.0, 23.0, 14.0, 12.0, 12.0, 3.0, 6.0, 6.0, 4.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0087890625, -0.979278564453125, -0.94976806640625, -0.920257568359375, -0.8907470703125, -0.861236572265625, -0.83172607421875, -0.802215576171875, -0.772705078125, -0.743194580078125, -0.71368408203125, -0.684173583984375, -0.6546630859375, -0.625152587890625, -0.59564208984375, -0.566131591796875, -0.53662109375, -0.507110595703125, -0.47760009765625, -0.448089599609375, -0.4185791015625, -0.389068603515625, -0.35955810546875, -0.330047607421875, -0.300537109375, -0.271026611328125, -0.24151611328125, -0.212005615234375, -0.1824951171875, -0.152984619140625, -0.12347412109375, -0.093963623046875, -0.064453125, -0.034942626953125, -0.00543212890625, 0.024078369140625, 0.0535888671875, 0.083099365234375, 0.11260986328125, 0.142120361328125, 0.171630859375, 0.201141357421875, 0.23065185546875, 0.260162353515625, 0.2896728515625, 0.319183349609375, 0.34869384765625, 0.378204345703125, 0.40771484375, 0.437225341796875, 0.46673583984375, 0.496246337890625, 0.5257568359375, 0.555267333984375, 0.58477783203125, 0.614288330078125, 0.643798828125, 0.673309326171875, 0.70281982421875, 0.732330322265625, 0.7618408203125, 0.791351318359375, 0.82086181640625, 0.850372314453125, 0.8798828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 7.0, 8.0, 8.0, 10.0, 16.0, 30.0, 54.0, 60.0, 79.0, 163.0, 261.0, 380.0, 591.0, 1114.0, 2023.0, 3850.0, 7915.0, 18174.0, 47523.0, 137071.0, 327032.0, 306068.0, 122044.0, 42175.0, 16685.0, 7210.0, 3526.0, 1847.0, 1010.0, 596.0, 364.0, 237.0, 152.0, 88.0, 73.0, 38.0, 29.0, 18.0, 10.0, 8.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3876953125, -0.3759269714355469, -0.36415863037109375, -0.3523902893066406, -0.3406219482421875, -0.3288536071777344, -0.31708526611328125, -0.3053169250488281, -0.293548583984375, -0.2817802429199219, -0.27001190185546875, -0.2582435607910156, -0.2464752197265625, -0.23470687866210938, -0.22293853759765625, -0.21117019653320312, -0.19940185546875, -0.18763351440429688, -0.17586517333984375, -0.16409683227539062, -0.1523284912109375, -0.14056015014648438, -0.12879180908203125, -0.11702346801757812, -0.105255126953125, -0.09348678588867188, -0.08171844482421875, -0.06995010375976562, -0.0581817626953125, -0.046413421630859375, -0.03464508056640625, -0.022876739501953125, -0.0111083984375, 0.000659942626953125, 0.01242828369140625, 0.024196624755859375, 0.0359649658203125, 0.047733306884765625, 0.05950164794921875, 0.07126998901367188, 0.083038330078125, 0.09480667114257812, 0.10657501220703125, 0.11834335327148438, 0.1301116943359375, 0.14188003540039062, 0.15364837646484375, 0.16541671752929688, 0.17718505859375, 0.18895339965820312, 0.20072174072265625, 0.21249008178710938, 0.2242584228515625, 0.23602676391601562, 0.24779510498046875, 0.2595634460449219, 0.271331787109375, 0.2831001281738281, 0.29486846923828125, 0.3066368103027344, 0.3184051513671875, 0.3301734924316406, 0.34194183349609375, 0.3537101745605469, 0.365478515625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 3.0, 7.0, 4.0, 14.0, 14.0, 28.0, 45.0, 84.0, 137.0, 160.0, 159.0, 136.0, 78.0, 58.0, 25.0, 24.0, 13.0, 6.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.628036499023438e-05, -6.340909749269485e-05, -6.0537829995155334e-05, -5.7666562497615814e-05, -5.4795295000076294e-05, -5.1924027502536774e-05, -4.9052760004997253e-05, -4.618149250745773e-05, -4.331022500991821e-05, -4.043895751237869e-05, -3.756769001483917e-05, -3.469642251729965e-05, -3.182515501976013e-05, -2.895388752222061e-05, -2.608262002468109e-05, -2.321135252714157e-05, -2.034008502960205e-05, -1.746881753206253e-05, -1.459755003452301e-05, -1.172628253698349e-05, -8.85501503944397e-06, -5.9837475419044495e-06, -3.112480044364929e-06, -2.4121254682540894e-07, 2.6300549507141113e-06, 5.501322448253632e-06, 8.372589945793152e-06, 1.1243857443332672e-05, 1.4115124940872192e-05, 1.6986392438411713e-05, 1.9857659935951233e-05, 2.2728927433490753e-05, 2.5600194931030273e-05, 2.8471462428569794e-05, 3.1342729926109314e-05, 3.4213997423648834e-05, 3.7085264921188354e-05, 3.9956532418727875e-05, 4.2827799916267395e-05, 4.5699067413806915e-05, 4.8570334911346436e-05, 5.1441602408885956e-05, 5.4312869906425476e-05, 5.7184137403964996e-05, 6.0055404901504517e-05, 6.292667239904404e-05, 6.579793989658356e-05, 6.866920739412308e-05, 7.15404748916626e-05, 7.441174238920212e-05, 7.728300988674164e-05, 8.015427738428116e-05, 8.302554488182068e-05, 8.58968123793602e-05, 8.876807987689972e-05, 9.163934737443924e-05, 9.451061487197876e-05, 9.738188236951828e-05, 0.0001002531498670578, 0.00010312441736459732, 0.00010599568486213684, 0.00010886695235967636, 0.00011173821985721588, 0.0001146094873547554, 0.00011748075485229492]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 4.0, 6.0, 4.0, 7.0, 7.0, 7.0, 4.0, 8.0, 19.0, 16.0, 16.0, 20.0, 27.0, 41.0, 45.0, 77.0, 194.0, 772.0, 5754.0, 74240.0, 687016.0, 260784.0, 16966.0, 1844.0, 314.0, 98.0, 60.0, 47.0, 25.0, 32.0, 15.0, 25.0, 15.0, 14.0, 6.0, 8.0, 3.0, 6.0, 2.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.931640625, -0.9055633544921875, -0.879486083984375, -0.8534088134765625, -0.82733154296875, -0.8012542724609375, -0.775177001953125, -0.7490997314453125, -0.7230224609375, -0.6969451904296875, -0.670867919921875, -0.6447906494140625, -0.61871337890625, -0.5926361083984375, -0.566558837890625, -0.5404815673828125, -0.514404296875, -0.4883270263671875, -0.462249755859375, -0.4361724853515625, -0.41009521484375, -0.3840179443359375, -0.357940673828125, -0.3318634033203125, -0.3057861328125, -0.2797088623046875, -0.253631591796875, -0.2275543212890625, -0.20147705078125, -0.1753997802734375, -0.149322509765625, -0.1232452392578125, -0.09716796875, -0.0710906982421875, -0.045013427734375, -0.0189361572265625, 0.00714111328125, 0.0332183837890625, 0.059295654296875, 0.0853729248046875, 0.1114501953125, 0.1375274658203125, 0.163604736328125, 0.1896820068359375, 0.21575927734375, 0.2418365478515625, 0.267913818359375, 0.2939910888671875, 0.320068359375, 0.3461456298828125, 0.372222900390625, 0.3983001708984375, 0.42437744140625, 0.4504547119140625, 0.476531982421875, 0.5026092529296875, 0.5286865234375, 0.5547637939453125, 0.580841064453125, 0.6069183349609375, 0.63299560546875, 0.6590728759765625, 0.685150146484375, 0.7112274169921875, 0.7373046875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 5.0, 5.0, 5.0, 5.0, 8.0, 11.0, 10.0, 16.0, 17.0, 24.0, 19.0, 18.0, 36.0, 35.0, 45.0, 46.0, 53.0, 56.0, 61.0, 49.0, 54.0, 42.0, 59.0, 39.0, 51.0, 28.0, 28.0, 28.0, 27.0, 25.0, 21.0, 17.0, 13.0, 6.0, 7.0, 7.0, 4.0, 6.0, 2.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.19580078125, -0.1898212432861328, -0.18384170532226562, -0.17786216735839844, -0.17188262939453125, -0.16590309143066406, -0.15992355346679688, -0.1539440155029297, -0.1479644775390625, -0.1419849395751953, -0.13600540161132812, -0.13002586364746094, -0.12404632568359375, -0.11806678771972656, -0.11208724975585938, -0.10610771179199219, -0.100128173828125, -0.09414863586425781, -0.08816909790039062, -0.08218955993652344, -0.07621002197265625, -0.07023048400878906, -0.06425094604492188, -0.05827140808105469, -0.0522918701171875, -0.04631233215332031, -0.040332794189453125, -0.03435325622558594, -0.02837371826171875, -0.022394180297851562, -0.016414642333984375, -0.010435104370117188, -0.00445556640625, 0.0015239715576171875, 0.007503509521484375, 0.013483047485351562, 0.01946258544921875, 0.025442123413085938, 0.031421661376953125, 0.03740119934082031, 0.0433807373046875, 0.04936027526855469, 0.055339813232421875, 0.06131935119628906, 0.06729888916015625, 0.07327842712402344, 0.07925796508789062, 0.08523750305175781, 0.091217041015625, 0.09719657897949219, 0.10317611694335938, 0.10915565490722656, 0.11513519287109375, 0.12111473083496094, 0.12709426879882812, 0.1330738067626953, 0.1390533447265625, 0.1450328826904297, 0.15101242065429688, 0.15699195861816406, 0.16297149658203125, 0.16895103454589844, 0.17493057250976562, 0.1809101104736328, 0.1868896484375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [4.0, 3.0, 11.0, 230.0, 646.0, 112.0, 14.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3628416061401367, -1.8222951889038086, -1.28174889087677, -0.7412025928497314, -0.20065617561340332, 0.3398902416229248, 0.8804364204406738, 1.420982837677002, 1.96152925491333, 2.502075672149658, 3.0426220893859863, 3.5831682682037354, 4.123714447021484, 4.6642608642578125, 5.204807281494141, 5.745353698730469, 6.285900115966797, 6.826446533203125, 7.366992950439453, 7.907539367675781, 8.44808578491211, 8.988632202148438, 9.529178619384766, 10.069725036621094, 10.610271453857422, 11.15081787109375, 11.691364288330078, 12.231910705566406, 12.772457122802734, 13.313003540039062, 13.85354995727539, 14.394096374511719, 14.934640884399414, 15.475187301635742, 16.01573371887207, 16.5562801361084, 17.096826553344727, 17.637372970581055, 18.177919387817383, 18.71846580505371, 19.25901222229004, 19.799558639526367, 20.340105056762695, 20.880651473999023, 21.42119789123535, 21.96174430847168, 22.502290725708008, 23.042837142944336, 23.58338165283203, 24.12392807006836, 24.664474487304688, 25.205020904541016, 25.745567321777344, 26.286113739013672, 26.82666015625, 27.367206573486328, 27.907752990722656, 28.448299407958984, 28.988845825195312, 29.52939224243164, 30.06993865966797, 30.610485076904297, 31.151031494140625, 31.691577911376953, 32.23212432861328]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 7.0, 3.0, 8.0, 6.0, 4.0, 12.0, 13.0, 14.0, 18.0, 19.0, 26.0, 28.0, 36.0, 35.0, 33.0, 47.0, 43.0, 53.0, 50.0, 55.0, 59.0, 46.0, 55.0, 40.0, 33.0, 35.0, 36.0, 24.0, 22.0, 19.0, 29.0, 27.0, 15.0, 9.0, 13.0, 5.0, 8.0, 7.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.4141740798950195, -3.3004465103149414, -3.186718702316284, -3.072991132736206, -2.959263563156128, -2.8455357551574707, -2.7318081855773926, -2.6180806159973145, -2.5043530464172363, -2.390625476837158, -2.276897668838501, -2.163170099258423, -2.0494425296783447, -1.935714840888977, -1.8219871520996094, -1.7082595825195312, -1.594531774520874, -1.4808040857315063, -1.3670765161514282, -1.2533488273620605, -1.1396212577819824, -1.0258935689926147, -0.9121658802032471, -0.7984382510185242, -0.6847106218338013, -0.5709829926490784, -0.4572553336620331, -0.3435276746749878, -0.2298000454902649, -0.11607241630554199, -0.0023447275161743164, 0.11138290166854858, 0.22511053085327148, 0.3388381600379944, 0.4525658190250397, 0.566293478012085, 0.6800211071968079, 0.7937487363815308, 0.9074764251708984, 1.0212039947509766, 1.1349316835403442, 1.248659372329712, 1.36238694190979, 1.4761146306991577, 1.5898423194885254, 1.7035698890686035, 1.8172975778579712, 1.9310252666473389, 2.044752836227417, 2.158480405807495, 2.2722082138061523, 2.3859357833862305, 2.4996633529663086, 2.6133909225463867, 2.727118730545044, 2.840846300125122, 2.9545741081237793, 3.0683016777038574, 3.1820294857025146, 3.2957570552825928, 3.409484624862671, 3.523212432861328, 3.6369400024414062, 3.7506675720214844, 3.8643951416015625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 8.0, 4.0, 6.0, 10.0, 19.0, 19.0, 28.0, 34.0, 37.0, 48.0, 69.0, 128.0, 182.0, 275.0, 543.0, 1247.0, 3681.0, 13958.0, 78366.0, 784945.0, 2849943.0, 398263.0, 47930.0, 9497.0, 2737.0, 1040.0, 474.0, 279.0, 150.0, 107.0, 59.0, 55.0, 31.0, 28.0, 18.0, 17.0, 18.0, 5.0, 7.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-1.50390625, -1.4613800048828125, -1.418853759765625, -1.3763275146484375, -1.33380126953125, -1.2912750244140625, -1.248748779296875, -1.2062225341796875, -1.1636962890625, -1.1211700439453125, -1.078643798828125, -1.0361175537109375, -0.99359130859375, -0.9510650634765625, -0.908538818359375, -0.8660125732421875, -0.823486328125, -0.7809600830078125, -0.738433837890625, -0.6959075927734375, -0.65338134765625, -0.6108551025390625, -0.568328857421875, -0.5258026123046875, -0.4832763671875, -0.4407501220703125, -0.398223876953125, -0.3556976318359375, -0.31317138671875, -0.2706451416015625, -0.228118896484375, -0.1855926513671875, -0.14306640625, -0.1005401611328125, -0.058013916015625, -0.0154876708984375, 0.02703857421875, 0.0695648193359375, 0.112091064453125, 0.1546173095703125, 0.1971435546875, 0.2396697998046875, 0.282196044921875, 0.3247222900390625, 0.36724853515625, 0.4097747802734375, 0.452301025390625, 0.4948272705078125, 0.537353515625, 0.5798797607421875, 0.622406005859375, 0.6649322509765625, 0.70745849609375, 0.7499847412109375, 0.792510986328125, 0.8350372314453125, 0.8775634765625, 0.9200897216796875, 0.962615966796875, 1.0051422119140625, 1.04766845703125, 1.0901947021484375, 1.132720947265625, 1.1752471923828125, 1.2177734375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 10.0, 5.0, 7.0, 12.0, 13.0, 16.0, 18.0, 13.0, 24.0, 40.0, 31.0, 37.0, 52.0, 45.0, 50.0, 67.0, 58.0, 63.0, 72.0, 48.0, 50.0, 47.0, 48.0, 32.0, 32.0, 22.0, 28.0, 10.0, 16.0, 5.0, 12.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.59228515625, -0.5752716064453125, -0.558258056640625, -0.5412445068359375, -0.52423095703125, -0.5072174072265625, -0.490203857421875, -0.4731903076171875, -0.4561767578125, -0.4391632080078125, -0.422149658203125, -0.4051361083984375, -0.38812255859375, -0.3711090087890625, -0.354095458984375, -0.3370819091796875, -0.320068359375, -0.3030548095703125, -0.286041259765625, -0.2690277099609375, -0.25201416015625, -0.2350006103515625, -0.217987060546875, -0.2009735107421875, -0.1839599609375, -0.1669464111328125, -0.149932861328125, -0.1329193115234375, -0.11590576171875, -0.0988922119140625, -0.081878662109375, -0.0648651123046875, -0.0478515625, -0.0308380126953125, -0.013824462890625, 0.0031890869140625, 0.02020263671875, 0.0372161865234375, 0.054229736328125, 0.0712432861328125, 0.0882568359375, 0.1052703857421875, 0.122283935546875, 0.1392974853515625, 0.15631103515625, 0.1733245849609375, 0.190338134765625, 0.2073516845703125, 0.224365234375, 0.2413787841796875, 0.258392333984375, 0.2754058837890625, 0.29241943359375, 0.3094329833984375, 0.326446533203125, 0.3434600830078125, 0.3604736328125, 0.3774871826171875, 0.394500732421875, 0.4115142822265625, 0.42852783203125, 0.4455413818359375, 0.462554931640625, 0.4795684814453125, 0.49658203125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 11.0, 5.0, 8.0, 9.0, 16.0, 36.0, 57.0, 77.0, 142.0, 411.0, 1193.0, 4798.0, 24354.0, 150317.0, 907564.0, 2258057.0, 709063.0, 113977.0, 18828.0, 3711.0, 1000.0, 315.0, 139.0, 71.0, 41.0, 30.0, 14.0, 16.0, 9.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.517578125, -1.4734954833984375, -1.429412841796875, -1.3853302001953125, -1.34124755859375, -1.2971649169921875, -1.253082275390625, -1.2089996337890625, -1.1649169921875, -1.1208343505859375, -1.076751708984375, -1.0326690673828125, -0.98858642578125, -0.9445037841796875, -0.900421142578125, -0.8563385009765625, -0.812255859375, -0.7681732177734375, -0.724090576171875, -0.6800079345703125, -0.63592529296875, -0.5918426513671875, -0.547760009765625, -0.5036773681640625, -0.4595947265625, -0.4155120849609375, -0.371429443359375, -0.3273468017578125, -0.28326416015625, -0.2391815185546875, -0.195098876953125, -0.1510162353515625, -0.10693359375, -0.0628509521484375, -0.018768310546875, 0.0253143310546875, 0.06939697265625, 0.1134796142578125, 0.157562255859375, 0.2016448974609375, 0.2457275390625, 0.2898101806640625, 0.333892822265625, 0.3779754638671875, 0.42205810546875, 0.4661407470703125, 0.510223388671875, 0.5543060302734375, 0.598388671875, 0.6424713134765625, 0.686553955078125, 0.7306365966796875, 0.77471923828125, 0.8188018798828125, 0.862884521484375, 0.9069671630859375, 0.9510498046875, 0.9951324462890625, 1.039215087890625, 1.0832977294921875, 1.12738037109375, 1.1714630126953125, 1.215545654296875, 1.2596282958984375, 1.3037109375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 5.0, 6.0, 8.0, 5.0, 12.0, 14.0, 16.0, 17.0, 25.0, 31.0, 37.0, 54.0, 79.0, 89.0, 117.0, 160.0, 197.0, 253.0, 307.0, 315.0, 381.0, 366.0, 326.0, 234.0, 222.0, 183.0, 148.0, 109.0, 81.0, 67.0, 45.0, 56.0, 23.0, 16.0, 20.0, 19.0, 16.0, 8.0, 8.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5029296875, -0.48484039306640625, -0.4667510986328125, -0.44866180419921875, -0.430572509765625, -0.41248321533203125, -0.3943939208984375, -0.37630462646484375, -0.35821533203125, -0.34012603759765625, -0.3220367431640625, -0.30394744873046875, -0.285858154296875, -0.26776885986328125, -0.2496795654296875, -0.23159027099609375, -0.2135009765625, -0.19541168212890625, -0.1773223876953125, -0.15923309326171875, -0.141143798828125, -0.12305450439453125, -0.1049652099609375, -0.08687591552734375, -0.06878662109375, -0.05069732666015625, -0.0326080322265625, -0.01451873779296875, 0.003570556640625, 0.02165985107421875, 0.0397491455078125, 0.05783843994140625, 0.075927734375, 0.09401702880859375, 0.1121063232421875, 0.13019561767578125, 0.148284912109375, 0.16637420654296875, 0.1844635009765625, 0.20255279541015625, 0.22064208984375, 0.23873138427734375, 0.2568206787109375, 0.27490997314453125, 0.292999267578125, 0.31108856201171875, 0.3291778564453125, 0.34726715087890625, 0.3653564453125, 0.38344573974609375, 0.4015350341796875, 0.41962432861328125, 0.437713623046875, 0.45580291748046875, 0.4738922119140625, 0.49198150634765625, 0.51007080078125, 0.5281600952148438, 0.5462493896484375, 0.5643386840820312, 0.582427978515625, 0.6005172729492188, 0.6186065673828125, 0.6366958618164062, 0.65478515625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 5.0, 6.0, 17.0, 20.0, 27.0, 64.0, 69.0, 127.0, 146.0, 138.0, 147.0, 81.0, 69.0, 36.0, 19.0, 19.0, 7.0, 7.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4545135498046875, -3.3234996795654297, -3.192485809326172, -3.061472177505493, -2.9304583072662354, -2.7994444370269775, -2.668430805206299, -2.537416934967041, -2.406403064727783, -2.2753891944885254, -2.1443753242492676, -2.013361692428589, -1.882347822189331, -1.7513339519500732, -1.620320200920105, -1.4893064498901367, -1.358292579650879, -1.227278709411621, -1.0962649583816528, -0.9652511477470398, -0.8342373371124268, -0.7032235264778137, -0.5722097158432007, -0.44119590520858765, -0.3101820945739746, -0.17916828393936157, -0.048154473304748535, 0.0828593373298645, 0.21387314796447754, 0.3448869585990906, 0.4759007692337036, 0.6069145798683167, 0.7379279136657715, 0.8689417243003845, 0.9999555349349976, 1.1309692859649658, 1.2619831562042236, 1.3929970264434814, 1.5240107774734497, 1.655024528503418, 1.7860383987426758, 1.9170522689819336, 2.0480661392211914, 2.17907977104187, 2.310093641281128, 2.4411075115203857, 2.5721211433410645, 2.7031350135803223, 2.83414888381958, 2.965162754058838, 3.0961766242980957, 3.2271902561187744, 3.3582041263580322, 3.48921799659729, 3.6202316284179688, 3.7512454986572266, 3.8822593688964844, 4.013273239135742, 4.144287109375, 4.275300979614258, 4.406314849853516, 4.537328243255615, 4.668342113494873, 4.799355983734131, 4.930369853973389]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 6.0, 8.0, 5.0, 7.0, 18.0, 18.0, 22.0, 24.0, 24.0, 40.0, 33.0, 36.0, 32.0, 42.0, 44.0, 58.0, 49.0, 60.0, 43.0, 50.0, 40.0, 46.0, 37.0, 34.0, 29.0, 46.0, 39.0, 17.0, 22.0, 8.0, 14.0, 14.0, 2.0, 8.0, 8.0, 2.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2550594806671143, -2.176494598388672, -2.0979294776916504, -2.019364595413208, -1.9407997131347656, -1.8622347116470337, -1.7836697101593018, -1.7051048278808594, -1.6265398263931274, -1.5479748249053955, -1.4694099426269531, -1.3908449411392212, -1.3122799396514893, -1.2337150573730469, -1.155150055885315, -1.076585054397583, -0.9980201721191406, -0.9194552302360535, -0.8408902883529663, -0.7623252868652344, -0.6837603449821472, -0.6051954030990601, -0.5266304016113281, -0.44806545972824097, -0.3695005178451538, -0.29093557596206665, -0.2123706042766571, -0.13380564749240875, -0.0552406907081604, 0.023324251174926758, 0.1018892228603363, 0.18045419454574585, 0.2590193748474121, 0.33758431673049927, 0.4161492884159088, 0.49471426010131836, 0.5732792019844055, 0.6518441438674927, 0.7304091453552246, 0.8089740872383118, 0.8875390291213989, 0.9661039710044861, 1.0446689128875732, 1.1232339143753052, 1.201798915863037, 1.2803637981414795, 1.3589287996292114, 1.4374938011169434, 1.5160586833953857, 1.5946236848831177, 1.67318856716156, 1.751753568649292, 1.8303184509277344, 1.9088834524154663, 1.9874484539031982, 2.0660133361816406, 2.144578456878662, 2.2231433391571045, 2.301708459854126, 2.3802733421325684, 2.4588382244110107, 2.537403106689453, 2.6159682273864746, 2.694533109664917, 2.7730979919433594]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 6.0, 9.0, 7.0, 26.0, 26.0, 41.0, 79.0, 122.0, 219.0, 379.0, 588.0, 1035.0, 1655.0, 2762.0, 4584.0, 7968.0, 16194.0, 37581.0, 102821.0, 256109.0, 329401.0, 172315.0, 63550.0, 24589.0, 11301.0, 6185.0, 3537.0, 2149.0, 1262.0, 798.0, 519.0, 277.0, 164.0, 102.0, 73.0, 35.0, 23.0, 15.0, 11.0, 13.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1396484375, -1.1043243408203125, -1.069000244140625, -1.0336761474609375, -0.99835205078125, -0.9630279541015625, -0.927703857421875, -0.8923797607421875, -0.8570556640625, -0.8217315673828125, -0.786407470703125, -0.7510833740234375, -0.71575927734375, -0.6804351806640625, -0.645111083984375, -0.6097869873046875, -0.574462890625, -0.5391387939453125, -0.503814697265625, -0.4684906005859375, -0.43316650390625, -0.3978424072265625, -0.362518310546875, -0.3271942138671875, -0.2918701171875, -0.2565460205078125, -0.221221923828125, -0.1858978271484375, -0.15057373046875, -0.1152496337890625, -0.079925537109375, -0.0446014404296875, -0.00927734375, 0.0260467529296875, 0.061370849609375, 0.0966949462890625, 0.13201904296875, 0.1673431396484375, 0.202667236328125, 0.2379913330078125, 0.2733154296875, 0.3086395263671875, 0.343963623046875, 0.3792877197265625, 0.41461181640625, 0.4499359130859375, 0.485260009765625, 0.5205841064453125, 0.555908203125, 0.5912322998046875, 0.626556396484375, 0.6618804931640625, 0.69720458984375, 0.7325286865234375, 0.767852783203125, 0.8031768798828125, 0.8385009765625, 0.8738250732421875, 0.909149169921875, 0.9444732666015625, 0.97979736328125, 1.0151214599609375, 1.050445556640625, 1.0857696533203125, 1.12109375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 9.0, 3.0, 5.0, 17.0, 8.0, 9.0, 12.0, 14.0, 31.0, 27.0, 29.0, 23.0, 43.0, 40.0, 51.0, 65.0, 70.0, 68.0, 50.0, 69.0, 46.0, 53.0, 44.0, 35.0, 34.0, 32.0, 15.0, 26.0, 17.0, 15.0, 15.0, 8.0, 5.0, 8.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.591796875, -0.5757026672363281, -0.5596084594726562, -0.5435142517089844, -0.5274200439453125, -0.5113258361816406, -0.49523162841796875, -0.4791374206542969, -0.463043212890625, -0.4469490051269531, -0.43085479736328125, -0.4147605895996094, -0.3986663818359375, -0.3825721740722656, -0.36647796630859375, -0.3503837585449219, -0.33428955078125, -0.3181953430175781, -0.30210113525390625, -0.2860069274902344, -0.2699127197265625, -0.2538185119628906, -0.23772430419921875, -0.22163009643554688, -0.205535888671875, -0.18944168090820312, -0.17334747314453125, -0.15725326538085938, -0.1411590576171875, -0.12506484985351562, -0.10897064208984375, -0.09287643432617188, -0.0767822265625, -0.060688018798828125, -0.04459381103515625, -0.028499603271484375, -0.0124053955078125, 0.003688812255859375, 0.01978302001953125, 0.035877227783203125, 0.051971435546875, 0.06806564331054688, 0.08415985107421875, 0.10025405883789062, 0.1163482666015625, 0.13244247436523438, 0.14853668212890625, 0.16463088989257812, 0.18072509765625, 0.19681930541992188, 0.21291351318359375, 0.22900772094726562, 0.2451019287109375, 0.2611961364746094, 0.27729034423828125, 0.2933845520019531, 0.309478759765625, 0.3255729675292969, 0.34166717529296875, 0.3577613830566406, 0.3738555908203125, 0.3899497985839844, 0.40604400634765625, 0.4221382141113281, 0.438232421875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 9.0, 4.0, 11.0, 21.0, 17.0, 22.0, 42.0, 44.0, 78.0, 130.0, 283.0, 683.0, 1661.0, 4195.0, 10496.0, 29856.0, 123617.0, 445373.0, 325830.0, 72675.0, 20523.0, 7813.0, 2964.0, 1139.0, 505.0, 219.0, 113.0, 79.0, 40.0, 33.0, 20.0, 14.0, 18.0, 11.0, 5.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.45703125, -1.406494140625, -1.35595703125, -1.305419921875, -1.2548828125, -1.204345703125, -1.15380859375, -1.103271484375, -1.052734375, -1.002197265625, -0.95166015625, -0.901123046875, -0.8505859375, -0.800048828125, -0.74951171875, -0.698974609375, -0.6484375, -0.597900390625, -0.54736328125, -0.496826171875, -0.4462890625, -0.395751953125, -0.34521484375, -0.294677734375, -0.244140625, -0.193603515625, -0.14306640625, -0.092529296875, -0.0419921875, 0.008544921875, 0.05908203125, 0.109619140625, 0.16015625, 0.210693359375, 0.26123046875, 0.311767578125, 0.3623046875, 0.412841796875, 0.46337890625, 0.513916015625, 0.564453125, 0.614990234375, 0.66552734375, 0.716064453125, 0.7666015625, 0.817138671875, 0.86767578125, 0.918212890625, 0.96875, 1.019287109375, 1.06982421875, 1.120361328125, 1.1708984375, 1.221435546875, 1.27197265625, 1.322509765625, 1.373046875, 1.423583984375, 1.47412109375, 1.524658203125, 1.5751953125, 1.625732421875, 1.67626953125, 1.726806640625, 1.77734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 9.0, 3.0, 7.0, 11.0, 15.0, 24.0, 16.0, 25.0, 25.0, 26.0, 43.0, 51.0, 38.0, 46.0, 50.0, 55.0, 49.0, 60.0, 58.0, 48.0, 36.0, 48.0, 36.0, 38.0, 43.0, 21.0, 18.0, 15.0, 13.0, 9.0, 14.0, 16.0, 7.0, 5.0, 3.0, 6.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.017578125, -0.9846954345703125, -0.951812744140625, -0.9189300537109375, -0.88604736328125, -0.8531646728515625, -0.820281982421875, -0.7873992919921875, -0.7545166015625, -0.7216339111328125, -0.688751220703125, -0.6558685302734375, -0.62298583984375, -0.5901031494140625, -0.557220458984375, -0.5243377685546875, -0.491455078125, -0.4585723876953125, -0.425689697265625, -0.3928070068359375, -0.35992431640625, -0.3270416259765625, -0.294158935546875, -0.2612762451171875, -0.2283935546875, -0.1955108642578125, -0.162628173828125, -0.1297454833984375, -0.09686279296875, -0.0639801025390625, -0.031097412109375, 0.0017852783203125, 0.03466796875, 0.0675506591796875, 0.100433349609375, 0.1333160400390625, 0.16619873046875, 0.1990814208984375, 0.231964111328125, 0.2648468017578125, 0.2977294921875, 0.3306121826171875, 0.363494873046875, 0.3963775634765625, 0.42926025390625, 0.4621429443359375, 0.495025634765625, 0.5279083251953125, 0.560791015625, 0.5936737060546875, 0.626556396484375, 0.6594390869140625, 0.69232177734375, 0.7252044677734375, 0.758087158203125, 0.7909698486328125, 0.8238525390625, 0.8567352294921875, 0.889617919921875, 0.9225006103515625, 0.95538330078125, 0.9882659912109375, 1.021148681640625, 1.0540313720703125, 1.0869140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 12.0, 12.0, 23.0, 27.0, 38.0, 60.0, 78.0, 111.0, 144.0, 201.0, 272.0, 378.0, 570.0, 789.0, 1333.0, 2433.0, 5337.0, 14745.0, 78173.0, 578115.0, 312241.0, 34996.0, 9346.0, 3786.0, 1901.0, 1108.0, 678.0, 448.0, 325.0, 243.0, 158.0, 117.0, 87.0, 68.0, 55.0, 35.0, 25.0, 12.0, 20.0, 17.0, 9.0, 7.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.3876953125, -1.34405517578125, -1.3004150390625, -1.25677490234375, -1.213134765625, -1.16949462890625, -1.1258544921875, -1.08221435546875, -1.03857421875, -0.99493408203125, -0.9512939453125, -0.90765380859375, -0.864013671875, -0.82037353515625, -0.7767333984375, -0.73309326171875, -0.689453125, -0.64581298828125, -0.6021728515625, -0.55853271484375, -0.514892578125, -0.47125244140625, -0.4276123046875, -0.38397216796875, -0.34033203125, -0.29669189453125, -0.2530517578125, -0.20941162109375, -0.165771484375, -0.12213134765625, -0.0784912109375, -0.03485107421875, 0.0087890625, 0.05242919921875, 0.0960693359375, 0.13970947265625, 0.183349609375, 0.22698974609375, 0.2706298828125, 0.31427001953125, 0.35791015625, 0.40155029296875, 0.4451904296875, 0.48883056640625, 0.532470703125, 0.57611083984375, 0.6197509765625, 0.66339111328125, 0.70703125, 0.75067138671875, 0.7943115234375, 0.83795166015625, 0.881591796875, 0.92523193359375, 0.9688720703125, 1.01251220703125, 1.05615234375, 1.09979248046875, 1.1434326171875, 1.18707275390625, 1.230712890625, 1.27435302734375, 1.3179931640625, 1.36163330078125, 1.4052734375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 5.0, 6.0, 10.0, 9.0, 10.0, 25.0, 72.0, 149.0, 222.0, 225.0, 133.0, 61.0, 21.0, 16.0, 3.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00017690658569335938, -0.00017169490456581116, -0.00016648322343826294, -0.00016127154231071472, -0.0001560598611831665, -0.00015084818005561829, -0.00014563649892807007, -0.00014042481780052185, -0.00013521313667297363, -0.00013000145554542542, -0.0001247897744178772, -0.00011957809329032898, -0.00011436641216278076, -0.00010915473103523254, -0.00010394304990768433, -9.873136878013611e-05, -9.351968765258789e-05, -8.830800652503967e-05, -8.309632539749146e-05, -7.788464426994324e-05, -7.267296314239502e-05, -6.74612820148468e-05, -6.224960088729858e-05, -5.7037919759750366e-05, -5.182623863220215e-05, -4.661455750465393e-05, -4.140287637710571e-05, -3.6191195249557495e-05, -3.097951412200928e-05, -2.576783299446106e-05, -2.0556151866912842e-05, -1.5344470739364624e-05, -1.0132789611816406e-05, -4.9211084842681885e-06, 2.905726432800293e-07, 5.502253770828247e-06, 1.0713934898376465e-05, 1.5925616025924683e-05, 2.11372971534729e-05, 2.6348978281021118e-05, 3.1560659408569336e-05, 3.6772340536117554e-05, 4.198402166366577e-05, 4.719570279121399e-05, 5.240738391876221e-05, 5.7619065046310425e-05, 6.283074617385864e-05, 6.804242730140686e-05, 7.325410842895508e-05, 7.84657895565033e-05, 8.367747068405151e-05, 8.888915181159973e-05, 9.410083293914795e-05, 9.931251406669617e-05, 0.00010452419519424438, 0.0001097358763217926, 0.00011494755744934082, 0.00012015923857688904, 0.00012537091970443726, 0.00013058260083198547, 0.0001357942819595337, 0.0001410059630870819, 0.00014621764421463013, 0.00015142932534217834, 0.00015664100646972656]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 6.0, 9.0, 11.0, 34.0, 50.0, 79.0, 146.0, 259.0, 482.0, 1054.0, 2533.0, 6130.0, 19120.0, 72321.0, 253834.0, 405162.0, 207331.0, 55474.0, 15246.0, 5204.0, 2054.0, 940.0, 473.0, 237.0, 152.0, 70.0, 39.0, 33.0, 18.0, 8.0, 10.0, 10.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7138671875, -0.6924972534179688, -0.6711273193359375, -0.6497573852539062, -0.628387451171875, -0.6070175170898438, -0.5856475830078125, -0.5642776489257812, -0.54290771484375, -0.5215377807617188, -0.5001678466796875, -0.47879791259765625, -0.457427978515625, -0.43605804443359375, -0.4146881103515625, -0.39331817626953125, -0.3719482421875, -0.35057830810546875, -0.3292083740234375, -0.30783843994140625, -0.286468505859375, -0.26509857177734375, -0.2437286376953125, -0.22235870361328125, -0.20098876953125, -0.17961883544921875, -0.1582489013671875, -0.13687896728515625, -0.115509033203125, -0.09413909912109375, -0.0727691650390625, -0.05139923095703125, -0.030029296875, -0.00865936279296875, 0.0127105712890625, 0.03408050537109375, 0.055450439453125, 0.07682037353515625, 0.0981903076171875, 0.11956024169921875, 0.14093017578125, 0.16230010986328125, 0.1836700439453125, 0.20503997802734375, 0.226409912109375, 0.24777984619140625, 0.2691497802734375, 0.29051971435546875, 0.3118896484375, 0.33325958251953125, 0.3546295166015625, 0.37599945068359375, 0.397369384765625, 0.41873931884765625, 0.4401092529296875, 0.46147918701171875, 0.48284912109375, 0.5042190551757812, 0.5255889892578125, 0.5469589233398438, 0.568328857421875, 0.5896987915039062, 0.6110687255859375, 0.6324386596679688, 0.65380859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 5.0, 11.0, 12.0, 22.0, 38.0, 40.0, 47.0, 50.0, 55.0, 74.0, 73.0, 65.0, 68.0, 71.0, 67.0, 62.0, 63.0, 34.0, 32.0, 20.0, 14.0, 11.0, 16.0, 6.0, 7.0, 7.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4130859375, -0.4018440246582031, -0.39060211181640625, -0.3793601989746094, -0.3681182861328125, -0.3568763732910156, -0.34563446044921875, -0.3343925476074219, -0.323150634765625, -0.3119087219238281, -0.30066680908203125, -0.2894248962402344, -0.2781829833984375, -0.2669410705566406, -0.25569915771484375, -0.24445724487304688, -0.23321533203125, -0.22197341918945312, -0.21073150634765625, -0.19948959350585938, -0.1882476806640625, -0.17700576782226562, -0.16576385498046875, -0.15452194213867188, -0.143280029296875, -0.13203811645507812, -0.12079620361328125, -0.10955429077148438, -0.0983123779296875, -0.08707046508789062, -0.07582855224609375, -0.06458663940429688, -0.0533447265625, -0.042102813720703125, -0.03086090087890625, -0.019618988037109375, -0.0083770751953125, 0.002864837646484375, 0.01410675048828125, 0.025348663330078125, 0.036590576171875, 0.047832489013671875, 0.05907440185546875, 0.07031631469726562, 0.0815582275390625, 0.09280014038085938, 0.10404205322265625, 0.11528396606445312, 0.12652587890625, 0.13776779174804688, 0.14900970458984375, 0.16025161743164062, 0.1714935302734375, 0.18273544311523438, 0.19397735595703125, 0.20521926879882812, 0.216461181640625, 0.22770309448242188, 0.23894500732421875, 0.2501869201660156, 0.2614288330078125, 0.2726707458496094, 0.28391265869140625, 0.2951545715332031, 0.306396484375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 9.0, 11.0, 36.0, 78.0, 134.0, 196.0, 188.0, 153.0, 96.0, 51.0, 30.0, 14.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9286298751831055, -1.7383207082748413, -1.5480115413665771, -1.3577024936676025, -1.1673933267593384, -0.9770841598510742, -0.7867751121520996, -0.5964659452438354, -0.4061567783355713, -0.21584764122962952, -0.025538504123687744, 0.16477060317993164, 0.3550797700881958, 0.54538893699646, 0.7356979846954346, 0.9260071516036987, 1.116316318511963, 1.306625485420227, 1.4969346523284912, 1.6872437000274658, 1.87755286693573, 2.067862033843994, 2.2581710815429688, 2.4484801292419434, 2.638789415359497, 2.8290984630584717, 3.0194077491760254, 3.209716796875, 3.4000258445739746, 3.5903351306915283, 3.780644178390503, 3.9709534645080566, 4.161262512207031, 4.351571559906006, 4.5418806076049805, 4.732190132141113, 4.922499179840088, 5.1128082275390625, 5.303117275238037, 5.493426322937012, 5.6837358474731445, 5.874044895172119, 6.064353942871094, 6.254663467407227, 6.444972515106201, 6.635281562805176, 6.82559061050415, 7.015899658203125, 7.2062087059021, 7.396517753601074, 7.586826801300049, 7.777135848999023, 7.967445373535156, 8.157754898071289, 8.348063468933105, 8.538372993469238, 8.728681564331055, 8.918991088867188, 9.109299659729004, 9.299609184265137, 9.489917755126953, 9.680227279663086, 9.870536804199219, 10.060845375061035, 10.251154899597168]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 11.0, 4.0, 10.0, 9.0, 10.0, 17.0, 7.0, 14.0, 17.0, 20.0, 23.0, 28.0, 32.0, 37.0, 26.0, 26.0, 38.0, 29.0, 38.0, 47.0, 51.0, 40.0, 35.0, 45.0, 51.0, 30.0, 31.0, 41.0, 25.0, 30.0, 26.0, 24.0, 28.0, 15.0, 14.0, 21.0, 9.0, 8.0, 7.0, 3.0, 4.0, 4.0, 3.0, 6.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.508599042892456, -2.4320833683013916, -2.3555679321289062, -2.279052257537842, -2.2025368213653564, -2.126021146774292, -2.0495057106018066, -1.9729900360107422, -1.8964744806289673, -1.8199589252471924, -1.7434433698654175, -1.6669278144836426, -1.5904121398925781, -1.5138967037200928, -1.4373810291290283, -1.3608654737472534, -1.2843499183654785, -1.2078343629837036, -1.1313188076019287, -1.0548032522201538, -0.9782876372337341, -0.9017720818519592, -0.8252564668655396, -0.7487409114837646, -0.6722253561019897, -0.5957098007202148, -0.5191942453384399, -0.44267863035202026, -0.36616307497024536, -0.28964751958847046, -0.21313193440437317, -0.13661634922027588, -0.060100555419921875, 0.01641501486301422, 0.09293058514595032, 0.1694461554288864, 0.2459617257118225, 0.3224772810935974, 0.3989928662776947, 0.475508451461792, 0.5520240068435669, 0.6285395622253418, 0.7050551176071167, 0.7815707325935364, 0.8580862879753113, 0.9346018433570862, 1.0111174583435059, 1.0876330137252808, 1.1641485691070557, 1.2406641244888306, 1.3171796798706055, 1.3936952352523804, 1.4702107906341553, 1.5467264652252197, 1.6232420206069946, 1.6997575759887695, 1.7762731313705444, 1.8527886867523193, 1.9293042421340942, 2.005819797515869, 2.0823354721069336, 2.158850908279419, 2.2353665828704834, 2.3118820190429688, 2.388397693634033]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 9.0, 13.0, 21.0, 24.0, 36.0, 45.0, 74.0, 114.0, 156.0, 225.0, 366.0, 630.0, 980.0, 1673.0, 2941.0, 5543.0, 10590.0, 22003.0, 50222.0, 123979.0, 334936.0, 857897.0, 1332182.0, 880203.0, 345393.0, 127087.0, 50706.0, 22511.0, 10753.0, 5536.0, 3045.0, 1729.0, 1021.0, 597.0, 362.0, 217.0, 159.0, 90.0, 67.0, 36.0, 30.0, 22.0, 16.0, 18.0, 10.0, 7.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48583984375, -0.4708976745605469, -0.45595550537109375, -0.4410133361816406, -0.4260711669921875, -0.4111289978027344, -0.39618682861328125, -0.3812446594238281, -0.366302490234375, -0.3513603210449219, -0.33641815185546875, -0.3214759826660156, -0.3065338134765625, -0.2915916442871094, -0.27664947509765625, -0.2617073059082031, -0.24676513671875, -0.23182296752929688, -0.21688079833984375, -0.20193862915039062, -0.1869964599609375, -0.17205429077148438, -0.15711212158203125, -0.14216995239257812, -0.127227783203125, -0.11228561401367188, -0.09734344482421875, -0.08240127563476562, -0.0674591064453125, -0.052516937255859375, -0.03757476806640625, -0.022632598876953125, -0.0076904296875, 0.007251739501953125, 0.02219390869140625, 0.037136077880859375, 0.0520782470703125, 0.06702041625976562, 0.08196258544921875, 0.09690475463867188, 0.111846923828125, 0.12678909301757812, 0.14173126220703125, 0.15667343139648438, 0.1716156005859375, 0.18655776977539062, 0.20149993896484375, 0.21644210815429688, 0.23138427734375, 0.24632644653320312, 0.26126861572265625, 0.2762107849121094, 0.2911529541015625, 0.3060951232910156, 0.32103729248046875, 0.3359794616699219, 0.350921630859375, 0.3658638000488281, 0.38080596923828125, 0.3957481384277344, 0.4106903076171875, 0.4256324768066406, 0.44057464599609375, 0.4555168151855469, 0.470458984375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 11.0, 12.0, 10.0, 14.0, 19.0, 19.0, 23.0, 26.0, 32.0, 32.0, 40.0, 56.0, 34.0, 52.0, 56.0, 71.0, 59.0, 60.0, 53.0, 49.0, 40.0, 34.0, 41.0, 29.0, 19.0, 26.0, 17.0, 9.0, 12.0, 6.0, 8.0, 10.0, 5.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.54296875, -0.5277442932128906, -0.5125198364257812, -0.4972953796386719, -0.4820709228515625, -0.4668464660644531, -0.45162200927734375, -0.4363975524902344, -0.421173095703125, -0.4059486389160156, -0.39072418212890625, -0.3754997253417969, -0.3602752685546875, -0.3450508117675781, -0.32982635498046875, -0.3146018981933594, -0.29937744140625, -0.2841529846191406, -0.26892852783203125, -0.2537040710449219, -0.2384796142578125, -0.22325515747070312, -0.20803070068359375, -0.19280624389648438, -0.177581787109375, -0.16235733032226562, -0.14713287353515625, -0.13190841674804688, -0.1166839599609375, -0.10145950317382812, -0.08623504638671875, -0.07101058959960938, -0.0557861328125, -0.040561676025390625, -0.02533721923828125, -0.010112762451171875, 0.0051116943359375, 0.020336151123046875, 0.03556060791015625, 0.050785064697265625, 0.066009521484375, 0.08123397827148438, 0.09645843505859375, 0.11168289184570312, 0.1269073486328125, 0.14213180541992188, 0.15735626220703125, 0.17258071899414062, 0.18780517578125, 0.20302963256835938, 0.21825408935546875, 0.23347854614257812, 0.2487030029296875, 0.2639274597167969, 0.27915191650390625, 0.2943763732910156, 0.309600830078125, 0.3248252868652344, 0.34004974365234375, 0.3552742004394531, 0.3704986572265625, 0.3857231140136719, 0.40094757080078125, 0.4161720275878906, 0.431396484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 9.0, 6.0, 7.0, 12.0, 17.0, 28.0, 32.0, 53.0, 77.0, 117.0, 197.0, 329.0, 647.0, 1520.0, 4167.0, 12786.0, 46904.0, 181080.0, 660691.0, 1553615.0, 1197645.0, 392936.0, 101883.0, 26933.0, 7740.0, 2629.0, 1043.0, 473.0, 270.0, 140.0, 90.0, 62.0, 32.0, 36.0, 20.0, 13.0, 14.0, 13.0, 5.0, 1.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8193359375, -0.792724609375, -0.76611328125, -0.739501953125, -0.712890625, -0.686279296875, -0.65966796875, -0.633056640625, -0.6064453125, -0.579833984375, -0.55322265625, -0.526611328125, -0.5, -0.473388671875, -0.44677734375, -0.420166015625, -0.3935546875, -0.366943359375, -0.34033203125, -0.313720703125, -0.287109375, -0.260498046875, -0.23388671875, -0.207275390625, -0.1806640625, -0.154052734375, -0.12744140625, -0.100830078125, -0.07421875, -0.047607421875, -0.02099609375, 0.005615234375, 0.0322265625, 0.058837890625, 0.08544921875, 0.112060546875, 0.138671875, 0.165283203125, 0.19189453125, 0.218505859375, 0.2451171875, 0.271728515625, 0.29833984375, 0.324951171875, 0.3515625, 0.378173828125, 0.40478515625, 0.431396484375, 0.4580078125, 0.484619140625, 0.51123046875, 0.537841796875, 0.564453125, 0.591064453125, 0.61767578125, 0.644287109375, 0.6708984375, 0.697509765625, 0.72412109375, 0.750732421875, 0.77734375, 0.803955078125, 0.83056640625, 0.857177734375, 0.8837890625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 5.0, 5.0, 1.0, 6.0, 6.0, 6.0, 7.0, 17.0, 20.0, 21.0, 22.0, 42.0, 57.0, 54.0, 83.0, 86.0, 131.0, 155.0, 205.0, 232.0, 262.0, 285.0, 279.0, 313.0, 270.0, 240.0, 217.0, 201.0, 160.0, 134.0, 102.0, 91.0, 91.0, 55.0, 51.0, 39.0, 33.0, 25.0, 19.0, 17.0, 6.0, 9.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.483154296875, -0.4645195007324219, -0.44588470458984375, -0.4272499084472656, -0.4086151123046875, -0.3899803161621094, -0.37134552001953125, -0.3527107238769531, -0.334075927734375, -0.3154411315917969, -0.29680633544921875, -0.2781715393066406, -0.2595367431640625, -0.24090194702148438, -0.22226715087890625, -0.20363235473632812, -0.18499755859375, -0.16636276245117188, -0.14772796630859375, -0.12909317016601562, -0.1104583740234375, -0.09182357788085938, -0.07318878173828125, -0.054553985595703125, -0.035919189453125, -0.017284393310546875, 0.00135040283203125, 0.019985198974609375, 0.0386199951171875, 0.057254791259765625, 0.07588958740234375, 0.09452438354492188, 0.1131591796875, 0.13179397583007812, 0.15042877197265625, 0.16906356811523438, 0.1876983642578125, 0.20633316040039062, 0.22496795654296875, 0.24360275268554688, 0.262237548828125, 0.2808723449707031, 0.29950714111328125, 0.3181419372558594, 0.3367767333984375, 0.3554115295410156, 0.37404632568359375, 0.3926811218261719, 0.41131591796875, 0.4299507141113281, 0.44858551025390625, 0.4672203063964844, 0.4858551025390625, 0.5044898986816406, 0.5231246948242188, 0.5417594909667969, 0.560394287109375, 0.5790290832519531, 0.5976638793945312, 0.6162986755371094, 0.6349334716796875, 0.6535682678222656, 0.6722030639648438, 0.6908378601074219, 0.70947265625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 37.0, 138.0, 361.0, 328.0, 114.0, 21.0, 10.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.46112060546875, -4.008661270141602, -3.556201457977295, -3.1037421226501465, -2.65128231048584, -2.1988229751586914, -1.7463634014129639, -1.2939038276672363, -0.8414442539215088, -0.38898470997810364, 0.06347483396530151, 0.5159343481063843, 0.9683939218521118, 1.4208533763885498, 1.8733129501342773, 2.325772523880005, 2.7782320976257324, 3.23069167137146, 3.6831512451171875, 4.135610580444336, 4.588070392608643, 5.040529727935791, 5.492989540100098, 5.945448875427246, 6.3979082107543945, 6.850367546081543, 7.30282735824585, 7.755286693572998, 8.207746505737305, 8.660205841064453, 9.112665176391602, 9.56512451171875, 10.017584800720215, 10.470044136047363, 10.922503471374512, 11.374963760375977, 11.827423095703125, 12.279882431030273, 12.732341766357422, 13.18480110168457, 13.637261390686035, 14.089720726013184, 14.542180061340332, 14.994640350341797, 15.447099685668945, 15.899559020996094, 16.352018356323242, 16.80447769165039, 17.25693702697754, 17.709396362304688, 18.161855697631836, 18.614315032958984, 19.066774368286133, 19.51923370361328, 19.971694946289062, 20.42415428161621, 20.87661361694336, 21.329072952270508, 21.781532287597656, 22.233991622924805, 22.686450958251953, 23.138912200927734, 23.591371536254883, 24.04383087158203, 24.49629020690918]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 7.0, 14.0, 8.0, 10.0, 15.0, 20.0, 21.0, 14.0, 25.0, 29.0, 37.0, 43.0, 41.0, 39.0, 31.0, 29.0, 40.0, 44.0, 46.0, 45.0, 45.0, 38.0, 32.0, 37.0, 37.0, 37.0, 26.0, 25.0, 14.0, 21.0, 23.0, 14.0, 14.0, 11.0, 6.0, 9.0, 9.0, 5.0, 5.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-2.589674472808838, -2.513974905014038, -2.4382753372192383, -2.3625755310058594, -2.2868759632110596, -2.2111763954162598, -2.13547682762146, -2.05977725982666, -1.9840775728225708, -1.908378005027771, -1.8326783180236816, -1.7569787502288818, -1.681279182434082, -1.6055794954299927, -1.5298799276351929, -1.4541802406311035, -1.3784806728363037, -1.302781105041504, -1.2270814180374146, -1.1513818502426147, -1.0756821632385254, -0.9999825954437256, -0.9242830276489258, -0.8485834002494812, -0.7728837728500366, -0.697184145450592, -0.6214845180511475, -0.5457849502563477, -0.4700853228569031, -0.3943856954574585, -0.3186860978603363, -0.2429865002632141, -0.16728663444519043, -0.09158702194690704, -0.015887409448623657, 0.05981220304965973, 0.13551181554794312, 0.2112114429473877, 0.2869110405445099, 0.3626106381416321, 0.43831026554107666, 0.5140098929405212, 0.5897095203399658, 0.6654090881347656, 0.7411087155342102, 0.8168083429336548, 0.8925079107284546, 0.9682075381278992, 1.0439071655273438, 1.1196067333221436, 1.195306420326233, 1.2710059881210327, 1.346705675125122, 1.4224052429199219, 1.4981048107147217, 1.5738043785095215, 1.6495040655136108, 1.7252036333084106, 1.8009033203125, 1.8766028881072998, 1.9523024559020996, 2.0280022621154785, 2.1037018299102783, 2.179401397705078, 2.255100965499878]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 9.0, 7.0, 12.0, 15.0, 25.0, 33.0, 51.0, 75.0, 145.0, 234.0, 470.0, 951.0, 1777.0, 3600.0, 7647.0, 15316.0, 31440.0, 66145.0, 132747.0, 225332.0, 244610.0, 159866.0, 81460.0, 39520.0, 18798.0, 9094.0, 4514.0, 2241.0, 1132.0, 566.0, 298.0, 171.0, 104.0, 54.0, 39.0, 20.0, 17.0, 9.0, 7.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97265625, -0.9392852783203125, -0.905914306640625, -0.8725433349609375, -0.83917236328125, -0.8058013916015625, -0.772430419921875, -0.7390594482421875, -0.7056884765625, -0.6723175048828125, -0.638946533203125, -0.6055755615234375, -0.57220458984375, -0.5388336181640625, -0.505462646484375, -0.4720916748046875, -0.438720703125, -0.4053497314453125, -0.371978759765625, -0.3386077880859375, -0.30523681640625, -0.2718658447265625, -0.238494873046875, -0.2051239013671875, -0.1717529296875, -0.1383819580078125, -0.105010986328125, -0.0716400146484375, -0.03826904296875, -0.0048980712890625, 0.028472900390625, 0.0618438720703125, 0.09521484375, 0.1285858154296875, 0.161956787109375, 0.1953277587890625, 0.22869873046875, 0.2620697021484375, 0.295440673828125, 0.3288116455078125, 0.3621826171875, 0.3955535888671875, 0.428924560546875, 0.4622955322265625, 0.49566650390625, 0.5290374755859375, 0.562408447265625, 0.5957794189453125, 0.629150390625, 0.6625213623046875, 0.695892333984375, 0.7292633056640625, 0.76263427734375, 0.7960052490234375, 0.829376220703125, 0.8627471923828125, 0.8961181640625, 0.9294891357421875, 0.962860107421875, 0.9962310791015625, 1.02960205078125, 1.0629730224609375, 1.096343994140625, 1.1297149658203125, 1.1630859375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 10.0, 8.0, 12.0, 19.0, 10.0, 18.0, 21.0, 26.0, 37.0, 32.0, 37.0, 38.0, 50.0, 62.0, 52.0, 69.0, 48.0, 57.0, 64.0, 50.0, 50.0, 29.0, 35.0, 38.0, 26.0, 23.0, 31.0, 10.0, 12.0, 9.0, 6.0, 9.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.54833984375, -0.5331344604492188, -0.5179290771484375, -0.5027236938476562, -0.487518310546875, -0.47231292724609375, -0.4571075439453125, -0.44190216064453125, -0.42669677734375, -0.41149139404296875, -0.3962860107421875, -0.38108062744140625, -0.365875244140625, -0.35066986083984375, -0.3354644775390625, -0.32025909423828125, -0.3050537109375, -0.28984832763671875, -0.2746429443359375, -0.25943756103515625, -0.244232177734375, -0.22902679443359375, -0.2138214111328125, -0.19861602783203125, -0.18341064453125, -0.16820526123046875, -0.1529998779296875, -0.13779449462890625, -0.122589111328125, -0.10738372802734375, -0.0921783447265625, -0.07697296142578125, -0.061767578125, -0.04656219482421875, -0.0313568115234375, -0.01615142822265625, -0.000946044921875, 0.01425933837890625, 0.0294647216796875, 0.04467010498046875, 0.05987548828125, 0.07508087158203125, 0.0902862548828125, 0.10549163818359375, 0.120697021484375, 0.13590240478515625, 0.1511077880859375, 0.16631317138671875, 0.1815185546875, 0.19672393798828125, 0.2119293212890625, 0.22713470458984375, 0.242340087890625, 0.25754547119140625, 0.2727508544921875, 0.28795623779296875, 0.30316162109375, 0.31836700439453125, 0.3335723876953125, 0.34877777099609375, 0.363983154296875, 0.37918853759765625, 0.3943939208984375, 0.40959930419921875, 0.4248046875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 11.0, 9.0, 20.0, 19.0, 32.0, 44.0, 77.0, 102.0, 136.0, 217.0, 360.0, 667.0, 1140.0, 2239.0, 4469.0, 8278.0, 16502.0, 31433.0, 60536.0, 112368.0, 188514.0, 226513.0, 175339.0, 103835.0, 55416.0, 29087.0, 14882.0, 7520.0, 4040.0, 2066.0, 1094.0, 602.0, 324.0, 233.0, 126.0, 90.0, 59.0, 37.0, 28.0, 24.0, 18.0, 13.0, 8.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 3.0], "bins": [-1.08203125, -1.0514907836914062, -1.0209503173828125, -0.9904098510742188, -0.959869384765625, -0.9293289184570312, -0.8987884521484375, -0.8682479858398438, -0.83770751953125, -0.8071670532226562, -0.7766265869140625, -0.7460861206054688, -0.715545654296875, -0.6850051879882812, -0.6544647216796875, -0.6239242553710938, -0.5933837890625, -0.5628433227539062, -0.5323028564453125, -0.5017623901367188, -0.471221923828125, -0.44068145751953125, -0.4101409912109375, -0.37960052490234375, -0.34906005859375, -0.31851959228515625, -0.2879791259765625, -0.25743865966796875, -0.226898193359375, -0.19635772705078125, -0.1658172607421875, -0.13527679443359375, -0.104736328125, -0.07419586181640625, -0.0436553955078125, -0.01311492919921875, 0.017425537109375, 0.04796600341796875, 0.0785064697265625, 0.10904693603515625, 0.13958740234375, 0.17012786865234375, 0.2006683349609375, 0.23120880126953125, 0.261749267578125, 0.29228973388671875, 0.3228302001953125, 0.35337066650390625, 0.3839111328125, 0.41445159912109375, 0.4449920654296875, 0.47553253173828125, 0.506072998046875, 0.5366134643554688, 0.5671539306640625, 0.5976943969726562, 0.62823486328125, 0.6587753295898438, 0.6893157958984375, 0.7198562622070312, 0.750396728515625, 0.7809371948242188, 0.8114776611328125, 0.8420181274414062, 0.87255859375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 7.0, 5.0, 2.0, 10.0, 21.0, 17.0, 15.0, 20.0, 19.0, 18.0, 25.0, 27.0, 46.0, 26.0, 33.0, 41.0, 39.0, 48.0, 40.0, 46.0, 38.0, 53.0, 41.0, 38.0, 32.0, 27.0, 36.0, 31.0, 34.0, 20.0, 23.0, 15.0, 15.0, 16.0, 20.0, 11.0, 7.0, 9.0, 4.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.890625, -0.8608551025390625, -0.831085205078125, -0.8013153076171875, -0.77154541015625, -0.7417755126953125, -0.712005615234375, -0.6822357177734375, -0.6524658203125, -0.6226959228515625, -0.592926025390625, -0.5631561279296875, -0.53338623046875, -0.5036163330078125, -0.473846435546875, -0.4440765380859375, -0.414306640625, -0.3845367431640625, -0.354766845703125, -0.3249969482421875, -0.29522705078125, -0.2654571533203125, -0.235687255859375, -0.2059173583984375, -0.1761474609375, -0.1463775634765625, -0.116607666015625, -0.0868377685546875, -0.05706787109375, -0.0272979736328125, 0.002471923828125, 0.0322418212890625, 0.06201171875, 0.0917816162109375, 0.121551513671875, 0.1513214111328125, 0.18109130859375, 0.2108612060546875, 0.240631103515625, 0.2704010009765625, 0.3001708984375, 0.3299407958984375, 0.359710693359375, 0.3894805908203125, 0.41925048828125, 0.4490203857421875, 0.478790283203125, 0.5085601806640625, 0.538330078125, 0.5680999755859375, 0.597869873046875, 0.6276397705078125, 0.65740966796875, 0.6871795654296875, 0.716949462890625, 0.7467193603515625, 0.7764892578125, 0.8062591552734375, 0.836029052734375, 0.8657989501953125, 0.89556884765625, 0.9253387451171875, 0.955108642578125, 0.9848785400390625, 1.0146484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 9.0, 8.0, 6.0, 23.0, 18.0, 31.0, 41.0, 53.0, 85.0, 137.0, 218.0, 345.0, 587.0, 1096.0, 2869.0, 10627.0, 79702.0, 535940.0, 364377.0, 41413.0, 6628.0, 2105.0, 919.0, 456.0, 290.0, 172.0, 107.0, 98.0, 67.0, 37.0, 31.0, 19.0, 15.0, 7.0, 11.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5380859375, -1.4882354736328125, -1.438385009765625, -1.3885345458984375, -1.33868408203125, -1.2888336181640625, -1.238983154296875, -1.1891326904296875, -1.1392822265625, -1.0894317626953125, -1.039581298828125, -0.9897308349609375, -0.93988037109375, -0.8900299072265625, -0.840179443359375, -0.7903289794921875, -0.740478515625, -0.6906280517578125, -0.640777587890625, -0.5909271240234375, -0.54107666015625, -0.4912261962890625, -0.441375732421875, -0.3915252685546875, -0.3416748046875, -0.2918243408203125, -0.241973876953125, -0.1921234130859375, -0.14227294921875, -0.0924224853515625, -0.042572021484375, 0.0072784423828125, 0.05712890625, 0.1069793701171875, 0.156829833984375, 0.2066802978515625, 0.25653076171875, 0.3063812255859375, 0.356231689453125, 0.4060821533203125, 0.4559326171875, 0.5057830810546875, 0.555633544921875, 0.6054840087890625, 0.65533447265625, 0.7051849365234375, 0.755035400390625, 0.8048858642578125, 0.854736328125, 0.9045867919921875, 0.954437255859375, 1.0042877197265625, 1.05413818359375, 1.1039886474609375, 1.153839111328125, 1.2036895751953125, 1.2535400390625, 1.3033905029296875, 1.353240966796875, 1.4030914306640625, 1.45294189453125, 1.5027923583984375, 1.552642822265625, 1.6024932861328125, 1.65234375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 4.0, 5.0, 16.0, 12.0, 20.0, 43.0, 36.0, 80.0, 121.0, 164.0, 148.0, 122.0, 89.0, 43.0, 36.0, 20.0, 11.0, 10.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017452239990234375, -0.00016871094703674316, -0.00016289949417114258, -0.000157088041305542, -0.0001512765884399414, -0.00014546513557434082, -0.00013965368270874023, -0.00013384222984313965, -0.00012803077697753906, -0.00012221932411193848, -0.00011640787124633789, -0.0001105964183807373, -0.00010478496551513672, -9.897351264953613e-05, -9.316205978393555e-05, -8.735060691833496e-05, -8.153915405273438e-05, -7.572770118713379e-05, -6.99162483215332e-05, -6.410479545593262e-05, -5.829334259033203e-05, -5.2481889724731445e-05, -4.667043685913086e-05, -4.0858983993530273e-05, -3.504753112792969e-05, -2.92360782623291e-05, -2.3424625396728516e-05, -1.761317253112793e-05, -1.1801719665527344e-05, -5.990266799926758e-06, -1.7881393432617188e-07, 5.632638931274414e-06, 1.1444091796875e-05, 1.7255544662475586e-05, 2.3066997528076172e-05, 2.8878450393676758e-05, 3.4689903259277344e-05, 4.050135612487793e-05, 4.6312808990478516e-05, 5.21242618560791e-05, 5.793571472167969e-05, 6.374716758728027e-05, 6.955862045288086e-05, 7.537007331848145e-05, 8.118152618408203e-05, 8.699297904968262e-05, 9.28044319152832e-05, 9.861588478088379e-05, 0.00010442733764648438, 0.00011023879051208496, 0.00011605024337768555, 0.00012186169624328613, 0.00012767314910888672, 0.0001334846019744873, 0.0001392960548400879, 0.00014510750770568848, 0.00015091896057128906, 0.00015673041343688965, 0.00016254186630249023, 0.00016835331916809082, 0.0001741647720336914, 0.000179976224899292, 0.00018578767776489258, 0.00019159913063049316, 0.00019741058349609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 4.0, 4.0, 6.0, 7.0, 18.0, 19.0, 27.0, 57.0, 65.0, 121.0, 188.0, 350.0, 750.0, 1566.0, 3069.0, 6655.0, 15212.0, 35982.0, 81320.0, 162357.0, 236879.0, 228356.0, 147867.0, 72154.0, 30631.0, 13304.0, 5980.0, 2733.0, 1376.0, 657.0, 350.0, 178.0, 113.0, 70.0, 45.0, 23.0, 20.0, 16.0, 6.0, 6.0, 5.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.429931640625, -0.4155616760253906, -0.40119171142578125, -0.3868217468261719, -0.3724517822265625, -0.3580818176269531, -0.34371185302734375, -0.3293418884277344, -0.314971923828125, -0.3006019592285156, -0.28623199462890625, -0.2718620300292969, -0.2574920654296875, -0.24312210083007812, -0.22875213623046875, -0.21438217163085938, -0.20001220703125, -0.18564224243164062, -0.17127227783203125, -0.15690231323242188, -0.1425323486328125, -0.12816238403320312, -0.11379241943359375, -0.09942245483398438, -0.085052490234375, -0.07068252563476562, -0.05631256103515625, -0.041942596435546875, -0.0275726318359375, -0.013202667236328125, 0.00116729736328125, 0.015537261962890625, 0.0299072265625, 0.044277191162109375, 0.05864715576171875, 0.07301712036132812, 0.0873870849609375, 0.10175704956054688, 0.11612701416015625, 0.13049697875976562, 0.144866943359375, 0.15923690795898438, 0.17360687255859375, 0.18797683715820312, 0.2023468017578125, 0.21671676635742188, 0.23108673095703125, 0.24545669555664062, 0.25982666015625, 0.2741966247558594, 0.28856658935546875, 0.3029365539550781, 0.3173065185546875, 0.3316764831542969, 0.34604644775390625, 0.3604164123535156, 0.374786376953125, 0.3891563415527344, 0.40352630615234375, 0.4178962707519531, 0.4322662353515625, 0.4466361999511719, 0.46100616455078125, 0.4753761291503906, 0.48974609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 3.0, 2.0, 3.0, 6.0, 3.0, 8.0, 5.0, 7.0, 12.0, 20.0, 13.0, 18.0, 23.0, 25.0, 30.0, 26.0, 38.0, 28.0, 41.0, 31.0, 46.0, 45.0, 42.0, 60.0, 54.0, 48.0, 50.0, 36.0, 34.0, 29.0, 42.0, 36.0, 24.0, 14.0, 21.0, 16.0, 12.0, 4.0, 8.0, 8.0, 6.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.2724609375, -0.2631988525390625, -0.253936767578125, -0.2446746826171875, -0.23541259765625, -0.2261505126953125, -0.216888427734375, -0.2076263427734375, -0.1983642578125, -0.1891021728515625, -0.179840087890625, -0.1705780029296875, -0.16131591796875, -0.1520538330078125, -0.142791748046875, -0.1335296630859375, -0.124267578125, -0.1150054931640625, -0.105743408203125, -0.0964813232421875, -0.08721923828125, -0.0779571533203125, -0.068695068359375, -0.0594329833984375, -0.0501708984375, -0.0409088134765625, -0.031646728515625, -0.0223846435546875, -0.01312255859375, -0.0038604736328125, 0.005401611328125, 0.0146636962890625, 0.02392578125, 0.0331878662109375, 0.042449951171875, 0.0517120361328125, 0.06097412109375, 0.0702362060546875, 0.079498291015625, 0.0887603759765625, 0.0980224609375, 0.1072845458984375, 0.116546630859375, 0.1258087158203125, 0.13507080078125, 0.1443328857421875, 0.153594970703125, 0.1628570556640625, 0.172119140625, 0.1813812255859375, 0.190643310546875, 0.1999053955078125, 0.20916748046875, 0.2184295654296875, 0.227691650390625, 0.2369537353515625, 0.2462158203125, 0.2554779052734375, 0.264739990234375, 0.2740020751953125, 0.28326416015625, 0.2925262451171875, 0.301788330078125, 0.3110504150390625, 0.3203125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 12.0, 8.0, 9.0, 18.0, 28.0, 32.0, 34.0, 34.0, 64.0, 60.0, 76.0, 67.0, 63.0, 76.0, 66.0, 63.0, 44.0, 55.0, 44.0, 24.0, 30.0, 20.0, 13.0, 22.0, 9.0, 5.0, 5.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8996150493621826, -2.809063196182251, -2.7185111045837402, -2.6279592514038086, -2.537407159805298, -2.446855306625366, -2.3563032150268555, -2.265751361846924, -2.175199508666992, -2.0846476554870605, -1.9940955638885498, -1.9035437107086182, -1.8129916191101074, -1.7224397659301758, -1.6318877935409546, -1.5413358211517334, -1.4507837295532227, -1.3602317571640015, -1.2696797847747803, -1.1791279315948486, -1.088575839996338, -0.9980239272117615, -0.9074720144271851, -0.8169200420379639, -0.7263680696487427, -0.6358160972595215, -0.5452641248703003, -0.4547122120857239, -0.3641602396965027, -0.2736082673072815, -0.18305635452270508, -0.09250438213348389, -0.0019526481628417969, 0.0885993093252182, 0.1791512668132782, 0.269703209400177, 0.3602551817893982, 0.4508071541786194, 0.5413590669631958, 0.631911039352417, 0.7224630117416382, 0.8130149841308594, 0.9035669565200806, 0.994118869304657, 1.0846707820892334, 1.1752228736877441, 1.2657747268676758, 1.356326699256897, 1.4468786716461182, 1.5374306440353394, 1.6279826164245605, 1.7185344696044922, 1.809086561203003, 1.8996384143829346, 1.9901903867721558, 2.080742359161377, 2.1712942123413086, 2.2618460655212402, 2.352398157119751, 2.4429500102996826, 2.5335021018981934, 2.624053955078125, 2.7146058082580566, 2.8051578998565674, 2.895709991455078]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 7.0, 8.0, 8.0, 11.0, 8.0, 16.0, 16.0, 20.0, 24.0, 28.0, 27.0, 32.0, 31.0, 30.0, 44.0, 44.0, 31.0, 46.0, 53.0, 39.0, 42.0, 41.0, 58.0, 44.0, 39.0, 28.0, 33.0, 29.0, 27.0, 27.0, 23.0, 14.0, 16.0, 14.0, 9.0, 5.0, 4.0, 4.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.0752735137939453, -2.9814839363098145, -2.8876943588256836, -2.7939047813415527, -2.700115442276001, -2.60632586479187, -2.5125362873077393, -2.4187467098236084, -2.3249571323394775, -2.2311675548553467, -2.137377977371216, -2.043588638305664, -1.9497989416122437, -1.8560094833374023, -1.7622199058532715, -1.6684303283691406, -1.5746408700942993, -1.4808512926101685, -1.3870618343353271, -1.2932722568511963, -1.1994826793670654, -1.1056931018829346, -1.0119036436080933, -0.9181140661239624, -0.8243245482444763, -0.7305350303649902, -0.6367454528808594, -0.5429559350013733, -0.4491663873195648, -0.35537683963775635, -0.26158732175827026, -0.1677977442741394, -0.07400822639465332, 0.019781313836574554, 0.11357085406780243, 0.2073603868484497, 0.3011499345302582, 0.39493948221206665, 0.48872900009155273, 0.5825185775756836, 0.6763080954551697, 0.7700976133346558, 0.8638871908187866, 0.9576767086982727, 1.0514662265777588, 1.1452558040618896, 1.2390453815460205, 1.3328349590301514, 1.4266244173049927, 1.5204139947891235, 1.6142034530639648, 1.7079930305480957, 1.8017826080322266, 1.8955721855163574, 1.9893616437911987, 2.083151340484619, 2.176940679550171, 2.2707302570343018, 2.3645198345184326, 2.4583091735839844, 2.5520987510681152, 2.645888328552246, 2.739677906036377, 2.833467483520508, 2.9272570610046387]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 6.0, 5.0, 10.0, 11.0, 8.0, 21.0, 19.0, 22.0, 27.0, 39.0, 54.0, 83.0, 113.0, 258.0, 597.0, 2085.0, 11067.0, 103959.0, 1607052.0, 2269289.0, 178955.0, 16466.0, 2674.0, 713.0, 304.0, 128.0, 90.0, 59.0, 44.0, 26.0, 18.0, 21.0, 16.0, 7.0, 6.0, 7.0, 10.0, 4.0, 7.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.4453125, -1.4052734375, -1.365234375, -1.3251953125, -1.28515625, -1.2451171875, -1.205078125, -1.1650390625, -1.125, -1.0849609375, -1.044921875, -1.0048828125, -0.96484375, -0.9248046875, -0.884765625, -0.8447265625, -0.8046875, -0.7646484375, -0.724609375, -0.6845703125, -0.64453125, -0.6044921875, -0.564453125, -0.5244140625, -0.484375, -0.4443359375, -0.404296875, -0.3642578125, -0.32421875, -0.2841796875, -0.244140625, -0.2041015625, -0.1640625, -0.1240234375, -0.083984375, -0.0439453125, -0.00390625, 0.0361328125, 0.076171875, 0.1162109375, 0.15625, 0.1962890625, 0.236328125, 0.2763671875, 0.31640625, 0.3564453125, 0.396484375, 0.4365234375, 0.4765625, 0.5166015625, 0.556640625, 0.5966796875, 0.63671875, 0.6767578125, 0.716796875, 0.7568359375, 0.796875, 0.8369140625, 0.876953125, 0.9169921875, 0.95703125, 0.9970703125, 1.037109375, 1.0771484375, 1.1171875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 9.0, 7.0, 11.0, 11.0, 16.0, 21.0, 19.0, 32.0, 26.0, 41.0, 47.0, 28.0, 55.0, 45.0, 50.0, 61.0, 57.0, 57.0, 51.0, 46.0, 53.0, 27.0, 27.0, 46.0, 33.0, 25.0, 23.0, 18.0, 17.0, 11.0, 8.0, 6.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.53759765625, -0.5223236083984375, -0.507049560546875, -0.4917755126953125, -0.47650146484375, -0.4612274169921875, -0.445953369140625, -0.4306793212890625, -0.4154052734375, -0.4001312255859375, -0.384857177734375, -0.3695831298828125, -0.35430908203125, -0.3390350341796875, -0.323760986328125, -0.3084869384765625, -0.293212890625, -0.2779388427734375, -0.262664794921875, -0.2473907470703125, -0.23211669921875, -0.2168426513671875, -0.201568603515625, -0.1862945556640625, -0.1710205078125, -0.1557464599609375, -0.140472412109375, -0.1251983642578125, -0.10992431640625, -0.0946502685546875, -0.079376220703125, -0.0641021728515625, -0.048828125, -0.0335540771484375, -0.018280029296875, -0.0030059814453125, 0.01226806640625, 0.0275421142578125, 0.042816162109375, 0.0580902099609375, 0.0733642578125, 0.0886383056640625, 0.103912353515625, 0.1191864013671875, 0.13446044921875, 0.1497344970703125, 0.165008544921875, 0.1802825927734375, 0.195556640625, 0.2108306884765625, 0.226104736328125, 0.2413787841796875, 0.25665283203125, 0.2719268798828125, 0.287200927734375, 0.3024749755859375, 0.3177490234375, 0.3330230712890625, 0.348297119140625, 0.3635711669921875, 0.37884521484375, 0.3941192626953125, 0.409393310546875, 0.4246673583984375, 0.43994140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 11.0, 15.0, 31.0, 36.0, 52.0, 87.0, 133.0, 211.0, 361.0, 672.0, 1557.0, 3686.0, 10787.0, 37359.0, 141897.0, 531156.0, 1416082.0, 1367378.0, 498005.0, 133270.0, 34749.0, 10244.0, 3483.0, 1429.0, 653.0, 357.0, 203.0, 134.0, 69.0, 48.0, 32.0, 34.0, 23.0, 4.0, 8.0, 6.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6865234375, -0.66107177734375, -0.6356201171875, -0.61016845703125, -0.584716796875, -0.55926513671875, -0.5338134765625, -0.50836181640625, -0.48291015625, -0.45745849609375, -0.4320068359375, -0.40655517578125, -0.381103515625, -0.35565185546875, -0.3302001953125, -0.30474853515625, -0.279296875, -0.25384521484375, -0.2283935546875, -0.20294189453125, -0.177490234375, -0.15203857421875, -0.1265869140625, -0.10113525390625, -0.07568359375, -0.05023193359375, -0.0247802734375, 0.00067138671875, 0.026123046875, 0.05157470703125, 0.0770263671875, 0.10247802734375, 0.1279296875, 0.15338134765625, 0.1788330078125, 0.20428466796875, 0.229736328125, 0.25518798828125, 0.2806396484375, 0.30609130859375, 0.33154296875, 0.35699462890625, 0.3824462890625, 0.40789794921875, 0.433349609375, 0.45880126953125, 0.4842529296875, 0.50970458984375, 0.53515625, 0.56060791015625, 0.5860595703125, 0.61151123046875, 0.636962890625, 0.66241455078125, 0.6878662109375, 0.71331787109375, 0.73876953125, 0.76422119140625, 0.7896728515625, 0.81512451171875, 0.840576171875, 0.86602783203125, 0.8914794921875, 0.91693115234375, 0.9423828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 5.0, 8.0, 4.0, 9.0, 20.0, 14.0, 16.0, 25.0, 48.0, 62.0, 72.0, 84.0, 102.0, 147.0, 188.0, 190.0, 233.0, 291.0, 304.0, 312.0, 305.0, 258.0, 265.0, 217.0, 212.0, 157.0, 122.0, 109.0, 82.0, 49.0, 42.0, 29.0, 22.0, 15.0, 14.0, 8.0, 13.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.701171875, -0.6815643310546875, -0.661956787109375, -0.6423492431640625, -0.62274169921875, -0.6031341552734375, -0.583526611328125, -0.5639190673828125, -0.5443115234375, -0.5247039794921875, -0.505096435546875, -0.4854888916015625, -0.46588134765625, -0.4462738037109375, -0.426666259765625, -0.4070587158203125, -0.387451171875, -0.3678436279296875, -0.348236083984375, -0.3286285400390625, -0.30902099609375, -0.2894134521484375, -0.269805908203125, -0.2501983642578125, -0.2305908203125, -0.2109832763671875, -0.191375732421875, -0.1717681884765625, -0.15216064453125, -0.1325531005859375, -0.112945556640625, -0.0933380126953125, -0.07373046875, -0.0541229248046875, -0.034515380859375, -0.0149078369140625, 0.00469970703125, 0.0243072509765625, 0.043914794921875, 0.0635223388671875, 0.0831298828125, 0.1027374267578125, 0.122344970703125, 0.1419525146484375, 0.16156005859375, 0.1811676025390625, 0.200775146484375, 0.2203826904296875, 0.239990234375, 0.2595977783203125, 0.279205322265625, 0.2988128662109375, 0.31842041015625, 0.3380279541015625, 0.357635498046875, 0.3772430419921875, 0.3968505859375, 0.4164581298828125, 0.436065673828125, 0.4556732177734375, 0.47528076171875, 0.4948883056640625, 0.514495849609375, 0.5341033935546875, 0.5537109375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 9.0, 8.0, 12.0, 22.0, 50.0, 48.0, 64.0, 68.0, 85.0, 89.0, 72.0, 89.0, 77.0, 93.0, 62.0, 46.0, 39.0, 23.0, 12.0, 8.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.7697625160217285, -3.666752338409424, -3.563742160797119, -3.4607319831848145, -3.3577215671539307, -3.254711389541626, -3.1517012119293213, -3.0486910343170166, -2.945680618286133, -2.842670440673828, -2.7396602630615234, -2.6366500854492188, -2.533639669418335, -2.4306294918060303, -2.3276193141937256, -2.224609136581421, -2.121598958969116, -2.0185887813568115, -1.9155784845352173, -1.8125683069229126, -1.7095580101013184, -1.6065478324890137, -1.503537654876709, -1.4005274772644043, -1.29751718044281, -1.1945070028305054, -1.0914967060089111, -0.9884865283966064, -0.885476291179657, -0.7824660539627075, -0.6794558763504028, -0.5764456391334534, -0.4734354019165039, -0.37042516469955444, -0.26741495728492737, -0.1644047498703003, -0.06139451265335083, 0.04161572456359863, 0.14462590217590332, 0.24763613939285278, 0.35064637660980225, 0.4536566138267517, 0.5566668510437012, 0.6596770286560059, 0.7626872658729553, 0.8656975030899048, 0.9687076807022095, 1.0717179775238037, 1.1747281551361084, 1.277738332748413, 1.3807486295700073, 1.483758807182312, 1.5867691040039062, 1.689779281616211, 1.7927894592285156, 1.8957996368408203, 1.9988099336624146, 2.101820230484009, 2.2048304080963135, 2.307840585708618, 2.410850763320923, 2.5138611793518066, 2.6168713569641113, 2.719881534576416, 2.8228917121887207]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 0.0, 5.0, 8.0, 5.0, 5.0, 11.0, 9.0, 18.0, 18.0, 19.0, 28.0, 25.0, 28.0, 31.0, 32.0, 29.0, 43.0, 50.0, 34.0, 49.0, 50.0, 56.0, 52.0, 40.0, 51.0, 40.0, 37.0, 37.0, 26.0, 20.0, 23.0, 28.0, 21.0, 14.0, 13.0, 10.0, 15.0, 4.0, 5.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4814047813415527, -2.399526596069336, -2.317648410797119, -2.2357699871063232, -2.1538918018341064, -2.0720136165618896, -1.9901353120803833, -1.908257007598877, -1.8263788223266602, -1.7445006370544434, -1.662622332572937, -1.5807440280914307, -1.4988658428192139, -1.416987657546997, -1.3351093530654907, -1.2532310485839844, -1.1713528633117676, -1.0894746780395508, -1.0075963735580444, -0.9257181286811829, -0.8438398838043213, -0.7619616389274597, -0.6800833940505981, -0.5982051491737366, -0.516326904296875, -0.4344486594200134, -0.35257041454315186, -0.2706921696662903, -0.1888139247894287, -0.10693567991256714, -0.025057435035705566, 0.056820809841156006, 0.13869881629943848, 0.22057706117630005, 0.3024553060531616, 0.3843335509300232, 0.46621179580688477, 0.5480900406837463, 0.6299682855606079, 0.7118465304374695, 0.793724775314331, 0.8756030201911926, 0.9574812650680542, 1.0393595695495605, 1.1212377548217773, 1.2031159400939941, 1.2849942445755005, 1.3668725490570068, 1.4487507343292236, 1.5306289196014404, 1.6125072240829468, 1.6943855285644531, 1.77626371383667, 1.8581418991088867, 1.940020203590393, 2.0218985080718994, 2.103776693344116, 2.185654878616333, 2.267533302307129, 2.3494114875793457, 2.4312896728515625, 2.5131678581237793, 2.595046043395996, 2.676924467086792, 2.758802652359009]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 16.0, 14.0, 19.0, 20.0, 51.0, 77.0, 133.0, 270.0, 448.0, 809.0, 1601.0, 2900.0, 5439.0, 10078.0, 19910.0, 41907.0, 91640.0, 183907.0, 263344.0, 211964.0, 112946.0, 51202.0, 23818.0, 12150.0, 6411.0, 3489.0, 1794.0, 972.0, 534.0, 290.0, 163.0, 70.0, 54.0, 41.0, 18.0, 14.0, 5.0, 9.0, 9.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9052734375, -0.8725128173828125, -0.839752197265625, -0.8069915771484375, -0.77423095703125, -0.7414703369140625, -0.708709716796875, -0.6759490966796875, -0.6431884765625, -0.6104278564453125, -0.577667236328125, -0.5449066162109375, -0.51214599609375, -0.4793853759765625, -0.446624755859375, -0.4138641357421875, -0.381103515625, -0.3483428955078125, -0.315582275390625, -0.2828216552734375, -0.25006103515625, -0.2173004150390625, -0.184539794921875, -0.1517791748046875, -0.1190185546875, -0.0862579345703125, -0.053497314453125, -0.0207366943359375, 0.01202392578125, 0.0447845458984375, 0.077545166015625, 0.1103057861328125, 0.14306640625, 0.1758270263671875, 0.208587646484375, 0.2413482666015625, 0.27410888671875, 0.3068695068359375, 0.339630126953125, 0.3723907470703125, 0.4051513671875, 0.4379119873046875, 0.470672607421875, 0.5034332275390625, 0.53619384765625, 0.5689544677734375, 0.601715087890625, 0.6344757080078125, 0.667236328125, 0.6999969482421875, 0.732757568359375, 0.7655181884765625, 0.79827880859375, 0.8310394287109375, 0.863800048828125, 0.8965606689453125, 0.9293212890625, 0.9620819091796875, 0.994842529296875, 1.0276031494140625, 1.06036376953125, 1.0931243896484375, 1.125885009765625, 1.1586456298828125, 1.19140625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 5.0, 9.0, 6.0, 12.0, 6.0, 15.0, 18.0, 25.0, 22.0, 22.0, 30.0, 40.0, 36.0, 39.0, 41.0, 51.0, 50.0, 53.0, 61.0, 51.0, 49.0, 48.0, 52.0, 33.0, 42.0, 25.0, 28.0, 28.0, 25.0, 19.0, 17.0, 19.0, 10.0, 3.0, 3.0, 6.0, 8.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4970703125, -0.48294830322265625, -0.4688262939453125, -0.45470428466796875, -0.440582275390625, -0.42646026611328125, -0.4123382568359375, -0.39821624755859375, -0.38409423828125, -0.36997222900390625, -0.3558502197265625, -0.34172821044921875, -0.327606201171875, -0.31348419189453125, -0.2993621826171875, -0.28524017333984375, -0.2711181640625, -0.25699615478515625, -0.2428741455078125, -0.22875213623046875, -0.214630126953125, -0.20050811767578125, -0.1863861083984375, -0.17226409912109375, -0.15814208984375, -0.14402008056640625, -0.1298980712890625, -0.11577606201171875, -0.101654052734375, -0.08753204345703125, -0.0734100341796875, -0.05928802490234375, -0.045166015625, -0.03104400634765625, -0.0169219970703125, -0.00279998779296875, 0.011322021484375, 0.02544403076171875, 0.0395660400390625, 0.05368804931640625, 0.06781005859375, 0.08193206787109375, 0.0960540771484375, 0.11017608642578125, 0.124298095703125, 0.13842010498046875, 0.1525421142578125, 0.16666412353515625, 0.1807861328125, 0.19490814208984375, 0.2090301513671875, 0.22315216064453125, 0.237274169921875, 0.25139617919921875, 0.2655181884765625, 0.27964019775390625, 0.29376220703125, 0.30788421630859375, 0.3220062255859375, 0.33612823486328125, 0.350250244140625, 0.36437225341796875, 0.3784942626953125, 0.39261627197265625, 0.40673828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 7.0, 3.0, 8.0, 11.0, 8.0, 11.0, 16.0, 21.0, 36.0, 44.0, 74.0, 70.0, 118.0, 152.0, 270.0, 460.0, 815.0, 1618.0, 3526.0, 7871.0, 18685.0, 44757.0, 105039.0, 210894.0, 279874.0, 201205.0, 98734.0, 42153.0, 17690.0, 7512.0, 3360.0, 1500.0, 777.0, 416.0, 263.0, 187.0, 131.0, 71.0, 46.0, 41.0, 23.0, 18.0, 16.0, 17.0, 6.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9541015625, -0.9205780029296875, -0.887054443359375, -0.8535308837890625, -0.82000732421875, -0.7864837646484375, -0.752960205078125, -0.7194366455078125, -0.6859130859375, -0.6523895263671875, -0.618865966796875, -0.5853424072265625, -0.55181884765625, -0.5182952880859375, -0.484771728515625, -0.4512481689453125, -0.417724609375, -0.3842010498046875, -0.350677490234375, -0.3171539306640625, -0.28363037109375, -0.2501068115234375, -0.216583251953125, -0.1830596923828125, -0.1495361328125, -0.1160125732421875, -0.082489013671875, -0.0489654541015625, -0.01544189453125, 0.0180816650390625, 0.051605224609375, 0.0851287841796875, 0.11865234375, 0.1521759033203125, 0.185699462890625, 0.2192230224609375, 0.25274658203125, 0.2862701416015625, 0.319793701171875, 0.3533172607421875, 0.3868408203125, 0.4203643798828125, 0.453887939453125, 0.4874114990234375, 0.52093505859375, 0.5544586181640625, 0.587982177734375, 0.6215057373046875, 0.655029296875, 0.6885528564453125, 0.722076416015625, 0.7555999755859375, 0.78912353515625, 0.8226470947265625, 0.856170654296875, 0.8896942138671875, 0.9232177734375, 0.9567413330078125, 0.990264892578125, 1.0237884521484375, 1.05731201171875, 1.0908355712890625, 1.124359130859375, 1.1578826904296875, 1.19140625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 9.0, 9.0, 5.0, 12.0, 11.0, 12.0, 22.0, 18.0, 18.0, 31.0, 21.0, 33.0, 36.0, 37.0, 39.0, 45.0, 44.0, 50.0, 50.0, 52.0, 47.0, 46.0, 55.0, 44.0, 32.0, 30.0, 32.0, 26.0, 33.0, 17.0, 19.0, 19.0, 12.0, 16.0, 7.0, 3.0, 6.0, 5.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.958984375, -0.92181396484375, -0.8846435546875, -0.84747314453125, -0.810302734375, -0.77313232421875, -0.7359619140625, -0.69879150390625, -0.66162109375, -0.62445068359375, -0.5872802734375, -0.55010986328125, -0.512939453125, -0.47576904296875, -0.4385986328125, -0.40142822265625, -0.3642578125, -0.32708740234375, -0.2899169921875, -0.25274658203125, -0.215576171875, -0.17840576171875, -0.1412353515625, -0.10406494140625, -0.06689453125, -0.02972412109375, 0.0074462890625, 0.04461669921875, 0.081787109375, 0.11895751953125, 0.1561279296875, 0.19329833984375, 0.23046875, 0.26763916015625, 0.3048095703125, 0.34197998046875, 0.379150390625, 0.41632080078125, 0.4534912109375, 0.49066162109375, 0.52783203125, 0.56500244140625, 0.6021728515625, 0.63934326171875, 0.676513671875, 0.71368408203125, 0.7508544921875, 0.78802490234375, 0.8251953125, 0.86236572265625, 0.8995361328125, 0.93670654296875, 0.973876953125, 1.01104736328125, 1.0482177734375, 1.08538818359375, 1.12255859375, 1.15972900390625, 1.1968994140625, 1.23406982421875, 1.271240234375, 1.30841064453125, 1.3455810546875, 1.38275146484375, 1.419921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 10.0, 9.0, 13.0, 7.0, 19.0, 48.0, 82.0, 197.0, 397.0, 816.0, 2013.0, 4787.0, 12260.0, 34155.0, 99394.0, 236012.0, 320982.0, 208960.0, 82199.0, 28677.0, 10254.0, 4077.0, 1766.0, 759.0, 328.0, 162.0, 74.0, 32.0, 30.0, 17.0, 8.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.448486328125, -0.4321250915527344, -0.41576385498046875, -0.3994026184082031, -0.3830413818359375, -0.3666801452636719, -0.35031890869140625, -0.3339576721191406, -0.317596435546875, -0.3012351989746094, -0.28487396240234375, -0.2685127258300781, -0.2521514892578125, -0.23579025268554688, -0.21942901611328125, -0.20306777954101562, -0.18670654296875, -0.17034530639648438, -0.15398406982421875, -0.13762283325195312, -0.1212615966796875, -0.10490036010742188, -0.08853912353515625, -0.07217788696289062, -0.055816650390625, -0.039455413818359375, -0.02309417724609375, -0.006732940673828125, 0.0096282958984375, 0.025989532470703125, 0.04235076904296875, 0.058712005615234375, 0.0750732421875, 0.09143447875976562, 0.10779571533203125, 0.12415695190429688, 0.1405181884765625, 0.15687942504882812, 0.17324066162109375, 0.18960189819335938, 0.205963134765625, 0.22232437133789062, 0.23868560791015625, 0.2550468444824219, 0.2714080810546875, 0.2877693176269531, 0.30413055419921875, 0.3204917907714844, 0.33685302734375, 0.3532142639160156, 0.36957550048828125, 0.3859367370605469, 0.4022979736328125, 0.4186592102050781, 0.43502044677734375, 0.4513816833496094, 0.467742919921875, 0.4841041564941406, 0.5004653930664062, 0.5168266296386719, 0.5331878662109375, 0.5495491027832031, 0.5659103393554688, 0.5822715759277344, 0.5986328125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 0.0, 7.0, 5.0, 8.0, 7.0, 13.0, 19.0, 24.0, 25.0, 50.0, 44.0, 56.0, 87.0, 83.0, 109.0, 84.0, 70.0, 65.0, 67.0, 42.0, 28.0, 25.0, 15.0, 15.0, 13.0, 9.0, 4.0, 5.0, 8.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.826089859008789e-05, -7.57165253162384e-05, -7.317215204238892e-05, -7.062777876853943e-05, -6.808340549468994e-05, -6.553903222084045e-05, -6.299465894699097e-05, -6.045028567314148e-05, -5.790591239929199e-05, -5.5361539125442505e-05, -5.281716585159302e-05, -5.027279257774353e-05, -4.772841930389404e-05, -4.5184046030044556e-05, -4.263967275619507e-05, -4.009529948234558e-05, -3.7550926208496094e-05, -3.5006552934646606e-05, -3.246217966079712e-05, -2.9917806386947632e-05, -2.7373433113098145e-05, -2.4829059839248657e-05, -2.228468656539917e-05, -1.9740313291549683e-05, -1.7195940017700195e-05, -1.4651566743850708e-05, -1.210719347000122e-05, -9.562820196151733e-06, -7.018446922302246e-06, -4.474073648452759e-06, -1.9297003746032715e-06, 6.146728992462158e-07, 3.159046173095703e-06, 5.7034194469451904e-06, 8.247792720794678e-06, 1.0792165994644165e-05, 1.3336539268493652e-05, 1.588091254234314e-05, 1.8425285816192627e-05, 2.0969659090042114e-05, 2.35140323638916e-05, 2.605840563774109e-05, 2.8602778911590576e-05, 3.1147152185440063e-05, 3.369152545928955e-05, 3.623589873313904e-05, 3.8780272006988525e-05, 4.132464528083801e-05, 4.38690185546875e-05, 4.641339182853699e-05, 4.8957765102386475e-05, 5.150213837623596e-05, 5.404651165008545e-05, 5.6590884923934937e-05, 5.9135258197784424e-05, 6.167963147163391e-05, 6.42240047454834e-05, 6.676837801933289e-05, 6.931275129318237e-05, 7.185712456703186e-05, 7.440149784088135e-05, 7.694587111473083e-05, 7.949024438858032e-05, 8.203461766242981e-05, 8.45789909362793e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 8.0, 15.0, 20.0, 24.0, 40.0, 58.0, 94.0, 122.0, 209.0, 330.0, 601.0, 1144.0, 2371.0, 4896.0, 11223.0, 26294.0, 65318.0, 147358.0, 248767.0, 256503.0, 158782.0, 72057.0, 29202.0, 12090.0, 5548.0, 2545.0, 1275.0, 695.0, 355.0, 213.0, 116.0, 87.0, 63.0, 36.0, 26.0, 15.0, 16.0, 8.0, 6.0, 2.0, 6.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0], "bins": [-0.42626953125, -0.4137535095214844, -0.40123748779296875, -0.3887214660644531, -0.3762054443359375, -0.3636894226074219, -0.35117340087890625, -0.3386573791503906, -0.326141357421875, -0.3136253356933594, -0.30110931396484375, -0.2885932922363281, -0.2760772705078125, -0.2635612487792969, -0.25104522705078125, -0.23852920532226562, -0.22601318359375, -0.21349716186523438, -0.20098114013671875, -0.18846511840820312, -0.1759490966796875, -0.16343307495117188, -0.15091705322265625, -0.13840103149414062, -0.125885009765625, -0.11336898803710938, -0.10085296630859375, -0.08833694458007812, -0.0758209228515625, -0.06330490112304688, -0.05078887939453125, -0.038272857666015625, -0.0257568359375, -0.013240814208984375, -0.00072479248046875, 0.011791229248046875, 0.0243072509765625, 0.036823272705078125, 0.04933929443359375, 0.061855316162109375, 0.074371337890625, 0.08688735961914062, 0.09940338134765625, 0.11191940307617188, 0.1244354248046875, 0.13695144653320312, 0.14946746826171875, 0.16198348999023438, 0.17449951171875, 0.18701553344726562, 0.19953155517578125, 0.21204757690429688, 0.2245635986328125, 0.23707962036132812, 0.24959564208984375, 0.2621116638183594, 0.274627685546875, 0.2871437072753906, 0.29965972900390625, 0.3121757507324219, 0.3246917724609375, 0.3372077941894531, 0.34972381591796875, 0.3622398376464844, 0.374755859375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 1.0, 4.0, 9.0, 12.0, 11.0, 21.0, 23.0, 17.0, 26.0, 51.0, 41.0, 59.0, 60.0, 74.0, 69.0, 75.0, 72.0, 61.0, 51.0, 58.0, 40.0, 37.0, 24.0, 19.0, 17.0, 14.0, 11.0, 13.0, 6.0, 8.0, 8.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.303955078125, -0.2926979064941406, -0.28144073486328125, -0.2701835632324219, -0.2589263916015625, -0.24766921997070312, -0.23641204833984375, -0.22515487670898438, -0.213897705078125, -0.20264053344726562, -0.19138336181640625, -0.18012619018554688, -0.1688690185546875, -0.15761184692382812, -0.14635467529296875, -0.13509750366210938, -0.12384033203125, -0.11258316040039062, -0.10132598876953125, -0.09006881713867188, -0.0788116455078125, -0.06755447387695312, -0.05629730224609375, -0.045040130615234375, -0.033782958984375, -0.022525787353515625, -0.01126861572265625, -1.1444091796875e-05, 0.0112457275390625, 0.022502899169921875, 0.03376007080078125, 0.045017242431640625, 0.0562744140625, 0.06753158569335938, 0.07878875732421875, 0.09004592895507812, 0.1013031005859375, 0.11256027221679688, 0.12381744384765625, 0.13507461547851562, 0.146331787109375, 0.15758895874023438, 0.16884613037109375, 0.18010330200195312, 0.1913604736328125, 0.20261764526367188, 0.21387481689453125, 0.22513198852539062, 0.23638916015625, 0.24764633178710938, 0.25890350341796875, 0.2701606750488281, 0.2814178466796875, 0.2926750183105469, 0.30393218994140625, 0.3151893615722656, 0.326446533203125, 0.3377037048339844, 0.34896087646484375, 0.3602180480957031, 0.3714752197265625, 0.3827323913574219, 0.39398956298828125, 0.4052467346191406, 0.41650390625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 6.0, 25.0, 48.0, 104.0, 148.0, 207.0, 182.0, 129.0, 82.0, 47.0, 19.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.388137817382812, -12.13931655883789, -11.890495300292969, -11.641674041748047, -11.392852783203125, -11.144031524658203, -10.895210266113281, -10.64638900756836, -10.397568702697754, -10.148747444152832, -9.89992618560791, -9.651104927062988, -9.402283668518066, -9.153462409973145, -8.904642105102539, -8.655820846557617, -8.406998634338379, -8.158177375793457, -7.909356117248535, -7.660534858703613, -7.41171407699585, -7.162892818450928, -6.914071559906006, -6.665250301361084, -6.41642951965332, -6.167608261108398, -5.918787002563477, -5.669965744018555, -5.421144962310791, -5.172323703765869, -4.923502445220947, -4.674681186676025, -4.4258599281311035, -4.177038669586182, -3.928217649459839, -3.679396390914917, -3.430575132369995, -3.1817541122436523, -2.9329328536987305, -2.6841115951538086, -2.4352903366088867, -2.186469078063965, -1.9376479387283325, -1.6888267993927002, -1.4400055408477783, -1.191184401512146, -0.9423632621765137, -0.6935420036315918, -0.444720983505249, -0.19589979946613312, 0.05292138457298279, 0.3017425537109375, 0.5505637526512146, 0.7993849515914917, 1.048206090927124, 1.297027349472046, 1.5458484888076782, 1.7946696281433105, 2.0434908866882324, 2.2923121452331543, 2.541133165359497, 2.789954423904419, 3.0387754440307617, 3.2875967025756836, 3.5364179611206055]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 6.0, 5.0, 6.0, 5.0, 5.0, 7.0, 8.0, 5.0, 5.0, 9.0, 15.0, 12.0, 17.0, 17.0, 34.0, 22.0, 33.0, 28.0, 41.0, 39.0, 42.0, 43.0, 33.0, 36.0, 43.0, 41.0, 39.0, 33.0, 32.0, 28.0, 32.0, 38.0, 29.0, 23.0, 37.0, 27.0, 20.0, 18.0, 19.0, 16.0, 7.0, 9.0, 7.0, 8.0, 7.0, 8.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0], "bins": [-2.9885332584381104, -2.8936450481414795, -2.7987568378448486, -2.7038686275482178, -2.608980417251587, -2.514091968536377, -2.419203758239746, -2.3243155479431152, -2.2294273376464844, -2.1345391273498535, -2.0396509170532227, -1.9447627067565918, -1.8498743772506714, -1.7549861669540405, -1.6600979566574097, -1.5652096271514893, -1.470321536064148, -1.375433325767517, -1.2805451154708862, -1.1856567859649658, -1.090768575668335, -0.9958803653717041, -0.9009921550750732, -0.8061038851737976, -0.7112156748771667, -0.6163274645805359, -0.5214391946792603, -0.4265509843826294, -0.33166274428367615, -0.2367745041847229, -0.14188629388809204, -0.046998023986816406, 0.04789018630981445, 0.1427784264087677, 0.23766665160655975, 0.3325548768043518, 0.42744311690330505, 0.5223313570022583, 0.6172195672988892, 0.7121078372001648, 0.8069960474967957, 0.9018842577934265, 0.9967725276947021, 1.091660737991333, 1.1865489482879639, 1.2814371585845947, 1.3763253688812256, 1.471213698387146, 1.5661019086837769, 1.6609901189804077, 1.7558783292770386, 1.850766658782959, 1.9456548690795898, 2.0405430793762207, 2.1354312896728516, 2.2303194999694824, 2.3252077102661133, 2.420095920562744, 2.514984130859375, 2.609872341156006, 2.7047605514526367, 2.7996487617492676, 2.8945369720458984, 2.9894254207611084, 3.0843136310577393]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 13.0, 12.0, 8.0, 21.0, 25.0, 45.0, 59.0, 89.0, 144.0, 199.0, 311.0, 573.0, 926.0, 1688.0, 3105.0, 6042.0, 12151.0, 27385.0, 65085.0, 169752.0, 470981.0, 1076207.0, 1262998.0, 675644.0, 255110.0, 95398.0, 37986.0, 16321.0, 7657.0, 3794.0, 1971.0, 1073.0, 594.0, 331.0, 220.0, 123.0, 78.0, 51.0, 34.0, 29.0, 20.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.479736328125, -0.46570587158203125, -0.4516754150390625, -0.43764495849609375, -0.423614501953125, -0.40958404541015625, -0.3955535888671875, -0.38152313232421875, -0.36749267578125, -0.35346221923828125, -0.3394317626953125, -0.32540130615234375, -0.311370849609375, -0.29734039306640625, -0.2833099365234375, -0.26927947998046875, -0.2552490234375, -0.24121856689453125, -0.2271881103515625, -0.21315765380859375, -0.199127197265625, -0.18509674072265625, -0.1710662841796875, -0.15703582763671875, -0.14300537109375, -0.12897491455078125, -0.1149444580078125, -0.10091400146484375, -0.086883544921875, -0.07285308837890625, -0.0588226318359375, -0.04479217529296875, -0.03076171875, -0.01673126220703125, -0.0027008056640625, 0.01132965087890625, 0.025360107421875, 0.03939056396484375, 0.0534210205078125, 0.06745147705078125, 0.08148193359375, 0.09551239013671875, 0.1095428466796875, 0.12357330322265625, 0.137603759765625, 0.15163421630859375, 0.1656646728515625, 0.17969512939453125, 0.1937255859375, 0.20775604248046875, 0.2217864990234375, 0.23581695556640625, 0.249847412109375, 0.26387786865234375, 0.2779083251953125, 0.29193878173828125, 0.30596923828125, 0.31999969482421875, 0.3340301513671875, 0.34806060791015625, 0.362091064453125, 0.37612152099609375, 0.3901519775390625, 0.40418243408203125, 0.418212890625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 6.0, 10.0, 9.0, 13.0, 11.0, 20.0, 20.0, 34.0, 31.0, 37.0, 41.0, 50.0, 47.0, 59.0, 64.0, 75.0, 58.0, 48.0, 55.0, 52.0, 53.0, 30.0, 35.0, 34.0, 16.0, 21.0, 21.0, 14.0, 13.0, 4.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53515625, -0.5191383361816406, -0.5031204223632812, -0.4871025085449219, -0.4710845947265625, -0.4550666809082031, -0.43904876708984375, -0.4230308532714844, -0.407012939453125, -0.3909950256347656, -0.37497711181640625, -0.3589591979980469, -0.3429412841796875, -0.3269233703613281, -0.31090545654296875, -0.2948875427246094, -0.27886962890625, -0.2628517150878906, -0.24683380126953125, -0.23081588745117188, -0.2147979736328125, -0.19878005981445312, -0.18276214599609375, -0.16674423217773438, -0.150726318359375, -0.13470840454101562, -0.11869049072265625, -0.10267257690429688, -0.0866546630859375, -0.07063674926757812, -0.05461883544921875, -0.038600921630859375, -0.0225830078125, -0.006565093994140625, 0.00945281982421875, 0.025470733642578125, 0.0414886474609375, 0.057506561279296875, 0.07352447509765625, 0.08954238891601562, 0.105560302734375, 0.12157821655273438, 0.13759613037109375, 0.15361404418945312, 0.1696319580078125, 0.18564987182617188, 0.20166778564453125, 0.21768569946289062, 0.23370361328125, 0.24972152709960938, 0.26573944091796875, 0.2817573547363281, 0.2977752685546875, 0.3137931823730469, 0.32981109619140625, 0.3458290100097656, 0.361846923828125, 0.3778648376464844, 0.39388275146484375, 0.4099006652832031, 0.4259185791015625, 0.4419364929199219, 0.45795440673828125, 0.4739723205566406, 0.489990234375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 5.0, 8.0, 10.0, 20.0, 16.0, 33.0, 35.0, 52.0, 70.0, 119.0, 155.0, 292.0, 590.0, 1201.0, 3176.0, 9829.0, 35015.0, 138618.0, 540741.0, 1536555.0, 1350858.0, 428386.0, 107901.0, 27770.0, 7874.0, 2573.0, 1050.0, 495.0, 281.0, 159.0, 113.0, 76.0, 51.0, 32.0, 27.0, 30.0, 14.0, 10.0, 12.0, 12.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.86376953125, -0.8390274047851562, -0.8142852783203125, -0.7895431518554688, -0.764801025390625, -0.7400588989257812, -0.7153167724609375, -0.6905746459960938, -0.66583251953125, -0.6410903930664062, -0.6163482666015625, -0.5916061401367188, -0.566864013671875, -0.5421218872070312, -0.5173797607421875, -0.49263763427734375, -0.4678955078125, -0.44315338134765625, -0.4184112548828125, -0.39366912841796875, -0.368927001953125, -0.34418487548828125, -0.3194427490234375, -0.29470062255859375, -0.26995849609375, -0.24521636962890625, -0.2204742431640625, -0.19573211669921875, -0.170989990234375, -0.14624786376953125, -0.1215057373046875, -0.09676361083984375, -0.072021484375, -0.04727935791015625, -0.0225372314453125, 0.00220489501953125, 0.026947021484375, 0.05168914794921875, 0.0764312744140625, 0.10117340087890625, 0.12591552734375, 0.15065765380859375, 0.1753997802734375, 0.20014190673828125, 0.224884033203125, 0.24962615966796875, 0.2743682861328125, 0.29911041259765625, 0.3238525390625, 0.34859466552734375, 0.3733367919921875, 0.39807891845703125, 0.422821044921875, 0.44756317138671875, 0.4723052978515625, 0.49704742431640625, 0.52178955078125, 0.5465316772460938, 0.5712738037109375, 0.5960159301757812, 0.620758056640625, 0.6455001831054688, 0.6702423095703125, 0.6949844360351562, 0.7197265625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 11.0, 12.0, 18.0, 17.0, 25.0, 36.0, 49.0, 57.0, 71.0, 91.0, 100.0, 123.0, 126.0, 173.0, 209.0, 227.0, 267.0, 283.0, 291.0, 278.0, 276.0, 220.0, 199.0, 171.0, 141.0, 116.0, 107.0, 70.0, 63.0, 60.0, 39.0, 27.0, 26.0, 18.0, 20.0, 15.0, 5.0, 5.0, 4.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.492431640625, -0.4762458801269531, -0.46006011962890625, -0.4438743591308594, -0.4276885986328125, -0.4115028381347656, -0.39531707763671875, -0.3791313171386719, -0.362945556640625, -0.3467597961425781, -0.33057403564453125, -0.3143882751464844, -0.2982025146484375, -0.2820167541503906, -0.26583099365234375, -0.24964523315429688, -0.23345947265625, -0.21727371215820312, -0.20108795166015625, -0.18490219116210938, -0.1687164306640625, -0.15253067016601562, -0.13634490966796875, -0.12015914916992188, -0.103973388671875, -0.08778762817382812, -0.07160186767578125, -0.055416107177734375, -0.0392303466796875, -0.023044586181640625, -0.00685882568359375, 0.009326934814453125, 0.0255126953125, 0.041698455810546875, 0.05788421630859375, 0.07406997680664062, 0.0902557373046875, 0.10644149780273438, 0.12262725830078125, 0.13881301879882812, 0.154998779296875, 0.17118453979492188, 0.18737030029296875, 0.20355606079101562, 0.2197418212890625, 0.23592758178710938, 0.25211334228515625, 0.2682991027832031, 0.28448486328125, 0.3006706237792969, 0.31685638427734375, 0.3330421447753906, 0.3492279052734375, 0.3654136657714844, 0.38159942626953125, 0.3977851867675781, 0.413970947265625, 0.4301567077636719, 0.44634246826171875, 0.4625282287597656, 0.4787139892578125, 0.4948997497558594, 0.5110855102539062, 0.5272712707519531, 0.54345703125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 6.0, 10.0, 14.0, 21.0, 25.0, 31.0, 39.0, 51.0, 59.0, 68.0, 70.0, 86.0, 77.0, 87.0, 65.0, 58.0, 51.0, 41.0, 40.0, 25.0, 24.0, 17.0, 13.0, 8.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.6794261932373047, -3.589672088623047, -3.49991774559021, -3.410163640975952, -3.3204092979431152, -3.2306551933288574, -3.1409010887145996, -3.051146984100342, -2.961392641067505, -2.871638536453247, -2.78188419342041, -2.6921300888061523, -2.6023759841918945, -2.5126216411590576, -2.4228675365448, -2.333113193511963, -2.243359088897705, -2.1536049842834473, -2.0638506412506104, -1.9740965366363525, -1.8843423128128052, -1.7945880889892578, -1.704833984375, -1.6150797605514526, -1.5253255367279053, -1.435571312904358, -1.3458170890808105, -1.2560629844665527, -1.1663087606430054, -1.076554536819458, -0.9868003726005554, -0.8970462083816528, -0.8072919845581055, -0.7175377607345581, -0.6277835965156555, -0.5380294322967529, -0.44827520847320557, -0.3585210144519806, -0.2687668204307556, -0.17901265621185303, -0.08925843238830566, 0.0004957616329193115, 0.09024995565414429, 0.18000414967536926, 0.26975834369659424, 0.3595125377178192, 0.4492667317390442, 0.5390208959579468, 0.6287751197814941, 0.7185293436050415, 0.8082835078239441, 0.8980376720428467, 0.987791895866394, 1.0775461196899414, 1.1673002243041992, 1.2570544481277466, 1.346808671951294, 1.4365628957748413, 1.5263171195983887, 1.6160712242126465, 1.7058254480361938, 1.7955796718597412, 1.885333776473999, 1.9750880002975464, 2.0648422241210938]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 9.0, 7.0, 7.0, 7.0, 4.0, 7.0, 10.0, 11.0, 11.0, 21.0, 14.0, 22.0, 23.0, 17.0, 25.0, 34.0, 27.0, 36.0, 37.0, 41.0, 32.0, 40.0, 44.0, 35.0, 46.0, 42.0, 44.0, 36.0, 34.0, 32.0, 31.0, 29.0, 28.0, 25.0, 24.0, 21.0, 12.0, 20.0, 16.0, 8.0, 12.0, 3.0, 8.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0], "bins": [-2.5613512992858887, -2.492141008377075, -2.4229307174682617, -2.3537204265594482, -2.2845101356506348, -2.2152998447418213, -2.146089553833008, -2.0768795013427734, -2.007668972015381, -1.9384586811065674, -1.869248390197754, -1.8000380992889404, -1.730827808380127, -1.6616175174713135, -1.5924073457717896, -1.523197054862976, -1.4539868831634521, -1.3847765922546387, -1.3155663013458252, -1.2463560104370117, -1.1771457195281982, -1.1079354286193848, -1.0387252569198608, -0.9695149660110474, -0.9003046751022339, -0.8310943841934204, -0.7618840932846069, -0.6926738619804382, -0.6234635710716248, -0.5542532801628113, -0.4850430190563202, -0.4158327579498291, -0.3466227054595947, -0.27741241455078125, -0.20820215344429016, -0.13899187743663788, -0.0697816014289856, -0.0005713105201721191, 0.06863895058631897, 0.13784921169281006, 0.20705950260162354, 0.276269793510437, 0.3454800546169281, 0.4146903157234192, 0.48390060663223267, 0.5531108975410461, 0.6223211288452148, 0.6915314197540283, 0.7607417106628418, 0.8299520015716553, 0.8991622924804688, 0.9683725237846375, 1.0375828742980957, 1.1067931652069092, 1.176003336906433, 1.2452136278152466, 1.31442391872406, 1.3836342096328735, 1.452844500541687, 1.5220547914505005, 1.5912649631500244, 1.660475254058838, 1.7296855449676514, 1.7988958358764648, 1.8681061267852783]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 6.0, 9.0, 13.0, 7.0, 37.0, 52.0, 66.0, 138.0, 253.0, 455.0, 874.0, 1829.0, 3839.0, 8595.0, 19468.0, 43830.0, 97181.0, 196031.0, 274057.0, 209025.0, 105998.0, 47818.0, 21241.0, 9435.0, 4207.0, 1954.0, 987.0, 491.0, 273.0, 157.0, 79.0, 42.0, 29.0, 17.0, 11.0, 16.0, 12.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0048828125, -0.9730377197265625, -0.941192626953125, -0.9093475341796875, -0.87750244140625, -0.8456573486328125, -0.813812255859375, -0.7819671630859375, -0.7501220703125, -0.7182769775390625, -0.686431884765625, -0.6545867919921875, -0.62274169921875, -0.5908966064453125, -0.559051513671875, -0.5272064208984375, -0.495361328125, -0.4635162353515625, -0.431671142578125, -0.3998260498046875, -0.36798095703125, -0.3361358642578125, -0.304290771484375, -0.2724456787109375, -0.2406005859375, -0.2087554931640625, -0.176910400390625, -0.1450653076171875, -0.11322021484375, -0.0813751220703125, -0.049530029296875, -0.0176849365234375, 0.01416015625, 0.0460052490234375, 0.077850341796875, 0.1096954345703125, 0.14154052734375, 0.1733856201171875, 0.205230712890625, 0.2370758056640625, 0.2689208984375, 0.3007659912109375, 0.332611083984375, 0.3644561767578125, 0.39630126953125, 0.4281463623046875, 0.459991455078125, 0.4918365478515625, 0.523681640625, 0.5555267333984375, 0.587371826171875, 0.6192169189453125, 0.65106201171875, 0.6829071044921875, 0.714752197265625, 0.7465972900390625, 0.7784423828125, 0.8102874755859375, 0.842132568359375, 0.8739776611328125, 0.90582275390625, 0.9376678466796875, 0.969512939453125, 1.0013580322265625, 1.033203125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 5.0, 8.0, 9.0, 14.0, 16.0, 15.0, 29.0, 14.0, 31.0, 38.0, 36.0, 50.0, 52.0, 47.0, 52.0, 39.0, 39.0, 58.0, 66.0, 34.0, 33.0, 48.0, 39.0, 35.0, 28.0, 40.0, 21.0, 15.0, 17.0, 10.0, 10.0, 12.0, 8.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.470703125, -0.4573249816894531, -0.44394683837890625, -0.4305686950683594, -0.4171905517578125, -0.4038124084472656, -0.39043426513671875, -0.3770561218261719, -0.363677978515625, -0.3502998352050781, -0.33692169189453125, -0.3235435485839844, -0.3101654052734375, -0.2967872619628906, -0.28340911865234375, -0.2700309753417969, -0.25665283203125, -0.24327468872070312, -0.22989654541015625, -0.21651840209960938, -0.2031402587890625, -0.18976211547851562, -0.17638397216796875, -0.16300582885742188, -0.149627685546875, -0.13624954223632812, -0.12287139892578125, -0.10949325561523438, -0.0961151123046875, -0.08273696899414062, -0.06935882568359375, -0.055980682373046875, -0.0426025390625, -0.029224395751953125, -0.01584625244140625, -0.002468109130859375, 0.0109100341796875, 0.024288177490234375, 0.03766632080078125, 0.051044464111328125, 0.064422607421875, 0.07780075073242188, 0.09117889404296875, 0.10455703735351562, 0.1179351806640625, 0.13131332397460938, 0.14469146728515625, 0.15806961059570312, 0.17144775390625, 0.18482589721679688, 0.19820404052734375, 0.21158218383789062, 0.2249603271484375, 0.23833847045898438, 0.25171661376953125, 0.2650947570800781, 0.278472900390625, 0.2918510437011719, 0.30522918701171875, 0.3186073303222656, 0.3319854736328125, 0.3453636169433594, 0.35874176025390625, 0.3721199035644531, 0.385498046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 4.0, 5.0, 6.0, 10.0, 12.0, 18.0, 35.0, 43.0, 42.0, 63.0, 169.0, 373.0, 1042.0, 3245.0, 9928.0, 29478.0, 82580.0, 204087.0, 326671.0, 235527.0, 100307.0, 36708.0, 12172.0, 3911.0, 1283.0, 411.0, 168.0, 76.0, 47.0, 29.0, 25.0, 30.0, 11.0, 6.0, 9.0, 6.0, 4.0, 6.0, 2.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3916015625, -1.35137939453125, -1.3111572265625, -1.27093505859375, -1.230712890625, -1.19049072265625, -1.1502685546875, -1.11004638671875, -1.06982421875, -1.02960205078125, -0.9893798828125, -0.94915771484375, -0.908935546875, -0.86871337890625, -0.8284912109375, -0.78826904296875, -0.748046875, -0.70782470703125, -0.6676025390625, -0.62738037109375, -0.587158203125, -0.54693603515625, -0.5067138671875, -0.46649169921875, -0.42626953125, -0.38604736328125, -0.3458251953125, -0.30560302734375, -0.265380859375, -0.22515869140625, -0.1849365234375, -0.14471435546875, -0.1044921875, -0.06427001953125, -0.0240478515625, 0.01617431640625, 0.056396484375, 0.09661865234375, 0.1368408203125, 0.17706298828125, 0.21728515625, 0.25750732421875, 0.2977294921875, 0.33795166015625, 0.378173828125, 0.41839599609375, 0.4586181640625, 0.49884033203125, 0.5390625, 0.57928466796875, 0.6195068359375, 0.65972900390625, 0.699951171875, 0.74017333984375, 0.7803955078125, 0.82061767578125, 0.86083984375, 0.90106201171875, 0.9412841796875, 0.98150634765625, 1.021728515625, 1.06195068359375, 1.1021728515625, 1.14239501953125, 1.1826171875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 4.0, 5.0, 5.0, 4.0, 8.0, 11.0, 19.0, 18.0, 18.0, 20.0, 21.0, 31.0, 26.0, 37.0, 39.0, 46.0, 47.0, 41.0, 58.0, 32.0, 57.0, 55.0, 46.0, 52.0, 38.0, 39.0, 22.0, 34.0, 35.0, 20.0, 32.0, 16.0, 13.0, 15.0, 20.0, 5.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.15234375, -1.1149444580078125, -1.077545166015625, -1.0401458740234375, -1.00274658203125, -0.9653472900390625, -0.927947998046875, -0.8905487060546875, -0.8531494140625, -0.8157501220703125, -0.778350830078125, -0.7409515380859375, -0.70355224609375, -0.6661529541015625, -0.628753662109375, -0.5913543701171875, -0.553955078125, -0.5165557861328125, -0.479156494140625, -0.4417572021484375, -0.40435791015625, -0.3669586181640625, -0.329559326171875, -0.2921600341796875, -0.2547607421875, -0.2173614501953125, -0.179962158203125, -0.1425628662109375, -0.10516357421875, -0.0677642822265625, -0.030364990234375, 0.0070343017578125, 0.04443359375, 0.0818328857421875, 0.119232177734375, 0.1566314697265625, 0.19403076171875, 0.2314300537109375, 0.268829345703125, 0.3062286376953125, 0.3436279296875, 0.3810272216796875, 0.418426513671875, 0.4558258056640625, 0.49322509765625, 0.5306243896484375, 0.568023681640625, 0.6054229736328125, 0.642822265625, 0.6802215576171875, 0.717620849609375, 0.7550201416015625, 0.79241943359375, 0.8298187255859375, 0.867218017578125, 0.9046173095703125, 0.9420166015625, 0.9794158935546875, 1.016815185546875, 1.0542144775390625, 1.09161376953125, 1.1290130615234375, 1.166412353515625, 1.2038116455078125, 1.2412109375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 8.0, 18.0, 21.0, 45.0, 75.0, 88.0, 151.0, 187.0, 323.0, 483.0, 747.0, 1235.0, 1873.0, 3319.0, 5444.0, 9396.0, 16770.0, 29674.0, 52589.0, 88941.0, 135154.0, 173681.0, 173389.0, 138407.0, 90882.0, 53949.0, 30305.0, 17104.0, 9796.0, 5739.0, 3367.0, 1981.0, 1233.0, 800.0, 447.0, 329.0, 193.0, 151.0, 103.0, 48.0, 44.0, 24.0, 14.0, 7.0, 12.0, 1.0, 7.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.296875, -0.28839874267578125, -0.2799224853515625, -0.27144622802734375, -0.262969970703125, -0.25449371337890625, -0.2460174560546875, -0.23754119873046875, -0.22906494140625, -0.22058868408203125, -0.2121124267578125, -0.20363616943359375, -0.195159912109375, -0.18668365478515625, -0.1782073974609375, -0.16973114013671875, -0.1612548828125, -0.15277862548828125, -0.1443023681640625, -0.13582611083984375, -0.127349853515625, -0.11887359619140625, -0.1103973388671875, -0.10192108154296875, -0.09344482421875, -0.08496856689453125, -0.0764923095703125, -0.06801605224609375, -0.059539794921875, -0.05106353759765625, -0.0425872802734375, -0.03411102294921875, -0.025634765625, -0.01715850830078125, -0.0086822509765625, -0.00020599365234375, 0.008270263671875, 0.01674652099609375, 0.0252227783203125, 0.03369903564453125, 0.04217529296875, 0.05065155029296875, 0.0591278076171875, 0.06760406494140625, 0.076080322265625, 0.08455657958984375, 0.0930328369140625, 0.10150909423828125, 0.1099853515625, 0.11846160888671875, 0.1269378662109375, 0.13541412353515625, 0.143890380859375, 0.15236663818359375, 0.1608428955078125, 0.16931915283203125, 0.17779541015625, 0.18627166748046875, 0.1947479248046875, 0.20322418212890625, 0.211700439453125, 0.22017669677734375, 0.2286529541015625, 0.23712921142578125, 0.24560546875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 1.0, 4.0, 7.0, 2.0, 14.0, 10.0, 16.0, 16.0, 17.0, 22.0, 36.0, 50.0, 52.0, 84.0, 92.0, 96.0, 97.0, 82.0, 64.0, 62.0, 41.0, 35.0, 18.0, 22.0, 17.0, 9.0, 7.0, 9.0, 4.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00010991096496582031, -0.0001071607694029808, -0.0001044105738401413, -0.00010166037827730179, -9.891018271446228e-05, -9.615998715162277e-05, -9.340979158878326e-05, -9.065959602594376e-05, -8.790940046310425e-05, -8.515920490026474e-05, -8.240900933742523e-05, -7.965881377458572e-05, -7.690861821174622e-05, -7.415842264890671e-05, -7.14082270860672e-05, -6.865803152322769e-05, -6.590783596038818e-05, -6.315764039754868e-05, -6.040744483470917e-05, -5.765724927186966e-05, -5.490705370903015e-05, -5.215685814619064e-05, -4.9406662583351135e-05, -4.665646702051163e-05, -4.390627145767212e-05, -4.115607589483261e-05, -3.84058803319931e-05, -3.5655684769153595e-05, -3.290548920631409e-05, -3.015529364347458e-05, -2.740509808063507e-05, -2.4654902517795563e-05, -2.1904706954956055e-05, -1.9154511392116547e-05, -1.640431582927704e-05, -1.365412026643753e-05, -1.0903924703598022e-05, -8.153729140758514e-06, -5.403533577919006e-06, -2.6533380150794983e-06, 9.685754776000977e-08, 2.847053110599518e-06, 5.597248673439026e-06, 8.347444236278534e-06, 1.1097639799118042e-05, 1.384783536195755e-05, 1.6598030924797058e-05, 1.9348226487636566e-05, 2.2098422050476074e-05, 2.4848617613315582e-05, 2.759881317615509e-05, 3.03490087389946e-05, 3.3099204301834106e-05, 3.5849399864673615e-05, 3.859959542751312e-05, 4.134979099035263e-05, 4.409998655319214e-05, 4.685018211603165e-05, 4.9600377678871155e-05, 5.235057324171066e-05, 5.510076880455017e-05, 5.785096436738968e-05, 6.060115993022919e-05, 6.33513554930687e-05, 6.61015510559082e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 7.0, 2.0, 6.0, 11.0, 14.0, 8.0, 20.0, 26.0, 39.0, 61.0, 108.0, 169.0, 336.0, 554.0, 980.0, 1802.0, 3290.0, 5892.0, 11420.0, 21717.0, 42444.0, 78449.0, 130344.0, 181681.0, 193815.0, 156232.0, 100307.0, 56330.0, 29739.0, 15285.0, 7879.0, 4342.0, 2267.0, 1269.0, 689.0, 411.0, 225.0, 142.0, 85.0, 42.0, 40.0, 25.0, 14.0, 14.0, 12.0, 6.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2445068359375, -0.2364177703857422, -0.22832870483398438, -0.22023963928222656, -0.21215057373046875, -0.20406150817871094, -0.19597244262695312, -0.1878833770751953, -0.1797943115234375, -0.1717052459716797, -0.16361618041992188, -0.15552711486816406, -0.14743804931640625, -0.13934898376464844, -0.13125991821289062, -0.12317085266113281, -0.115081787109375, -0.10699272155761719, -0.09890365600585938, -0.09081459045410156, -0.08272552490234375, -0.07463645935058594, -0.06654739379882812, -0.05845832824707031, -0.0503692626953125, -0.04228019714355469, -0.034191131591796875, -0.026102066040039062, -0.01801300048828125, -0.009923934936523438, -0.001834869384765625, 0.0062541961669921875, 0.01434326171875, 0.022432327270507812, 0.030521392822265625, 0.03861045837402344, 0.04669952392578125, 0.05478858947753906, 0.06287765502929688, 0.07096672058105469, 0.0790557861328125, 0.08714485168457031, 0.09523391723632812, 0.10332298278808594, 0.11141204833984375, 0.11950111389160156, 0.12759017944335938, 0.1356792449951172, 0.143768310546875, 0.1518573760986328, 0.15994644165039062, 0.16803550720214844, 0.17612457275390625, 0.18421363830566406, 0.19230270385742188, 0.2003917694091797, 0.2084808349609375, 0.2165699005126953, 0.22465896606445312, 0.23274803161621094, 0.24083709716796875, 0.24892616271972656, 0.2570152282714844, 0.2651042938232422, 0.273193359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 5.0, 7.0, 7.0, 7.0, 10.0, 14.0, 14.0, 12.0, 16.0, 17.0, 15.0, 26.0, 31.0, 32.0, 42.0, 38.0, 30.0, 43.0, 38.0, 48.0, 42.0, 48.0, 44.0, 29.0, 35.0, 46.0, 36.0, 39.0, 28.0, 32.0, 18.0, 34.0, 25.0, 16.0, 11.0, 10.0, 9.0, 7.0, 2.0, 4.0, 5.0, 8.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.207763671875, -0.2012042999267578, -0.19464492797851562, -0.18808555603027344, -0.18152618408203125, -0.17496681213378906, -0.16840744018554688, -0.1618480682373047, -0.1552886962890625, -0.1487293243408203, -0.14216995239257812, -0.13561058044433594, -0.12905120849609375, -0.12249183654785156, -0.11593246459960938, -0.10937309265136719, -0.102813720703125, -0.09625434875488281, -0.08969497680664062, -0.08313560485839844, -0.07657623291015625, -0.07001686096191406, -0.06345748901367188, -0.05689811706542969, -0.0503387451171875, -0.04377937316894531, -0.037220001220703125, -0.030660629272460938, -0.02410125732421875, -0.017541885375976562, -0.010982513427734375, -0.0044231414794921875, 0.00213623046875, 0.008695602416992188, 0.015254974365234375, 0.021814346313476562, 0.02837371826171875, 0.03493309020996094, 0.041492462158203125, 0.04805183410644531, 0.0546112060546875, 0.06117057800292969, 0.06772994995117188, 0.07428932189941406, 0.08084869384765625, 0.08740806579589844, 0.09396743774414062, 0.10052680969238281, 0.107086181640625, 0.11364555358886719, 0.12020492553710938, 0.12676429748535156, 0.13332366943359375, 0.13988304138183594, 0.14644241333007812, 0.1530017852783203, 0.1595611572265625, 0.1661205291748047, 0.17267990112304688, 0.17923927307128906, 0.18579864501953125, 0.19235801696777344, 0.19891738891601562, 0.2054767608642578, 0.2120361328125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 6.0, 8.0, 13.0, 36.0, 46.0, 69.0, 101.0, 114.0, 120.0, 122.0, 92.0, 93.0, 70.0, 54.0, 22.0, 22.0, 10.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.383004188537598, -4.220355033874512, -4.057705879211426, -3.8950564861297607, -3.7324070930480957, -3.5697579383850098, -3.407108783721924, -3.244459629058838, -3.081810235977173, -2.919161081314087, -2.756511688232422, -2.593862533569336, -2.43121337890625, -2.268563985824585, -2.105914831161499, -1.9432655572891235, -1.780616283416748, -1.6179670095443726, -1.455317735671997, -1.2926685810089111, -1.1300193071365356, -0.9673700332641602, -0.8047208189964294, -0.6420716047286987, -0.47942233085632324, -0.31677308678627014, -0.15412384271621704, 0.00852540135383606, 0.17117464542388916, 0.33382391929626465, 0.49647313356399536, 0.6591223478317261, 0.8217716217041016, 0.984420895576477, 1.1470701694488525, 1.3097193241119385, 1.472368597984314, 1.6350178718566895, 1.7976670265197754, 1.9603163003921509, 2.1229655742645264, 2.2856147289276123, 2.4482641220092773, 2.6109132766723633, 2.773562431335449, 2.9362118244171143, 3.0988609790802, 3.2615103721618652, 3.424159526824951, 3.586808681488037, 3.749458074569702, 3.912107229232788, 4.074756622314453, 4.237405776977539, 4.400054931640625, 4.562704086303711, 4.725353240966797, 4.888002395629883, 5.050651550292969, 5.213301181793213, 5.375950336456299, 5.538599491119385, 5.701248645782471, 5.863897800445557, 6.026547431945801]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 6.0, 6.0, 7.0, 2.0, 5.0, 13.0, 11.0, 13.0, 25.0, 14.0, 27.0, 23.0, 28.0, 29.0, 34.0, 43.0, 42.0, 47.0, 43.0, 45.0, 49.0, 45.0, 43.0, 53.0, 38.0, 45.0, 46.0, 32.0, 31.0, 21.0, 22.0, 29.0, 23.0, 12.0, 12.0, 12.0, 9.0, 5.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.866793632507324, -2.7603862285614014, -2.6539788246154785, -2.5475716590881348, -2.441164255142212, -2.334756851196289, -2.228349447250366, -2.1219420433044434, -2.0155346393585205, -1.9091272354125977, -1.8027199506759644, -1.6963125467300415, -1.5899051427841187, -1.4834978580474854, -1.3770904541015625, -1.2706830501556396, -1.1642757654190063, -1.0578683614730835, -0.9514610171318054, -0.8450536727905273, -0.7386462688446045, -0.6322389245033264, -0.5258315801620483, -0.4194241762161255, -0.3130168318748474, -0.20660945773124695, -0.10020209848880768, 0.006205260753631592, 0.11261263489723206, 0.21902000904083252, 0.3254273533821106, 0.43183475732803345, 0.5382421016693115, 0.6446494460105896, 0.7510568499565125, 0.8574641942977905, 0.9638715982437134, 1.0702788829803467, 1.1766862869262695, 1.2830936908721924, 1.3895010948181152, 1.495908498764038, 1.6023157835006714, 1.7087231874465942, 1.815130591392517, 1.9215378761291504, 2.0279452800750732, 2.134352684020996, 2.24075984954834, 2.3471672534942627, 2.4535746574401855, 2.5599818229675293, 2.666389226913452, 2.772796630859375, 2.879204034805298, 2.9856114387512207, 3.0920188426971436, 3.1984262466430664, 3.3048336505889893, 3.411241054534912, 3.517648220062256, 3.6240556240081787, 3.7304630279541016, 3.8368704319000244, 3.9432778358459473]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 6.0, 11.0, 11.0, 14.0, 27.0, 38.0, 61.0, 109.0, 166.0, 359.0, 723.0, 1498.0, 3624.0, 10434.0, 32787.0, 128458.0, 623547.0, 1930775.0, 1137777.0, 242096.0, 56370.0, 16051.0, 5387.0, 2075.0, 934.0, 416.0, 214.0, 108.0, 74.0, 49.0, 31.0, 19.0, 10.0, 5.0, 9.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.8447265625, -0.8210678100585938, -0.7974090576171875, -0.7737503051757812, -0.750091552734375, -0.7264328002929688, -0.7027740478515625, -0.6791152954101562, -0.65545654296875, -0.6317977905273438, -0.6081390380859375, -0.5844802856445312, -0.560821533203125, -0.5371627807617188, -0.5135040283203125, -0.48984527587890625, -0.4661865234375, -0.44252777099609375, -0.4188690185546875, -0.39521026611328125, -0.371551513671875, -0.34789276123046875, -0.3242340087890625, -0.30057525634765625, -0.27691650390625, -0.25325775146484375, -0.2295989990234375, -0.20594024658203125, -0.182281494140625, -0.15862274169921875, -0.1349639892578125, -0.11130523681640625, -0.087646484375, -0.06398773193359375, -0.0403289794921875, -0.01667022705078125, 0.006988525390625, 0.03064727783203125, 0.0543060302734375, 0.07796478271484375, 0.10162353515625, 0.12528228759765625, 0.1489410400390625, 0.17259979248046875, 0.196258544921875, 0.21991729736328125, 0.2435760498046875, 0.26723480224609375, 0.2908935546875, 0.31455230712890625, 0.3382110595703125, 0.36186981201171875, 0.385528564453125, 0.40918731689453125, 0.4328460693359375, 0.45650482177734375, 0.48016357421875, 0.5038223266601562, 0.5274810791015625, 0.5511398315429688, 0.574798583984375, 0.5984573364257812, 0.6221160888671875, 0.6457748413085938, 0.66943359375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 2.0, 11.0, 9.0, 13.0, 21.0, 22.0, 24.0, 21.0, 30.0, 39.0, 49.0, 50.0, 44.0, 46.0, 50.0, 59.0, 62.0, 52.0, 51.0, 56.0, 49.0, 51.0, 38.0, 28.0, 22.0, 17.0, 19.0, 23.0, 14.0, 10.0, 4.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5439453125, -0.5283355712890625, -0.512725830078125, -0.4971160888671875, -0.48150634765625, -0.4658966064453125, -0.450286865234375, -0.4346771240234375, -0.4190673828125, -0.4034576416015625, -0.387847900390625, -0.3722381591796875, -0.35662841796875, -0.3410186767578125, -0.325408935546875, -0.3097991943359375, -0.294189453125, -0.2785797119140625, -0.262969970703125, -0.2473602294921875, -0.23175048828125, -0.2161407470703125, -0.200531005859375, -0.1849212646484375, -0.1693115234375, -0.1537017822265625, -0.138092041015625, -0.1224822998046875, -0.10687255859375, -0.0912628173828125, -0.075653076171875, -0.0600433349609375, -0.04443359375, -0.0288238525390625, -0.013214111328125, 0.0023956298828125, 0.01800537109375, 0.0336151123046875, 0.049224853515625, 0.0648345947265625, 0.0804443359375, 0.0960540771484375, 0.111663818359375, 0.1272735595703125, 0.14288330078125, 0.1584930419921875, 0.174102783203125, 0.1897125244140625, 0.205322265625, 0.2209320068359375, 0.236541748046875, 0.2521514892578125, 0.26776123046875, 0.2833709716796875, 0.298980712890625, 0.3145904541015625, 0.3302001953125, 0.3458099365234375, 0.361419677734375, 0.3770294189453125, 0.39263916015625, 0.4082489013671875, 0.423858642578125, 0.4394683837890625, 0.455078125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 9.0, 5.0, 6.0, 4.0, 24.0, 12.0, 21.0, 42.0, 88.0, 105.0, 198.0, 303.0, 630.0, 1663.0, 5310.0, 21206.0, 99808.0, 509278.0, 1802500.0, 1360621.0, 311737.0, 61228.0, 13424.0, 3592.0, 1243.0, 530.0, 260.0, 163.0, 98.0, 60.0, 34.0, 21.0, 15.0, 20.0, 12.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.1640625, -1.1348495483398438, -1.1056365966796875, -1.0764236450195312, -1.047210693359375, -1.0179977416992188, -0.9887847900390625, -0.9595718383789062, -0.93035888671875, -0.9011459350585938, -0.8719329833984375, -0.8427200317382812, -0.813507080078125, -0.7842941284179688, -0.7550811767578125, -0.7258682250976562, -0.6966552734375, -0.6674423217773438, -0.6382293701171875, -0.6090164184570312, -0.579803466796875, -0.5505905151367188, -0.5213775634765625, -0.49216461181640625, -0.46295166015625, -0.43373870849609375, -0.4045257568359375, -0.37531280517578125, -0.346099853515625, -0.31688690185546875, -0.2876739501953125, -0.25846099853515625, -0.229248046875, -0.20003509521484375, -0.1708221435546875, -0.14160919189453125, -0.112396240234375, -0.08318328857421875, -0.0539703369140625, -0.02475738525390625, 0.00445556640625, 0.03366851806640625, 0.0628814697265625, 0.09209442138671875, 0.121307373046875, 0.15052032470703125, 0.1797332763671875, 0.20894622802734375, 0.2381591796875, 0.26737213134765625, 0.2965850830078125, 0.32579803466796875, 0.355010986328125, 0.38422393798828125, 0.4134368896484375, 0.44264984130859375, 0.47186279296875, 0.5010757446289062, 0.5302886962890625, 0.5595016479492188, 0.588714599609375, 0.6179275512695312, 0.6471405029296875, 0.6763534545898438, 0.70556640625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 12.0, 17.0, 20.0, 25.0, 33.0, 43.0, 60.0, 69.0, 122.0, 152.0, 172.0, 198.0, 270.0, 303.0, 356.0, 357.0, 318.0, 294.0, 257.0, 213.0, 171.0, 163.0, 110.0, 76.0, 73.0, 37.0, 39.0, 32.0, 30.0, 11.0, 6.0, 10.0, 4.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54736328125, -0.5281143188476562, -0.5088653564453125, -0.48961639404296875, -0.470367431640625, -0.45111846923828125, -0.4318695068359375, -0.41262054443359375, -0.39337158203125, -0.37412261962890625, -0.3548736572265625, -0.33562469482421875, -0.316375732421875, -0.29712677001953125, -0.2778778076171875, -0.25862884521484375, -0.2393798828125, -0.22013092041015625, -0.2008819580078125, -0.18163299560546875, -0.162384033203125, -0.14313507080078125, -0.1238861083984375, -0.10463714599609375, -0.08538818359375, -0.06613922119140625, -0.0468902587890625, -0.02764129638671875, -0.008392333984375, 0.01085662841796875, 0.0301055908203125, 0.04935455322265625, 0.068603515625, 0.08785247802734375, 0.1071014404296875, 0.12635040283203125, 0.145599365234375, 0.16484832763671875, 0.1840972900390625, 0.20334625244140625, 0.22259521484375, 0.24184417724609375, 0.2610931396484375, 0.28034210205078125, 0.299591064453125, 0.31884002685546875, 0.3380889892578125, 0.35733795166015625, 0.3765869140625, 0.39583587646484375, 0.4150848388671875, 0.43433380126953125, 0.453582763671875, 0.47283172607421875, 0.4920806884765625, 0.5113296508789062, 0.53057861328125, 0.5498275756835938, 0.5690765380859375, 0.5883255004882812, 0.607574462890625, 0.6268234252929688, 0.6460723876953125, 0.6653213500976562, 0.6845703125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 10.0, 20.0, 22.0, 31.0, 54.0, 59.0, 88.0, 103.0, 108.0, 131.0, 102.0, 89.0, 65.0, 40.0, 34.0, 20.0, 7.0, 11.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.599460601806641, -4.46221399307251, -4.324967384338379, -4.18772029876709, -4.050473690032959, -3.913227081298828, -3.7759804725646973, -3.6387338638305664, -3.5014870166778564, -3.3642404079437256, -3.2269935607910156, -3.0897469520568848, -2.952500343322754, -2.815253496170044, -2.678006887435913, -2.540760040283203, -2.4035134315490723, -2.2662668228149414, -2.1290199756622314, -1.9917733669281006, -1.8545266389846802, -1.7172799110412598, -1.580033302307129, -1.4427865743637085, -1.305539846420288, -1.1682931184768677, -1.0310463905334473, -0.8937997817993164, -0.756553053855896, -0.6193063259124756, -0.48205965757369995, -0.3448129892349243, -0.2075667381286621, -0.07032003998756409, 0.06692665815353394, 0.20417335629463196, 0.34142005443573, 0.4786667823791504, 0.615913450717926, 0.7531601190567017, 0.8904068470001221, 1.0276535749435425, 1.164900302886963, 1.3021469116210938, 1.4393936395645142, 1.5766403675079346, 1.7138869762420654, 1.8511337041854858, 1.9883804321289062, 2.125627040863037, 2.262873888015747, 2.400120496749878, 2.537367343902588, 2.6746139526367188, 2.8118605613708496, 2.9491071701049805, 3.0863540172576904, 3.2236006259918213, 3.3608474731445312, 3.498094081878662, 3.635340690612793, 3.772587537765503, 3.909834146499634, 4.047080993652344, 4.184327602386475]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 2.0, 7.0, 6.0, 11.0, 9.0, 21.0, 15.0, 21.0, 27.0, 23.0, 26.0, 29.0, 27.0, 35.0, 39.0, 49.0, 38.0, 44.0, 42.0, 50.0, 44.0, 45.0, 43.0, 25.0, 48.0, 48.0, 35.0, 31.0, 29.0, 28.0, 22.0, 14.0, 12.0, 4.0, 9.0, 9.0, 11.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.500917911529541, -2.425679922103882, -2.3504419326782227, -2.2752037048339844, -2.199965715408325, -2.124727725982666, -2.0494894981384277, -1.9742515087127686, -1.8990135192871094, -1.8237755298614502, -1.7485374212265015, -1.6732993125915527, -1.5980613231658936, -1.5228233337402344, -1.4475852251052856, -1.372347116470337, -1.2971091270446777, -1.2218711376190186, -1.1466330289840698, -1.071394920349121, -0.9961569309234619, -0.920918881893158, -0.845680832862854, -0.77044278383255, -0.6952047348022461, -0.6199666857719421, -0.5447286367416382, -0.46949058771133423, -0.3942525386810303, -0.3190144896507263, -0.24377644062042236, -0.1685383915901184, -0.09330034255981445, -0.018062293529510498, 0.05717575550079346, 0.1324138045310974, 0.20765185356140137, 0.2828899025917053, 0.3581279516220093, 0.43336600065231323, 0.5086040496826172, 0.5838420987129211, 0.6590801477432251, 0.734318196773529, 0.809556245803833, 0.884794294834137, 0.9600323438644409, 1.0352704524993896, 1.1105084419250488, 1.185746431350708, 1.2609845399856567, 1.3362226486206055, 1.4114606380462646, 1.4866986274719238, 1.5619367361068726, 1.6371748447418213, 1.7124128341674805, 1.7876508235931396, 1.8628889322280884, 1.938127040863037, 2.0133650302886963, 2.0886030197143555, 2.1638412475585938, 2.239079236984253, 2.314317226409912]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 1.0, 1.0, 2.0, 3.0, 8.0, 8.0, 13.0, 24.0, 31.0, 52.0, 106.0, 193.0, 320.0, 729.0, 1443.0, 3057.0, 6551.0, 13819.0, 31199.0, 70255.0, 153018.0, 262513.0, 250489.0, 139040.0, 63637.0, 28090.0, 12798.0, 5727.0, 2768.0, 1305.0, 608.0, 361.0, 177.0, 78.0, 53.0, 34.0, 21.0, 12.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.900390625, -1.8502960205078125, -1.800201416015625, -1.7501068115234375, -1.70001220703125, -1.6499176025390625, -1.599822998046875, -1.5497283935546875, -1.4996337890625, -1.4495391845703125, -1.399444580078125, -1.3493499755859375, -1.29925537109375, -1.2491607666015625, -1.199066162109375, -1.1489715576171875, -1.098876953125, -1.0487823486328125, -0.998687744140625, -0.9485931396484375, -0.89849853515625, -0.8484039306640625, -0.798309326171875, -0.7482147216796875, -0.6981201171875, -0.6480255126953125, -0.597930908203125, -0.5478363037109375, -0.49774169921875, -0.4476470947265625, -0.397552490234375, -0.3474578857421875, -0.29736328125, -0.2472686767578125, -0.197174072265625, -0.1470794677734375, -0.09698486328125, -0.0468902587890625, 0.003204345703125, 0.0532989501953125, 0.1033935546875, 0.1534881591796875, 0.203582763671875, 0.2536773681640625, 0.30377197265625, 0.3538665771484375, 0.403961181640625, 0.4540557861328125, 0.504150390625, 0.5542449951171875, 0.604339599609375, 0.6544342041015625, 0.70452880859375, 0.7546234130859375, 0.804718017578125, 0.8548126220703125, 0.9049072265625, 0.9550018310546875, 1.005096435546875, 1.0551910400390625, 1.10528564453125, 1.1553802490234375, 1.205474853515625, 1.2555694580078125, 1.3056640625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 4.0, 8.0, 9.0, 13.0, 12.0, 13.0, 27.0, 27.0, 19.0, 44.0, 29.0, 38.0, 41.0, 45.0, 52.0, 60.0, 61.0, 46.0, 63.0, 38.0, 56.0, 51.0, 38.0, 39.0, 37.0, 31.0, 18.0, 20.0, 17.0, 11.0, 7.0, 7.0, 5.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5146484375, -0.5002365112304688, -0.4858245849609375, -0.47141265869140625, -0.457000732421875, -0.44258880615234375, -0.4281768798828125, -0.41376495361328125, -0.39935302734375, -0.38494110107421875, -0.3705291748046875, -0.35611724853515625, -0.341705322265625, -0.32729339599609375, -0.3128814697265625, -0.29846954345703125, -0.2840576171875, -0.26964569091796875, -0.2552337646484375, -0.24082183837890625, -0.226409912109375, -0.21199798583984375, -0.1975860595703125, -0.18317413330078125, -0.16876220703125, -0.15435028076171875, -0.1399383544921875, -0.12552642822265625, -0.111114501953125, -0.09670257568359375, -0.0822906494140625, -0.06787872314453125, -0.053466796875, -0.03905487060546875, -0.0246429443359375, -0.01023101806640625, 0.004180908203125, 0.01859283447265625, 0.0330047607421875, 0.04741668701171875, 0.06182861328125, 0.07624053955078125, 0.0906524658203125, 0.10506439208984375, 0.119476318359375, 0.13388824462890625, 0.1483001708984375, 0.16271209716796875, 0.1771240234375, 0.19153594970703125, 0.2059478759765625, 0.22035980224609375, 0.234771728515625, 0.24918365478515625, 0.2635955810546875, 0.27800750732421875, 0.29241943359375, 0.30683135986328125, 0.3212432861328125, 0.33565521240234375, 0.350067138671875, 0.36447906494140625, 0.3788909912109375, 0.39330291748046875, 0.40771484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 12.0, 27.0, 21.0, 43.0, 62.0, 98.0, 172.0, 254.0, 538.0, 1231.0, 3466.0, 10286.0, 32320.0, 97836.0, 235060.0, 325463.0, 213732.0, 85747.0, 28211.0, 8962.0, 2896.0, 1047.0, 505.0, 207.0, 136.0, 67.0, 59.0, 36.0, 16.0, 19.0, 9.0, 8.0, 0.0, 8.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4052734375, -1.35211181640625, -1.2989501953125, -1.24578857421875, -1.192626953125, -1.13946533203125, -1.0863037109375, -1.03314208984375, -0.97998046875, -0.92681884765625, -0.8736572265625, -0.82049560546875, -0.767333984375, -0.71417236328125, -0.6610107421875, -0.60784912109375, -0.5546875, -0.50152587890625, -0.4483642578125, -0.39520263671875, -0.342041015625, -0.28887939453125, -0.2357177734375, -0.18255615234375, -0.12939453125, -0.07623291015625, -0.0230712890625, 0.03009033203125, 0.083251953125, 0.13641357421875, 0.1895751953125, 0.24273681640625, 0.2958984375, 0.34906005859375, 0.4022216796875, 0.45538330078125, 0.508544921875, 0.56170654296875, 0.6148681640625, 0.66802978515625, 0.72119140625, 0.77435302734375, 0.8275146484375, 0.88067626953125, 0.933837890625, 0.98699951171875, 1.0401611328125, 1.09332275390625, 1.146484375, 1.19964599609375, 1.2528076171875, 1.30596923828125, 1.359130859375, 1.41229248046875, 1.4654541015625, 1.51861572265625, 1.57177734375, 1.62493896484375, 1.6781005859375, 1.73126220703125, 1.784423828125, 1.83758544921875, 1.8907470703125, 1.94390869140625, 1.9970703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 11.0, 14.0, 13.0, 16.0, 20.0, 16.0, 21.0, 31.0, 33.0, 27.0, 32.0, 39.0, 43.0, 45.0, 50.0, 56.0, 49.0, 48.0, 44.0, 42.0, 37.0, 46.0, 44.0, 35.0, 26.0, 30.0, 17.0, 12.0, 18.0, 17.0, 17.0, 7.0, 8.0, 9.0, 11.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.080078125, -1.0424041748046875, -1.004730224609375, -0.9670562744140625, -0.92938232421875, -0.8917083740234375, -0.854034423828125, -0.8163604736328125, -0.7786865234375, -0.7410125732421875, -0.703338623046875, -0.6656646728515625, -0.62799072265625, -0.5903167724609375, -0.552642822265625, -0.5149688720703125, -0.477294921875, -0.4396209716796875, -0.401947021484375, -0.3642730712890625, -0.32659912109375, -0.2889251708984375, -0.251251220703125, -0.2135772705078125, -0.1759033203125, -0.1382293701171875, -0.100555419921875, -0.0628814697265625, -0.02520751953125, 0.0124664306640625, 0.050140380859375, 0.0878143310546875, 0.12548828125, 0.1631622314453125, 0.200836181640625, 0.2385101318359375, 0.27618408203125, 0.3138580322265625, 0.351531982421875, 0.3892059326171875, 0.4268798828125, 0.4645538330078125, 0.502227783203125, 0.5399017333984375, 0.57757568359375, 0.6152496337890625, 0.652923583984375, 0.6905975341796875, 0.728271484375, 0.7659454345703125, 0.803619384765625, 0.8412933349609375, 0.87896728515625, 0.9166412353515625, 0.954315185546875, 0.9919891357421875, 1.0296630859375, 1.0673370361328125, 1.105010986328125, 1.1426849365234375, 1.18035888671875, 1.2180328369140625, 1.255706787109375, 1.2933807373046875, 1.3310546875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 9.0, 6.0, 13.0, 13.0, 17.0, 35.0, 45.0, 100.0, 198.0, 325.0, 634.0, 1250.0, 2640.0, 5733.0, 12664.0, 29510.0, 71306.0, 166521.0, 287145.0, 252126.0, 126435.0, 52202.0, 21713.0, 9507.0, 4268.0, 2016.0, 978.0, 525.0, 278.0, 149.0, 61.0, 46.0, 34.0, 21.0, 9.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7294921875, -0.7091293334960938, -0.6887664794921875, -0.6684036254882812, -0.648040771484375, -0.6276779174804688, -0.6073150634765625, -0.5869522094726562, -0.56658935546875, -0.5462265014648438, -0.5258636474609375, -0.5055007934570312, -0.485137939453125, -0.46477508544921875, -0.4444122314453125, -0.42404937744140625, -0.4036865234375, -0.38332366943359375, -0.3629608154296875, -0.34259796142578125, -0.322235107421875, -0.30187225341796875, -0.2815093994140625, -0.26114654541015625, -0.24078369140625, -0.22042083740234375, -0.2000579833984375, -0.17969512939453125, -0.159332275390625, -0.13896942138671875, -0.1186065673828125, -0.09824371337890625, -0.077880859375, -0.05751800537109375, -0.0371551513671875, -0.01679229736328125, 0.003570556640625, 0.02393341064453125, 0.0442962646484375, 0.06465911865234375, 0.08502197265625, 0.10538482666015625, 0.1257476806640625, 0.14611053466796875, 0.166473388671875, 0.18683624267578125, 0.2071990966796875, 0.22756195068359375, 0.2479248046875, 0.26828765869140625, 0.2886505126953125, 0.30901336669921875, 0.329376220703125, 0.34973907470703125, 0.3701019287109375, 0.39046478271484375, 0.41082763671875, 0.43119049072265625, 0.4515533447265625, 0.47191619873046875, 0.492279052734375, 0.5126419067382812, 0.5330047607421875, 0.5533676147460938, 0.57373046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 7.0, 1.0, 4.0, 5.0, 9.0, 13.0, 22.0, 22.0, 27.0, 52.0, 47.0, 75.0, 96.0, 105.0, 94.0, 90.0, 70.0, 64.0, 43.0, 29.0, 34.0, 19.0, 15.0, 15.0, 11.0, 6.0, 7.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016450881958007812, -0.00015968270599842072, -0.0001548565924167633, -0.0001500304788351059, -0.00014520436525344849, -0.00014037825167179108, -0.00013555213809013367, -0.00013072602450847626, -0.00012589991092681885, -0.00012107379734516144, -0.00011624768376350403, -0.00011142157018184662, -0.00010659545660018921, -0.0001017693430185318, -9.694322943687439e-05, -9.211711585521698e-05, -8.729100227355957e-05, -8.246488869190216e-05, -7.763877511024475e-05, -7.281266152858734e-05, -6.798654794692993e-05, -6.316043436527252e-05, -5.833432078361511e-05, -5.35082072019577e-05, -4.868209362030029e-05, -4.385598003864288e-05, -3.9029866456985474e-05, -3.4203752875328064e-05, -2.9377639293670654e-05, -2.4551525712013245e-05, -1.9725412130355835e-05, -1.4899298548698425e-05, -1.0073184967041016e-05, -5.247071385383606e-06, -4.209578037261963e-07, 4.405155777931213e-06, 9.231269359588623e-06, 1.4057382941246033e-05, 1.8883496522903442e-05, 2.3709610104560852e-05, 2.8535723686218262e-05, 3.336183726787567e-05, 3.818795084953308e-05, 4.301406443119049e-05, 4.78401780128479e-05, 5.266629159450531e-05, 5.749240517616272e-05, 6.231851875782013e-05, 6.714463233947754e-05, 7.197074592113495e-05, 7.679685950279236e-05, 8.162297308444977e-05, 8.644908666610718e-05, 9.127520024776459e-05, 9.6101313829422e-05, 0.0001009274274110794, 0.00010575354099273682, 0.00011057965457439423, 0.00011540576815605164, 0.00012023188173770905, 0.00012505799531936646, 0.00012988410890102386, 0.00013471022248268127, 0.00013953633606433868, 0.0001443624496459961]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 7.0, 10.0, 12.0, 15.0, 26.0, 34.0, 44.0, 58.0, 108.0, 169.0, 280.0, 491.0, 892.0, 1836.0, 3795.0, 7709.0, 16883.0, 39699.0, 102325.0, 239700.0, 319391.0, 186326.0, 73921.0, 29716.0, 12781.0, 6144.0, 2877.0, 1428.0, 762.0, 446.0, 234.0, 159.0, 76.0, 56.0, 38.0, 24.0, 22.0, 17.0, 13.0, 11.0, 5.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61865234375, -0.599517822265625, -0.58038330078125, -0.561248779296875, -0.5421142578125, -0.522979736328125, -0.50384521484375, -0.484710693359375, -0.465576171875, -0.446441650390625, -0.42730712890625, -0.408172607421875, -0.3890380859375, -0.369903564453125, -0.35076904296875, -0.331634521484375, -0.3125, -0.293365478515625, -0.27423095703125, -0.255096435546875, -0.2359619140625, -0.216827392578125, -0.19769287109375, -0.178558349609375, -0.159423828125, -0.140289306640625, -0.12115478515625, -0.102020263671875, -0.0828857421875, -0.063751220703125, -0.04461669921875, -0.025482177734375, -0.00634765625, 0.012786865234375, 0.03192138671875, 0.051055908203125, 0.0701904296875, 0.089324951171875, 0.10845947265625, 0.127593994140625, 0.146728515625, 0.165863037109375, 0.18499755859375, 0.204132080078125, 0.2232666015625, 0.242401123046875, 0.26153564453125, 0.280670166015625, 0.2998046875, 0.318939208984375, 0.33807373046875, 0.357208251953125, 0.3763427734375, 0.395477294921875, 0.41461181640625, 0.433746337890625, 0.452880859375, 0.472015380859375, 0.49114990234375, 0.510284423828125, 0.5294189453125, 0.548553466796875, 0.56768798828125, 0.586822509765625, 0.60595703125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 2.0, 4.0, 6.0, 4.0, 9.0, 11.0, 6.0, 14.0, 18.0, 24.0, 29.0, 35.0, 35.0, 42.0, 52.0, 59.0, 74.0, 60.0, 66.0, 75.0, 63.0, 51.0, 39.0, 45.0, 29.0, 34.0, 22.0, 16.0, 23.0, 10.0, 11.0, 5.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.393310546875, -0.37985992431640625, -0.3664093017578125, -0.35295867919921875, -0.339508056640625, -0.32605743408203125, -0.3126068115234375, -0.29915618896484375, -0.28570556640625, -0.27225494384765625, -0.2588043212890625, -0.24535369873046875, -0.231903076171875, -0.21845245361328125, -0.2050018310546875, -0.19155120849609375, -0.1781005859375, -0.16464996337890625, -0.1511993408203125, -0.13774871826171875, -0.124298095703125, -0.11084747314453125, -0.0973968505859375, -0.08394622802734375, -0.07049560546875, -0.05704498291015625, -0.0435943603515625, -0.03014373779296875, -0.016693115234375, -0.00324249267578125, 0.0102081298828125, 0.02365875244140625, 0.037109375, 0.05055999755859375, 0.0640106201171875, 0.07746124267578125, 0.090911865234375, 0.10436248779296875, 0.1178131103515625, 0.13126373291015625, 0.14471435546875, 0.15816497802734375, 0.1716156005859375, 0.18506622314453125, 0.198516845703125, 0.21196746826171875, 0.2254180908203125, 0.23886871337890625, 0.2523193359375, 0.26576995849609375, 0.2792205810546875, 0.29267120361328125, 0.306121826171875, 0.31957244873046875, 0.3330230712890625, 0.34647369384765625, 0.35992431640625, 0.37337493896484375, 0.3868255615234375, 0.40027618408203125, 0.413726806640625, 0.42717742919921875, 0.4406280517578125, 0.45407867431640625, 0.467529296875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 4.0, 6.0, 4.0, 13.0, 10.0, 17.0, 21.0, 23.0, 29.0, 32.0, 38.0, 48.0, 53.0, 60.0, 70.0, 61.0, 52.0, 66.0, 54.0, 54.0, 55.0, 48.0, 29.0, 36.0, 22.0, 17.0, 15.0, 19.0, 13.0, 6.0, 9.0, 5.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4626381397247314, -3.3460724353790283, -3.229506731033325, -3.112941026687622, -2.99637508392334, -2.8798093795776367, -2.7632436752319336, -2.6466779708862305, -2.5301122665405273, -2.413546562194824, -2.296980857849121, -2.180415153503418, -2.063849449157715, -1.9472836256027222, -1.8307178020477295, -1.7141520977020264, -1.5975863933563232, -1.4810206890106201, -1.364454984664917, -1.2478891611099243, -1.1313234567642212, -1.014757752418518, -0.8981919884681702, -0.7816262245178223, -0.6650605201721191, -0.548494815826416, -0.4319290518760681, -0.3153633177280426, -0.1987975835800171, -0.08223187923431396, 0.034333884716033936, 0.15089964866638184, 0.26746511459350586, 0.38403084874153137, 0.5005965828895569, 0.6171623468399048, 0.7337280511856079, 0.850293755531311, 0.9668595194816589, 1.0834252834320068, 1.19999098777771, 1.316556692123413, 1.4331223964691162, 1.5496882200241089, 1.666253924369812, 1.7828196287155151, 1.8993854522705078, 2.015951156616211, 2.132516860961914, 2.249082565307617, 2.3656482696533203, 2.4822139739990234, 2.5987796783447266, 2.7153453826904297, 2.831911325454712, 2.948477029800415, 3.065042734146118, 3.1816084384918213, 3.2981741428375244, 3.4147398471832275, 3.5313057899475098, 3.647871494293213, 3.764437198638916, 3.881002902984619, 3.9975686073303223]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 4.0, 5.0, 11.0, 13.0, 7.0, 17.0, 21.0, 16.0, 22.0, 26.0, 23.0, 30.0, 31.0, 33.0, 39.0, 39.0, 38.0, 43.0, 38.0, 47.0, 33.0, 51.0, 41.0, 50.0, 37.0, 33.0, 29.0, 34.0, 27.0, 20.0, 26.0, 14.0, 14.0, 16.0, 15.0, 13.0, 12.0, 4.0, 6.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5046651363372803, -3.3897159099578857, -3.274766683578491, -3.159817695617676, -3.0448684692382812, -2.9299192428588867, -2.814970016479492, -2.7000207901000977, -2.585071563720703, -2.4701223373413086, -2.355173110961914, -2.2402238845825195, -2.125274896621704, -2.0103256702423096, -1.895376443862915, -1.7804272174835205, -1.665478229522705, -1.5505290031433105, -1.4355798959732056, -1.320630669593811, -1.205681562423706, -1.0907323360443115, -0.975783109664917, -0.8608339428901672, -0.7458847761154175, -0.6309356093406677, -0.515986442565918, -0.40103721618652344, -0.2860880494117737, -0.17113888263702393, -0.056189656257629395, 0.05875951051712036, 0.17370891571044922, 0.288658082485199, 0.4036072790622711, 0.5185564756393433, 0.633505642414093, 0.7484548091888428, 0.8634040355682373, 0.9783532023429871, 1.0933023691177368, 1.2082515954971313, 1.3232007026672363, 1.4381499290466309, 1.5530991554260254, 1.6680482625961304, 1.782997488975525, 1.8979465961456299, 2.0128958225250244, 2.127845048904419, 2.2427942752838135, 2.357743263244629, 2.4726924896240234, 2.587641716003418, 2.7025909423828125, 2.817540168762207, 2.9324893951416016, 3.047438621520996, 3.1623878479003906, 3.277337074279785, 3.3922860622406006, 3.507235288619995, 3.6221845149993896, 3.737133741378784, 3.8520827293395996]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 10.0, 7.0, 15.0, 26.0, 37.0, 52.0, 89.0, 149.0, 224.0, 391.0, 766.0, 1384.0, 2946.0, 6348.0, 14620.0, 37328.0, 107252.0, 348664.0, 1086964.0, 1552668.0, 705359.0, 214754.0, 69617.0, 25104.0, 10459.0, 4613.0, 2125.0, 1049.0, 558.0, 281.0, 162.0, 93.0, 56.0, 41.0, 35.0, 15.0, 9.0, 8.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.671875, -0.6504058837890625, -0.628936767578125, -0.6074676513671875, -0.58599853515625, -0.5645294189453125, -0.543060302734375, -0.5215911865234375, -0.5001220703125, -0.4786529541015625, -0.457183837890625, -0.4357147216796875, -0.41424560546875, -0.3927764892578125, -0.371307373046875, -0.3498382568359375, -0.328369140625, -0.3069000244140625, -0.285430908203125, -0.2639617919921875, -0.24249267578125, -0.2210235595703125, -0.199554443359375, -0.1780853271484375, -0.1566162109375, -0.1351470947265625, -0.113677978515625, -0.0922088623046875, -0.07073974609375, -0.0492706298828125, -0.027801513671875, -0.0063323974609375, 0.01513671875, 0.0366058349609375, 0.058074951171875, 0.0795440673828125, 0.10101318359375, 0.1224822998046875, 0.143951416015625, 0.1654205322265625, 0.1868896484375, 0.2083587646484375, 0.229827880859375, 0.2512969970703125, 0.27276611328125, 0.2942352294921875, 0.315704345703125, 0.3371734619140625, 0.358642578125, 0.3801116943359375, 0.401580810546875, 0.4230499267578125, 0.44451904296875, 0.4659881591796875, 0.487457275390625, 0.5089263916015625, 0.5303955078125, 0.5518646240234375, 0.573333740234375, 0.5948028564453125, 0.61627197265625, 0.6377410888671875, 0.659210205078125, 0.6806793212890625, 0.7021484375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 3.0, 10.0, 15.0, 11.0, 19.0, 14.0, 30.0, 35.0, 54.0, 38.0, 39.0, 43.0, 51.0, 50.0, 64.0, 63.0, 63.0, 66.0, 43.0, 43.0, 44.0, 32.0, 28.0, 29.0, 25.0, 20.0, 18.0, 7.0, 16.0, 6.0, 11.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70263671875, -0.6836166381835938, -0.6645965576171875, -0.6455764770507812, -0.626556396484375, -0.6075363159179688, -0.5885162353515625, -0.5694961547851562, -0.55047607421875, -0.5314559936523438, -0.5124359130859375, -0.49341583251953125, -0.474395751953125, -0.45537567138671875, -0.4363555908203125, -0.41733551025390625, -0.3983154296875, -0.37929534912109375, -0.3602752685546875, -0.34125518798828125, -0.322235107421875, -0.30321502685546875, -0.2841949462890625, -0.26517486572265625, -0.24615478515625, -0.22713470458984375, -0.2081146240234375, -0.18909454345703125, -0.170074462890625, -0.15105438232421875, -0.1320343017578125, -0.11301422119140625, -0.093994140625, -0.07497406005859375, -0.0559539794921875, -0.03693389892578125, -0.017913818359375, 0.00110626220703125, 0.0201263427734375, 0.03914642333984375, 0.05816650390625, 0.07718658447265625, 0.0962066650390625, 0.11522674560546875, 0.134246826171875, 0.15326690673828125, 0.1722869873046875, 0.19130706787109375, 0.2103271484375, 0.22934722900390625, 0.2483673095703125, 0.26738739013671875, 0.286407470703125, 0.30542755126953125, 0.3244476318359375, 0.34346771240234375, 0.36248779296875, 0.38150787353515625, 0.4005279541015625, 0.41954803466796875, 0.438568115234375, 0.45758819580078125, 0.4766082763671875, 0.49562835693359375, 0.5146484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 7.0, 3.0, 12.0, 13.0, 23.0, 21.0, 32.0, 41.0, 97.0, 119.0, 175.0, 293.0, 477.0, 891.0, 1420.0, 2658.0, 5193.0, 10666.0, 23252.0, 53660.0, 132555.0, 330613.0, 773139.0, 1292970.0, 896656.0, 393739.0, 158531.0, 64303.0, 27284.0, 12373.0, 6014.0, 3101.0, 1599.0, 936.0, 533.0, 313.0, 214.0, 122.0, 87.0, 42.0, 47.0, 21.0, 16.0, 10.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.7197265625, -0.6995086669921875, -0.679290771484375, -0.6590728759765625, -0.63885498046875, -0.6186370849609375, -0.598419189453125, -0.5782012939453125, -0.5579833984375, -0.5377655029296875, -0.517547607421875, -0.4973297119140625, -0.47711181640625, -0.4568939208984375, -0.436676025390625, -0.4164581298828125, -0.396240234375, -0.3760223388671875, -0.355804443359375, -0.3355865478515625, -0.31536865234375, -0.2951507568359375, -0.274932861328125, -0.2547149658203125, -0.2344970703125, -0.2142791748046875, -0.194061279296875, -0.1738433837890625, -0.15362548828125, -0.1334075927734375, -0.113189697265625, -0.0929718017578125, -0.07275390625, -0.0525360107421875, -0.032318115234375, -0.0121002197265625, 0.00811767578125, 0.0283355712890625, 0.048553466796875, 0.0687713623046875, 0.0889892578125, 0.1092071533203125, 0.129425048828125, 0.1496429443359375, 0.16986083984375, 0.1900787353515625, 0.210296630859375, 0.2305145263671875, 0.250732421875, 0.2709503173828125, 0.291168212890625, 0.3113861083984375, 0.33160400390625, 0.3518218994140625, 0.372039794921875, 0.3922576904296875, 0.4124755859375, 0.4326934814453125, 0.452911376953125, 0.4731292724609375, 0.49334716796875, 0.5135650634765625, 0.533782958984375, 0.5540008544921875, 0.57421875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 3.0, 5.0, 8.0, 13.0, 16.0, 16.0, 26.0, 30.0, 27.0, 63.0, 59.0, 57.0, 90.0, 113.0, 155.0, 194.0, 222.0, 263.0, 333.0, 325.0, 342.0, 288.0, 237.0, 237.0, 195.0, 157.0, 114.0, 112.0, 57.0, 65.0, 55.0, 45.0, 26.0, 32.0, 21.0, 24.0, 12.0, 7.0, 8.0, 6.0, 4.0, 8.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.72119140625, -0.6993560791015625, -0.677520751953125, -0.6556854248046875, -0.63385009765625, -0.6120147705078125, -0.590179443359375, -0.5683441162109375, -0.5465087890625, -0.5246734619140625, -0.502838134765625, -0.4810028076171875, -0.45916748046875, -0.4373321533203125, -0.415496826171875, -0.3936614990234375, -0.371826171875, -0.3499908447265625, -0.328155517578125, -0.3063201904296875, -0.28448486328125, -0.2626495361328125, -0.240814208984375, -0.2189788818359375, -0.1971435546875, -0.1753082275390625, -0.153472900390625, -0.1316375732421875, -0.10980224609375, -0.0879669189453125, -0.066131591796875, -0.0442962646484375, -0.0224609375, -0.0006256103515625, 0.021209716796875, 0.0430450439453125, 0.06488037109375, 0.0867156982421875, 0.108551025390625, 0.1303863525390625, 0.1522216796875, 0.1740570068359375, 0.195892333984375, 0.2177276611328125, 0.23956298828125, 0.2613983154296875, 0.283233642578125, 0.3050689697265625, 0.326904296875, 0.3487396240234375, 0.370574951171875, 0.3924102783203125, 0.41424560546875, 0.4360809326171875, 0.457916259765625, 0.4797515869140625, 0.5015869140625, 0.5234222412109375, 0.545257568359375, 0.5670928955078125, 0.58892822265625, 0.6107635498046875, 0.632598876953125, 0.6544342041015625, 0.67626953125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 7.0, 15.0, 19.0, 36.0, 52.0, 73.0, 94.0, 112.0, 115.0, 95.0, 114.0, 81.0, 68.0, 44.0, 39.0, 16.0, 14.0, 5.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.793507099151611, -6.603335380554199, -6.413163661956787, -6.222991943359375, -6.032820224761963, -5.842648506164551, -5.652477264404297, -5.462305068969727, -5.272133827209473, -5.0819621086120605, -4.891790390014648, -4.701618671417236, -4.511446952819824, -4.321275234222412, -4.131103515625, -3.940932035446167, -3.750760078430176, -3.5605883598327637, -3.3704166412353516, -3.1802449226379395, -2.9900732040405273, -2.7999014854431152, -2.6097300052642822, -2.41955828666687, -2.229386568069458, -2.039214849472046, -1.8490431308746338, -1.6588715314865112, -1.4686998128890991, -1.278528094291687, -1.0883564949035645, -0.8981847763061523, -0.7080135345458984, -0.5178418159484863, -0.327670156955719, -0.13749849796295166, 0.05267322063446045, 0.24284493923187256, 0.4330165386199951, 0.6231882572174072, 0.8133599758148193, 1.0035316944122314, 1.1937034130096436, 1.3838750123977661, 1.5740467309951782, 1.7642184495925903, 1.954390048980713, 2.144561767578125, 2.334733486175537, 2.524905204772949, 2.7150769233703613, 2.9052486419677734, 3.0954203605651855, 3.2855920791625977, 3.4757635593414307, 3.6659352779388428, 3.856106996536255, 4.046278476715088, 4.2364501953125, 4.426621913909912, 4.616793632507324, 4.806965351104736, 4.997137069702148, 5.1873087882995605, 5.377480506896973]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 7.0, 7.0, 7.0, 7.0, 8.0, 19.0, 13.0, 20.0, 23.0, 27.0, 25.0, 38.0, 34.0, 30.0, 29.0, 42.0, 33.0, 36.0, 41.0, 35.0, 44.0, 33.0, 41.0, 41.0, 33.0, 36.0, 32.0, 40.0, 28.0, 34.0, 22.0, 26.0, 17.0, 18.0, 15.0, 8.0, 12.0, 7.0, 10.0, 6.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.0110158920288086, -2.920952320098877, -2.8308887481689453, -2.7408251762390137, -2.650761604309082, -2.5606980323791504, -2.4706344604492188, -2.380570888519287, -2.2905073165893555, -2.200443744659424, -2.110380172729492, -2.0203166007995605, -1.930253028869629, -1.8401894569396973, -1.7501258850097656, -1.660062313079834, -1.5699987411499023, -1.4799351692199707, -1.389871597290039, -1.2998080253601074, -1.2097444534301758, -1.1196808815002441, -1.0296173095703125, -0.9395537376403809, -0.8494901657104492, -0.7594265937805176, -0.6693630218505859, -0.5792994499206543, -0.48923587799072266, -0.399172306060791, -0.3091087341308594, -0.21904516220092773, -0.1289818286895752, -0.038918256759643555, 0.051145315170288086, 0.14120888710021973, 0.23127245903015137, 0.321336030960083, 0.41139960289001465, 0.5014631748199463, 0.5915267467498779, 0.6815903186798096, 0.7716538906097412, 0.8617174625396729, 0.9517810344696045, 1.0418446063995361, 1.1319081783294678, 1.2219717502593994, 1.312035322189331, 1.4020988941192627, 1.4921624660491943, 1.582226037979126, 1.6722896099090576, 1.7623531818389893, 1.852416753768921, 1.9424803256988525, 2.032543897628784, 2.122607469558716, 2.2126710414886475, 2.302734613418579, 2.3927981853485107, 2.4828617572784424, 2.572925329208374, 2.6629889011383057, 2.7530524730682373]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 10.0, 11.0, 11.0, 17.0, 41.0, 56.0, 86.0, 117.0, 214.0, 411.0, 702.0, 1292.0, 2662.0, 4950.0, 9300.0, 17467.0, 33439.0, 66712.0, 147950.0, 274904.0, 249394.0, 121946.0, 56082.0, 28703.0, 14940.0, 8061.0, 4234.0, 2224.0, 1137.0, 596.0, 340.0, 191.0, 132.0, 67.0, 49.0, 32.0, 21.0, 19.0, 10.0, 5.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1640625, -1.1251068115234375, -1.086151123046875, -1.0471954345703125, -1.00823974609375, -0.9692840576171875, -0.930328369140625, -0.8913726806640625, -0.8524169921875, -0.8134613037109375, -0.774505615234375, -0.7355499267578125, -0.69659423828125, -0.6576385498046875, -0.618682861328125, -0.5797271728515625, -0.540771484375, -0.5018157958984375, -0.462860107421875, -0.4239044189453125, -0.38494873046875, -0.3459930419921875, -0.307037353515625, -0.2680816650390625, -0.2291259765625, -0.1901702880859375, -0.151214599609375, -0.1122589111328125, -0.07330322265625, -0.0343475341796875, 0.004608154296875, 0.0435638427734375, 0.08251953125, 0.1214752197265625, 0.160430908203125, 0.1993865966796875, 0.23834228515625, 0.2772979736328125, 0.316253662109375, 0.3552093505859375, 0.3941650390625, 0.4331207275390625, 0.472076416015625, 0.5110321044921875, 0.54998779296875, 0.5889434814453125, 0.627899169921875, 0.6668548583984375, 0.705810546875, 0.7447662353515625, 0.783721923828125, 0.8226776123046875, 0.86163330078125, 0.9005889892578125, 0.939544677734375, 0.9785003662109375, 1.0174560546875, 1.0564117431640625, 1.095367431640625, 1.1343231201171875, 1.17327880859375, 1.2122344970703125, 1.251190185546875, 1.2901458740234375, 1.3291015625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 5.0, 11.0, 9.0, 10.0, 7.0, 10.0, 14.0, 21.0, 26.0, 25.0, 30.0, 23.0, 37.0, 36.0, 27.0, 40.0, 45.0, 46.0, 46.0, 48.0, 47.0, 42.0, 57.0, 31.0, 39.0, 43.0, 25.0, 29.0, 37.0, 24.0, 20.0, 16.0, 13.0, 11.0, 6.0, 9.0, 11.0, 8.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.52880859375, -0.5141944885253906, -0.49958038330078125, -0.4849662780761719, -0.4703521728515625, -0.4557380676269531, -0.44112396240234375, -0.4265098571777344, -0.411895751953125, -0.3972816467285156, -0.38266754150390625, -0.3680534362792969, -0.3534393310546875, -0.3388252258300781, -0.32421112060546875, -0.3095970153808594, -0.29498291015625, -0.2803688049316406, -0.26575469970703125, -0.2511405944824219, -0.2365264892578125, -0.22191238403320312, -0.20729827880859375, -0.19268417358398438, -0.178070068359375, -0.16345596313476562, -0.14884185791015625, -0.13422775268554688, -0.1196136474609375, -0.10499954223632812, -0.09038543701171875, -0.07577133178710938, -0.0611572265625, -0.046543121337890625, -0.03192901611328125, -0.017314910888671875, -0.0027008056640625, 0.011913299560546875, 0.02652740478515625, 0.041141510009765625, 0.055755615234375, 0.07036972045898438, 0.08498382568359375, 0.09959793090820312, 0.1142120361328125, 0.12882614135742188, 0.14344024658203125, 0.15805435180664062, 0.17266845703125, 0.18728256225585938, 0.20189666748046875, 0.21651077270507812, 0.2311248779296875, 0.24573898315429688, 0.26035308837890625, 0.2749671936035156, 0.289581298828125, 0.3041954040527344, 0.31880950927734375, 0.3334236145019531, 0.3480377197265625, 0.3626518249511719, 0.37726593017578125, 0.3918800354003906, 0.406494140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 1.0, 6.0, 11.0, 10.0, 14.0, 19.0, 26.0, 48.0, 75.0, 140.0, 221.0, 444.0, 1145.0, 4523.0, 21987.0, 107804.0, 448570.0, 364393.0, 78110.0, 15840.0, 3314.0, 943.0, 348.0, 209.0, 133.0, 93.0, 54.0, 23.0, 23.0, 10.0, 8.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.59765625, -2.525299072265625, -2.45294189453125, -2.380584716796875, -2.3082275390625, -2.235870361328125, -2.16351318359375, -2.091156005859375, -2.018798828125, -1.946441650390625, -1.87408447265625, -1.801727294921875, -1.7293701171875, -1.657012939453125, -1.58465576171875, -1.512298583984375, -1.43994140625, -1.367584228515625, -1.29522705078125, -1.222869873046875, -1.1505126953125, -1.078155517578125, -1.00579833984375, -0.933441162109375, -0.861083984375, -0.788726806640625, -0.71636962890625, -0.644012451171875, -0.5716552734375, -0.499298095703125, -0.42694091796875, -0.354583740234375, -0.2822265625, -0.209869384765625, -0.13751220703125, -0.065155029296875, 0.0072021484375, 0.079559326171875, 0.15191650390625, 0.224273681640625, 0.296630859375, 0.368988037109375, 0.44134521484375, 0.513702392578125, 0.5860595703125, 0.658416748046875, 0.73077392578125, 0.803131103515625, 0.87548828125, 0.947845458984375, 1.02020263671875, 1.092559814453125, 1.1649169921875, 1.237274169921875, 1.30963134765625, 1.381988525390625, 1.454345703125, 1.526702880859375, 1.59906005859375, 1.671417236328125, 1.7437744140625, 1.816131591796875, 1.88848876953125, 1.960845947265625, 2.033203125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 6.0, 8.0, 11.0, 11.0, 18.0, 21.0, 18.0, 32.0, 30.0, 40.0, 35.0, 53.0, 41.0, 50.0, 40.0, 52.0, 39.0, 42.0, 52.0, 44.0, 52.0, 40.0, 41.0, 38.0, 34.0, 23.0, 22.0, 19.0, 22.0, 13.0, 15.0, 12.0, 8.0, 5.0, 7.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3857421875, -1.3373565673828125, -1.288970947265625, -1.2405853271484375, -1.19219970703125, -1.1438140869140625, -1.095428466796875, -1.0470428466796875, -0.9986572265625, -0.9502716064453125, -0.901885986328125, -0.8535003662109375, -0.80511474609375, -0.7567291259765625, -0.708343505859375, -0.6599578857421875, -0.611572265625, -0.5631866455078125, -0.514801025390625, -0.4664154052734375, -0.41802978515625, -0.3696441650390625, -0.321258544921875, -0.2728729248046875, -0.2244873046875, -0.1761016845703125, -0.127716064453125, -0.0793304443359375, -0.03094482421875, 0.0174407958984375, 0.065826416015625, 0.1142120361328125, 0.16259765625, 0.2109832763671875, 0.259368896484375, 0.3077545166015625, 0.35614013671875, 0.4045257568359375, 0.452911376953125, 0.5012969970703125, 0.5496826171875, 0.5980682373046875, 0.646453857421875, 0.6948394775390625, 0.74322509765625, 0.7916107177734375, 0.839996337890625, 0.8883819580078125, 0.936767578125, 0.9851531982421875, 1.033538818359375, 1.0819244384765625, 1.13031005859375, 1.1786956787109375, 1.227081298828125, 1.2754669189453125, 1.3238525390625, 1.3722381591796875, 1.420623779296875, 1.4690093994140625, 1.51739501953125, 1.5657806396484375, 1.614166259765625, 1.6625518798828125, 1.7109375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 13.0, 15.0, 17.0, 44.0, 55.0, 66.0, 117.0, 166.0, 271.0, 428.0, 638.0, 1011.0, 1669.0, 2522.0, 3875.0, 6213.0, 9866.0, 15920.0, 24962.0, 40844.0, 69606.0, 117203.0, 172517.0, 190922.0, 150440.0, 94702.0, 55696.0, 32916.0, 20835.0, 12835.0, 8262.0, 5109.0, 3277.0, 1960.0, 1252.0, 809.0, 496.0, 355.0, 196.0, 156.0, 113.0, 45.0, 34.0, 31.0, 31.0, 21.0, 6.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.3984375, -0.3860969543457031, -0.37375640869140625, -0.3614158630371094, -0.3490753173828125, -0.3367347717285156, -0.32439422607421875, -0.3120536804199219, -0.299713134765625, -0.2873725891113281, -0.27503204345703125, -0.2626914978027344, -0.2503509521484375, -0.23801040649414062, -0.22566986083984375, -0.21332931518554688, -0.20098876953125, -0.18864822387695312, -0.17630767822265625, -0.16396713256835938, -0.1516265869140625, -0.13928604125976562, -0.12694549560546875, -0.11460494995117188, -0.102264404296875, -0.08992385864257812, -0.07758331298828125, -0.06524276733398438, -0.0529022216796875, -0.040561676025390625, -0.02822113037109375, -0.015880584716796875, -0.0035400390625, 0.008800506591796875, 0.02114105224609375, 0.033481597900390625, 0.0458221435546875, 0.058162689208984375, 0.07050323486328125, 0.08284378051757812, 0.095184326171875, 0.10752487182617188, 0.11986541748046875, 0.13220596313476562, 0.1445465087890625, 0.15688705444335938, 0.16922760009765625, 0.18156814575195312, 0.19390869140625, 0.20624923706054688, 0.21858978271484375, 0.23093032836914062, 0.2432708740234375, 0.2556114196777344, 0.26795196533203125, 0.2802925109863281, 0.292633056640625, 0.3049736022949219, 0.31731414794921875, 0.3296546936035156, 0.3419952392578125, 0.3543357849121094, 0.36667633056640625, 0.3790168762207031, 0.391357421875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 8.0, 6.0, 3.0, 11.0, 13.0, 11.0, 15.0, 10.0, 17.0, 14.0, 18.0, 25.0, 45.0, 68.0, 79.0, 99.0, 98.0, 100.0, 88.0, 69.0, 36.0, 31.0, 24.0, 19.0, 16.0, 9.0, 12.0, 6.0, 8.0, 9.0, 7.0, 5.0, 4.0, 6.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011241436004638672, -0.00010832585394382477, -0.00010423734784126282, -0.00010014884173870087, -9.606033563613892e-05, -9.197182953357697e-05, -8.788332343101501e-05, -8.379481732845306e-05, -7.970631122589111e-05, -7.561780512332916e-05, -7.152929902076721e-05, -6.744079291820526e-05, -6.335228681564331e-05, -5.926378071308136e-05, -5.517527461051941e-05, -5.108676850795746e-05, -4.699826240539551e-05, -4.290975630283356e-05, -3.8821250200271606e-05, -3.4732744097709656e-05, -3.0644237995147705e-05, -2.6555731892585754e-05, -2.2467225790023804e-05, -1.8378719687461853e-05, -1.4290213584899902e-05, -1.0201707482337952e-05, -6.113201379776001e-06, -2.0246952772140503e-06, 2.0638108253479004e-06, 6.152316927909851e-06, 1.0240823030471802e-05, 1.4329329133033752e-05, 1.8417835235595703e-05, 2.2506341338157654e-05, 2.6594847440719604e-05, 3.0683353543281555e-05, 3.4771859645843506e-05, 3.8860365748405457e-05, 4.294887185096741e-05, 4.703737795352936e-05, 5.112588405609131e-05, 5.521439015865326e-05, 5.930289626121521e-05, 6.339140236377716e-05, 6.747990846633911e-05, 7.156841456890106e-05, 7.565692067146301e-05, 7.974542677402496e-05, 8.383393287658691e-05, 8.792243897914886e-05, 9.201094508171082e-05, 9.609945118427277e-05, 0.00010018795728683472, 0.00010427646338939667, 0.00010836496949195862, 0.00011245347559452057, 0.00011654198169708252, 0.00012063048779964447, 0.00012471899390220642, 0.00012880750000476837, 0.00013289600610733032, 0.00013698451220989227, 0.00014107301831245422, 0.00014516152441501617, 0.00014925003051757812]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 8.0, 5.0, 8.0, 22.0, 13.0, 13.0, 29.0, 49.0, 71.0, 118.0, 175.0, 362.0, 643.0, 1486.0, 3463.0, 8817.0, 22732.0, 56650.0, 165612.0, 387988.0, 259483.0, 85760.0, 32857.0, 12974.0, 5247.0, 2047.0, 867.0, 409.0, 230.0, 140.0, 75.0, 68.0, 38.0, 28.0, 20.0, 16.0, 12.0, 6.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.783203125, -0.7606353759765625, -0.738067626953125, -0.7154998779296875, -0.69293212890625, -0.6703643798828125, -0.647796630859375, -0.6252288818359375, -0.6026611328125, -0.5800933837890625, -0.557525634765625, -0.5349578857421875, -0.51239013671875, -0.4898223876953125, -0.467254638671875, -0.4446868896484375, -0.422119140625, -0.3995513916015625, -0.376983642578125, -0.3544158935546875, -0.33184814453125, -0.3092803955078125, -0.286712646484375, -0.2641448974609375, -0.2415771484375, -0.2190093994140625, -0.196441650390625, -0.1738739013671875, -0.15130615234375, -0.1287384033203125, -0.106170654296875, -0.0836029052734375, -0.06103515625, -0.0384674072265625, -0.015899658203125, 0.0066680908203125, 0.02923583984375, 0.0518035888671875, 0.074371337890625, 0.0969390869140625, 0.1195068359375, 0.1420745849609375, 0.164642333984375, 0.1872100830078125, 0.20977783203125, 0.2323455810546875, 0.254913330078125, 0.2774810791015625, 0.300048828125, 0.3226165771484375, 0.345184326171875, 0.3677520751953125, 0.39031982421875, 0.4128875732421875, 0.435455322265625, 0.4580230712890625, 0.4805908203125, 0.5031585693359375, 0.525726318359375, 0.5482940673828125, 0.57086181640625, 0.5934295654296875, 0.615997314453125, 0.6385650634765625, 0.6611328125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 1.0, 8.0, 6.0, 4.0, 10.0, 8.0, 10.0, 7.0, 9.0, 17.0, 30.0, 20.0, 26.0, 32.0, 29.0, 49.0, 50.0, 57.0, 52.0, 53.0, 48.0, 65.0, 47.0, 57.0, 35.0, 37.0, 39.0, 22.0, 28.0, 26.0, 24.0, 13.0, 10.0, 8.0, 10.0, 9.0, 3.0, 4.0, 3.0, 3.0, 7.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.390625, -0.37801361083984375, -0.3654022216796875, -0.35279083251953125, -0.340179443359375, -0.32756805419921875, -0.3149566650390625, -0.30234527587890625, -0.28973388671875, -0.27712249755859375, -0.2645111083984375, -0.25189971923828125, -0.239288330078125, -0.22667694091796875, -0.2140655517578125, -0.20145416259765625, -0.1888427734375, -0.17623138427734375, -0.1636199951171875, -0.15100860595703125, -0.138397216796875, -0.12578582763671875, -0.1131744384765625, -0.10056304931640625, -0.08795166015625, -0.07534027099609375, -0.0627288818359375, -0.05011749267578125, -0.037506103515625, -0.02489471435546875, -0.0122833251953125, 0.00032806396484375, 0.012939453125, 0.02555084228515625, 0.0381622314453125, 0.05077362060546875, 0.063385009765625, 0.07599639892578125, 0.0886077880859375, 0.10121917724609375, 0.11383056640625, 0.12644195556640625, 0.1390533447265625, 0.15166473388671875, 0.164276123046875, 0.17688751220703125, 0.1894989013671875, 0.20211029052734375, 0.2147216796875, 0.22733306884765625, 0.2399444580078125, 0.25255584716796875, 0.265167236328125, 0.27777862548828125, 0.2903900146484375, 0.30300140380859375, 0.31561279296875, 0.32822418212890625, 0.3408355712890625, 0.35344696044921875, 0.366058349609375, 0.37866973876953125, 0.3912811279296875, 0.40389251708984375, 0.41650390625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 19.0, 28.0, 62.0, 100.0, 132.0, 156.0, 154.0, 129.0, 91.0, 77.0, 31.0, 10.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.625092506408691, -13.346542358398438, -13.067992210388184, -12.789443016052246, -12.510892868041992, -12.232342720031738, -11.953792572021484, -11.675243377685547, -11.396693229675293, -11.118143081665039, -10.839592933654785, -10.561043739318848, -10.282493591308594, -10.00394344329834, -9.725393295288086, -9.446844100952148, -9.168292999267578, -8.889742851257324, -8.61119270324707, -8.332643508911133, -8.054093360900879, -7.775543212890625, -7.496993064880371, -7.218443393707275, -6.93989372253418, -6.661343574523926, -6.38279390335083, -6.104243755340576, -5.8256940841674805, -5.547143936157227, -5.268593788146973, -4.990044116973877, -4.711493968963623, -4.432943820953369, -4.154394149780273, -3.8758440017700195, -3.597294330596924, -3.31874418258667, -3.040194272994995, -2.7616443634033203, -2.4830944538116455, -2.2045445442199707, -1.925994634628296, -1.6474446058273315, -1.3688946962356567, -1.090344786643982, -0.8117947578430176, -0.5332448482513428, -0.25469493865966797, 0.023855000734329224, 0.3024049401283264, 0.580954909324646, 0.8595048189163208, 1.1380547285079956, 1.41660475730896, 1.6951546669006348, 1.9737045764923096, 2.2522544860839844, 2.530804395675659, 2.809354305267334, 3.087904453277588, 3.3664541244506836, 3.6450042724609375, 3.9235541820526123, 4.202104091644287]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [6.0, 3.0, 3.0, 6.0, 9.0, 4.0, 8.0, 9.0, 11.0, 12.0, 15.0, 10.0, 18.0, 19.0, 22.0, 23.0, 20.0, 27.0, 27.0, 38.0, 33.0, 42.0, 37.0, 39.0, 44.0, 33.0, 46.0, 43.0, 41.0, 33.0, 40.0, 24.0, 46.0, 35.0, 30.0, 20.0, 14.0, 24.0, 22.0, 15.0, 9.0, 11.0, 12.0, 10.0, 10.0, 7.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.842925548553467, -2.7322440147399902, -2.6215627193450928, -2.510881185531616, -2.4001998901367188, -2.289518356323242, -2.1788370609283447, -2.068155527114868, -1.9574742317199707, -1.8467928171157837, -1.7361114025115967, -1.6254299879074097, -1.5147485733032227, -1.404067039489746, -1.2933857440948486, -1.182704210281372, -1.072022795677185, -0.961341381072998, -0.850659966468811, -0.739978551864624, -0.629297137260437, -0.5186156630516052, -0.4079342484474182, -0.2972528338432312, -0.1865714192390442, -0.07588999718427658, 0.03479142487049103, 0.14547285437583923, 0.25615426898002625, 0.36683571338653564, 0.47751712799072266, 0.5881985425949097, 0.6988799571990967, 0.8095613718032837, 0.9202427864074707, 1.0309242010116577, 1.1416056156158447, 1.2522871494293213, 1.3629684448242188, 1.4736499786376953, 1.5843312740325928, 1.6950126886367798, 1.8056941032409668, 1.9163755178451538, 2.027056932449341, 2.1377384662628174, 2.248419761657715, 2.3591012954711914, 2.469782829284668, 2.5804643630981445, 2.691145658493042, 2.8018271923065186, 2.912508487701416, 3.0231900215148926, 3.13387131690979, 3.2445528507232666, 3.355234146118164, 3.4659156799316406, 3.576596975326538, 3.6872785091400146, 3.797959804534912, 3.9086413383483887, 4.019322872161865, 4.130003929138184, 4.24068546295166]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 11.0, 20.0, 31.0, 44.0, 52.0, 96.0, 162.0, 215.0, 417.0, 700.0, 1180.0, 2280.0, 4204.0, 8309.0, 18499.0, 44252.0, 119965.0, 356123.0, 1013237.0, 1497211.0, 732351.0, 248160.0, 85620.0, 32883.0, 14132.0, 6721.0, 3285.0, 1703.0, 955.0, 569.0, 329.0, 231.0, 107.0, 76.0, 45.0, 33.0, 22.0, 19.0, 12.0, 4.0, 8.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68603515625, -0.6648178100585938, -0.6436004638671875, -0.6223831176757812, -0.601165771484375, -0.5799484252929688, -0.5587310791015625, -0.5375137329101562, -0.51629638671875, -0.49507904052734375, -0.4738616943359375, -0.45264434814453125, -0.431427001953125, -0.41020965576171875, -0.3889923095703125, -0.36777496337890625, -0.3465576171875, -0.32534027099609375, -0.3041229248046875, -0.28290557861328125, -0.261688232421875, -0.24047088623046875, -0.2192535400390625, -0.19803619384765625, -0.17681884765625, -0.15560150146484375, -0.1343841552734375, -0.11316680908203125, -0.091949462890625, -0.07073211669921875, -0.0495147705078125, -0.02829742431640625, -0.007080078125, 0.01413726806640625, 0.0353546142578125, 0.05657196044921875, 0.077789306640625, 0.09900665283203125, 0.1202239990234375, 0.14144134521484375, 0.16265869140625, 0.18387603759765625, 0.2050933837890625, 0.22631072998046875, 0.247528076171875, 0.26874542236328125, 0.2899627685546875, 0.31118011474609375, 0.3323974609375, 0.35361480712890625, 0.3748321533203125, 0.39604949951171875, 0.417266845703125, 0.43848419189453125, 0.4597015380859375, 0.48091888427734375, 0.50213623046875, 0.5233535766601562, 0.5445709228515625, 0.5657882690429688, 0.587005615234375, 0.6082229614257812, 0.6294403076171875, 0.6506576538085938, 0.671875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 4.0, 6.0, 5.0, 12.0, 6.0, 7.0, 14.0, 19.0, 17.0, 22.0, 30.0, 32.0, 31.0, 35.0, 33.0, 46.0, 44.0, 46.0, 38.0, 31.0, 46.0, 45.0, 43.0, 41.0, 43.0, 26.0, 33.0, 25.0, 43.0, 35.0, 29.0, 22.0, 22.0, 14.0, 15.0, 13.0, 5.0, 6.0, 3.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.556640625, -0.5411872863769531, -0.5257339477539062, -0.5102806091308594, -0.4948272705078125, -0.4793739318847656, -0.46392059326171875, -0.4484672546386719, -0.433013916015625, -0.4175605773925781, -0.40210723876953125, -0.3866539001464844, -0.3712005615234375, -0.3557472229003906, -0.34029388427734375, -0.3248405456542969, -0.30938720703125, -0.2939338684082031, -0.27848052978515625, -0.2630271911621094, -0.2475738525390625, -0.23212051391601562, -0.21666717529296875, -0.20121383666992188, -0.185760498046875, -0.17030715942382812, -0.15485382080078125, -0.13940048217773438, -0.1239471435546875, -0.10849380493164062, -0.09304046630859375, -0.07758712768554688, -0.0621337890625, -0.046680450439453125, -0.03122711181640625, -0.015773773193359375, -0.0003204345703125, 0.015132904052734375, 0.03058624267578125, 0.046039581298828125, 0.061492919921875, 0.07694625854492188, 0.09239959716796875, 0.10785293579101562, 0.1233062744140625, 0.13875961303710938, 0.15421295166015625, 0.16966629028320312, 0.18511962890625, 0.20057296752929688, 0.21602630615234375, 0.23147964477539062, 0.2469329833984375, 0.2623863220214844, 0.27783966064453125, 0.2932929992675781, 0.308746337890625, 0.3241996765136719, 0.33965301513671875, 0.3551063537597656, 0.3705596923828125, 0.3860130310058594, 0.40146636962890625, 0.4169197082519531, 0.432373046875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 6.0, 6.0, 0.0, 4.0, 8.0, 7.0, 19.0, 21.0, 30.0, 56.0, 78.0, 132.0, 185.0, 361.0, 643.0, 1065.0, 2204.0, 4867.0, 11366.0, 29441.0, 85523.0, 260202.0, 760911.0, 1536126.0, 975237.0, 347072.0, 113937.0, 38790.0, 14473.0, 5834.0, 2614.0, 1320.0, 716.0, 416.0, 238.0, 122.0, 90.0, 51.0, 37.0, 30.0, 14.0, 16.0, 5.0, 6.0, 6.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76708984375, -0.7393264770507812, -0.7115631103515625, -0.6837997436523438, -0.656036376953125, -0.6282730102539062, -0.6005096435546875, -0.5727462768554688, -0.54498291015625, -0.5172195434570312, -0.4894561767578125, -0.46169281005859375, -0.433929443359375, -0.40616607666015625, -0.3784027099609375, -0.35063934326171875, -0.3228759765625, -0.29511260986328125, -0.2673492431640625, -0.23958587646484375, -0.211822509765625, -0.18405914306640625, -0.1562957763671875, -0.12853240966796875, -0.10076904296875, -0.07300567626953125, -0.0452423095703125, -0.01747894287109375, 0.010284423828125, 0.03804779052734375, 0.0658111572265625, 0.09357452392578125, 0.121337890625, 0.14910125732421875, 0.1768646240234375, 0.20462799072265625, 0.232391357421875, 0.26015472412109375, 0.2879180908203125, 0.31568145751953125, 0.34344482421875, 0.37120819091796875, 0.3989715576171875, 0.42673492431640625, 0.454498291015625, 0.48226165771484375, 0.5100250244140625, 0.5377883911132812, 0.5655517578125, 0.5933151245117188, 0.6210784912109375, 0.6488418579101562, 0.676605224609375, 0.7043685913085938, 0.7321319580078125, 0.7598953247070312, 0.78765869140625, 0.8154220581054688, 0.8431854248046875, 0.8709487915039062, 0.898712158203125, 0.9264755249023438, 0.9542388916015625, 0.9820022583007812, 1.009765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 8.0, 9.0, 20.0, 27.0, 35.0, 63.0, 78.0, 110.0, 182.0, 182.0, 282.0, 366.0, 431.0, 469.0, 441.0, 355.0, 285.0, 204.0, 157.0, 117.0, 62.0, 56.0, 38.0, 27.0, 24.0, 14.0, 11.0, 1.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.3916015625, -1.358001708984375, -1.32440185546875, -1.290802001953125, -1.2572021484375, -1.223602294921875, -1.19000244140625, -1.156402587890625, -1.122802734375, -1.089202880859375, -1.05560302734375, -1.022003173828125, -0.9884033203125, -0.954803466796875, -0.92120361328125, -0.887603759765625, -0.85400390625, -0.820404052734375, -0.78680419921875, -0.753204345703125, -0.7196044921875, -0.686004638671875, -0.65240478515625, -0.618804931640625, -0.585205078125, -0.551605224609375, -0.51800537109375, -0.484405517578125, -0.4508056640625, -0.417205810546875, -0.38360595703125, -0.350006103515625, -0.31640625, -0.282806396484375, -0.24920654296875, -0.215606689453125, -0.1820068359375, -0.148406982421875, -0.11480712890625, -0.081207275390625, -0.047607421875, -0.014007568359375, 0.01959228515625, 0.053192138671875, 0.0867919921875, 0.120391845703125, 0.15399169921875, 0.187591552734375, 0.22119140625, 0.254791259765625, 0.28839111328125, 0.321990966796875, 0.3555908203125, 0.389190673828125, 0.42279052734375, 0.456390380859375, 0.489990234375, 0.523590087890625, 0.55718994140625, 0.590789794921875, 0.6243896484375, 0.657989501953125, 0.69158935546875, 0.725189208984375, 0.7587890625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 5.0, 10.0, 9.0, 12.0, 13.0, 26.0, 42.0, 45.0, 48.0, 62.0, 81.0, 63.0, 78.0, 73.0, 87.0, 82.0, 63.0, 43.0, 38.0, 34.0, 30.0, 20.0, 15.0, 11.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5292301177978516, -3.3889148235321045, -3.2485992908477783, -3.1082839965820312, -2.967968702316284, -2.827653408050537, -2.687337875366211, -2.547022581100464, -2.406707286834717, -2.2663919925689697, -2.1260764598846436, -1.9857611656188965, -1.8454458713531494, -1.7051304578781128, -1.5648150444030762, -1.424499750137329, -1.284184217453003, -1.1438688039779663, -1.0035535097122192, -0.8632380962371826, -0.7229227423667908, -0.5826073884963989, -0.4422919750213623, -0.30197662115097046, -0.1616612672805786, -0.021345898509025574, 0.11896947026252747, 0.2592848539352417, 0.39960020780563354, 0.5399155616760254, 0.680230975151062, 0.8205463290214539, 0.9608616828918457, 1.1011770963668823, 1.2414923906326294, 1.381807804107666, 1.522123098373413, 1.6624385118484497, 1.8027539253234863, 1.9430692195892334, 2.0833845138549805, 2.2236998081207275, 2.3640153408050537, 2.504330635070801, 2.644645929336548, 2.784961223602295, 2.925276756286621, 3.065592050552368, 3.2059075832366943, 3.3462228775024414, 3.4865384101867676, 3.6268537044525146, 3.7671689987182617, 3.907484531402588, 4.047800064086914, 4.188115119934082, 4.328430652618408, 4.468746185302734, 4.609061241149902, 4.7493767738342285, 4.889692306518555, 5.030007362365723, 5.170322895050049, 5.310638427734375, 5.450953483581543]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 1.0, 7.0, 5.0, 12.0, 8.0, 18.0, 20.0, 22.0, 21.0, 22.0, 23.0, 29.0, 34.0, 31.0, 33.0, 37.0, 35.0, 40.0, 47.0, 47.0, 51.0, 39.0, 46.0, 38.0, 45.0, 33.0, 23.0, 22.0, 36.0, 25.0, 18.0, 17.0, 24.0, 21.0, 8.0, 10.0, 14.0, 13.0, 9.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.71490216255188, -3.6149706840515137, -3.5150389671325684, -3.415107488632202, -3.315176010131836, -3.2152445316314697, -3.1153130531311035, -3.015381336212158, -2.915449857711792, -2.815518379211426, -2.7155866622924805, -2.6156551837921143, -2.515723705291748, -2.415792226791382, -2.3158607482910156, -2.2159290313720703, -2.115997552871704, -2.016066074371338, -1.9161344766616821, -1.8162028789520264, -1.7162714004516602, -1.616339921951294, -1.5164083242416382, -1.4164767265319824, -1.3165452480316162, -1.21661376953125, -1.1166821718215942, -1.0167505741119385, -0.9168190956115723, -0.8168875575065613, -0.7169560194015503, -0.6170244812965393, -0.5170927047729492, -0.41716116666793823, -0.31722962856292725, -0.21729809045791626, -0.11736655235290527, -0.017435014247894287, 0.0824965238571167, 0.18242806196212769, 0.28235960006713867, 0.38229113817214966, 0.48222267627716064, 0.5821542143821716, 0.6820857524871826, 0.7820172905921936, 0.8819488286972046, 0.9818803668022156, 1.0818119049072266, 1.1817433834075928, 1.2816749811172485, 1.3816065788269043, 1.4815380573272705, 1.5814695358276367, 1.6814011335372925, 1.7813327312469482, 1.8812642097473145, 1.9811956882476807, 2.081127166748047, 2.181058883666992, 2.2809903621673584, 2.3809218406677246, 2.48085355758667, 2.580785036087036, 2.6807165145874023]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 6.0, 5.0, 10.0, 14.0, 19.0, 40.0, 55.0, 81.0, 159.0, 277.0, 503.0, 891.0, 1618.0, 3078.0, 5674.0, 10667.0, 19712.0, 36696.0, 68105.0, 125655.0, 202574.0, 224128.0, 156983.0, 88866.0, 47493.0, 25410.0, 13501.0, 7454.0, 4041.0, 2135.0, 1167.0, 661.0, 359.0, 234.0, 121.0, 65.0, 36.0, 28.0, 14.0, 6.0, 8.0, 5.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2255859375, -1.18975830078125, -1.1539306640625, -1.11810302734375, -1.082275390625, -1.04644775390625, -1.0106201171875, -0.97479248046875, -0.93896484375, -0.90313720703125, -0.8673095703125, -0.83148193359375, -0.795654296875, -0.75982666015625, -0.7239990234375, -0.68817138671875, -0.65234375, -0.61651611328125, -0.5806884765625, -0.54486083984375, -0.509033203125, -0.47320556640625, -0.4373779296875, -0.40155029296875, -0.36572265625, -0.32989501953125, -0.2940673828125, -0.25823974609375, -0.222412109375, -0.18658447265625, -0.1507568359375, -0.11492919921875, -0.0791015625, -0.04327392578125, -0.0074462890625, 0.02838134765625, 0.064208984375, 0.10003662109375, 0.1358642578125, 0.17169189453125, 0.20751953125, 0.24334716796875, 0.2791748046875, 0.31500244140625, 0.350830078125, 0.38665771484375, 0.4224853515625, 0.45831298828125, 0.494140625, 0.52996826171875, 0.5657958984375, 0.60162353515625, 0.637451171875, 0.67327880859375, 0.7091064453125, 0.74493408203125, 0.78076171875, 0.81658935546875, 0.8524169921875, 0.88824462890625, 0.924072265625, 0.95989990234375, 0.9957275390625, 1.03155517578125, 1.0673828125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 9.0, 7.0, 11.0, 15.0, 9.0, 8.0, 13.0, 25.0, 25.0, 22.0, 29.0, 24.0, 28.0, 33.0, 40.0, 36.0, 39.0, 28.0, 44.0, 37.0, 25.0, 35.0, 38.0, 33.0, 38.0, 39.0, 36.0, 33.0, 32.0, 25.0, 14.0, 21.0, 23.0, 21.0, 12.0, 20.0, 13.0, 12.0, 7.0, 11.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.421630859375, -0.408111572265625, -0.39459228515625, -0.381072998046875, -0.3675537109375, -0.354034423828125, -0.34051513671875, -0.326995849609375, -0.3134765625, -0.299957275390625, -0.28643798828125, -0.272918701171875, -0.2593994140625, -0.245880126953125, -0.23236083984375, -0.218841552734375, -0.205322265625, -0.191802978515625, -0.17828369140625, -0.164764404296875, -0.1512451171875, -0.137725830078125, -0.12420654296875, -0.110687255859375, -0.09716796875, -0.083648681640625, -0.07012939453125, -0.056610107421875, -0.0430908203125, -0.029571533203125, -0.01605224609375, -0.002532958984375, 0.010986328125, 0.024505615234375, 0.03802490234375, 0.051544189453125, 0.0650634765625, 0.078582763671875, 0.09210205078125, 0.105621337890625, 0.119140625, 0.132659912109375, 0.14617919921875, 0.159698486328125, 0.1732177734375, 0.186737060546875, 0.20025634765625, 0.213775634765625, 0.227294921875, 0.240814208984375, 0.25433349609375, 0.267852783203125, 0.2813720703125, 0.294891357421875, 0.30841064453125, 0.321929931640625, 0.33544921875, 0.348968505859375, 0.36248779296875, 0.376007080078125, 0.3895263671875, 0.403045654296875, 0.41656494140625, 0.430084228515625, 0.443603515625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 17.0, 15.0, 19.0, 29.0, 54.0, 69.0, 80.0, 132.0, 233.0, 494.0, 1238.0, 2939.0, 8023.0, 22900.0, 68065.0, 202044.0, 378916.0, 237223.0, 82185.0, 27829.0, 9848.0, 3547.0, 1319.0, 563.0, 273.0, 135.0, 111.0, 59.0, 41.0, 35.0, 17.0, 21.0, 13.0, 13.0, 9.0, 9.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8056640625, -1.7466278076171875, -1.687591552734375, -1.6285552978515625, -1.56951904296875, -1.5104827880859375, -1.451446533203125, -1.3924102783203125, -1.3333740234375, -1.2743377685546875, -1.215301513671875, -1.1562652587890625, -1.09722900390625, -1.0381927490234375, -0.979156494140625, -0.9201202392578125, -0.861083984375, -0.8020477294921875, -0.743011474609375, -0.6839752197265625, -0.62493896484375, -0.5659027099609375, -0.506866455078125, -0.4478302001953125, -0.3887939453125, -0.3297576904296875, -0.270721435546875, -0.2116851806640625, -0.15264892578125, -0.0936126708984375, -0.034576416015625, 0.0244598388671875, 0.08349609375, 0.1425323486328125, 0.201568603515625, 0.2606048583984375, 0.31964111328125, 0.3786773681640625, 0.437713623046875, 0.4967498779296875, 0.5557861328125, 0.6148223876953125, 0.673858642578125, 0.7328948974609375, 0.79193115234375, 0.8509674072265625, 0.910003662109375, 0.9690399169921875, 1.028076171875, 1.0871124267578125, 1.146148681640625, 1.2051849365234375, 1.26422119140625, 1.3232574462890625, 1.382293701171875, 1.4413299560546875, 1.5003662109375, 1.5594024658203125, 1.618438720703125, 1.6774749755859375, 1.73651123046875, 1.7955474853515625, 1.854583740234375, 1.9136199951171875, 1.97265625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 10.0, 12.0, 9.0, 15.0, 15.0, 14.0, 22.0, 32.0, 25.0, 36.0, 27.0, 33.0, 57.0, 56.0, 46.0, 50.0, 52.0, 53.0, 49.0, 46.0, 45.0, 49.0, 49.0, 29.0, 26.0, 25.0, 23.0, 21.0, 10.0, 15.0, 12.0, 6.0, 6.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.09765625, -2.0387725830078125, -1.979888916015625, -1.9210052490234375, -1.86212158203125, -1.8032379150390625, -1.744354248046875, -1.6854705810546875, -1.6265869140625, -1.5677032470703125, -1.508819580078125, -1.4499359130859375, -1.39105224609375, -1.3321685791015625, -1.273284912109375, -1.2144012451171875, -1.155517578125, -1.0966339111328125, -1.037750244140625, -0.9788665771484375, -0.91998291015625, -0.8610992431640625, -0.802215576171875, -0.7433319091796875, -0.6844482421875, -0.6255645751953125, -0.566680908203125, -0.5077972412109375, -0.44891357421875, -0.3900299072265625, -0.331146240234375, -0.2722625732421875, -0.21337890625, -0.1544952392578125, -0.095611572265625, -0.0367279052734375, 0.02215576171875, 0.0810394287109375, 0.139923095703125, 0.1988067626953125, 0.2576904296875, 0.3165740966796875, 0.375457763671875, 0.4343414306640625, 0.49322509765625, 0.5521087646484375, 0.610992431640625, 0.6698760986328125, 0.728759765625, 0.7876434326171875, 0.846527099609375, 0.9054107666015625, 0.96429443359375, 1.0231781005859375, 1.082061767578125, 1.1409454345703125, 1.1998291015625, 1.2587127685546875, 1.317596435546875, 1.3764801025390625, 1.43536376953125, 1.4942474365234375, 1.553131103515625, 1.6120147705078125, 1.6708984375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 8.0, 18.0, 23.0, 37.0, 60.0, 86.0, 174.0, 292.0, 538.0, 911.0, 1593.0, 2896.0, 5369.0, 9790.0, 18123.0, 32791.0, 57490.0, 97885.0, 153271.0, 195066.0, 178608.0, 123067.0, 74319.0, 43213.0, 23795.0, 13125.0, 7255.0, 3947.0, 2106.0, 1157.0, 647.0, 352.0, 223.0, 119.0, 74.0, 51.0, 29.0, 21.0, 7.0, 8.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.5029296875, -0.48708343505859375, -0.4712371826171875, -0.45539093017578125, -0.439544677734375, -0.42369842529296875, -0.4078521728515625, -0.39200592041015625, -0.37615966796875, -0.36031341552734375, -0.3444671630859375, -0.32862091064453125, -0.312774658203125, -0.29692840576171875, -0.2810821533203125, -0.26523590087890625, -0.2493896484375, -0.23354339599609375, -0.2176971435546875, -0.20185089111328125, -0.186004638671875, -0.17015838623046875, -0.1543121337890625, -0.13846588134765625, -0.12261962890625, -0.10677337646484375, -0.0909271240234375, -0.07508087158203125, -0.059234619140625, -0.04338836669921875, -0.0275421142578125, -0.01169586181640625, 0.004150390625, 0.01999664306640625, 0.0358428955078125, 0.05168914794921875, 0.067535400390625, 0.08338165283203125, 0.0992279052734375, 0.11507415771484375, 0.13092041015625, 0.14676666259765625, 0.1626129150390625, 0.17845916748046875, 0.194305419921875, 0.21015167236328125, 0.2259979248046875, 0.24184417724609375, 0.2576904296875, 0.27353668212890625, 0.2893829345703125, 0.30522918701171875, 0.321075439453125, 0.33692169189453125, 0.3527679443359375, 0.36861419677734375, 0.38446044921875, 0.40030670166015625, 0.4161529541015625, 0.43199920654296875, 0.447845458984375, 0.46369171142578125, 0.4795379638671875, 0.49538421630859375, 0.51123046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 7.0, 5.0, 7.0, 5.0, 6.0, 6.0, 11.0, 10.0, 15.0, 20.0, 26.0, 24.0, 32.0, 32.0, 54.0, 60.0, 83.0, 78.0, 76.0, 78.0, 56.0, 55.0, 51.0, 43.0, 38.0, 37.0, 15.0, 21.0, 11.0, 12.0, 10.0, 6.0, 5.0, 4.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000133514404296875, -0.00012909993529319763, -0.00012468546628952026, -0.0001202709972858429, -0.00011585652828216553, -0.00011144205927848816, -0.00010702759027481079, -0.00010261312127113342, -9.819865226745605e-05, -9.378418326377869e-05, -8.936971426010132e-05, -8.495524525642395e-05, -8.054077625274658e-05, -7.612630724906921e-05, -7.171183824539185e-05, -6.729736924171448e-05, -6.288290023803711e-05, -5.846843123435974e-05, -5.405396223068237e-05, -4.9639493227005005e-05, -4.522502422332764e-05, -4.081055521965027e-05, -3.63960862159729e-05, -3.198161721229553e-05, -2.7567148208618164e-05, -2.3152679204940796e-05, -1.8738210201263428e-05, -1.432374119758606e-05, -9.909272193908691e-06, -5.494803190231323e-06, -1.080334186553955e-06, 3.334134817123413e-06, 7.748603820800781e-06, 1.216307282447815e-05, 1.6577541828155518e-05, 2.0992010831832886e-05, 2.5406479835510254e-05, 2.9820948839187622e-05, 3.423541784286499e-05, 3.864988684654236e-05, 4.3064355850219727e-05, 4.7478824853897095e-05, 5.189329385757446e-05, 5.630776286125183e-05, 6.07222318649292e-05, 6.513670086860657e-05, 6.955116987228394e-05, 7.39656388759613e-05, 7.838010787963867e-05, 8.279457688331604e-05, 8.720904588699341e-05, 9.162351489067078e-05, 9.603798389434814e-05, 0.00010045245289802551, 0.00010486692190170288, 0.00010928139090538025, 0.00011369585990905762, 0.00011811032891273499, 0.00012252479791641235, 0.00012693926692008972, 0.0001313537359237671, 0.00013576820492744446, 0.00014018267393112183, 0.0001445971429347992, 0.00014901161193847656]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 7.0, 8.0, 13.0, 23.0, 35.0, 45.0, 69.0, 138.0, 181.0, 353.0, 760.0, 1584.0, 3654.0, 9127.0, 22346.0, 53636.0, 120577.0, 232570.0, 278542.0, 178788.0, 84670.0, 35920.0, 14949.0, 5882.0, 2381.0, 1053.0, 537.0, 265.0, 165.0, 86.0, 62.0, 31.0, 19.0, 16.0, 12.0, 16.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.681640625, -0.6598434448242188, -0.6380462646484375, -0.6162490844726562, -0.594451904296875, -0.5726547241210938, -0.5508575439453125, -0.5290603637695312, -0.50726318359375, -0.48546600341796875, -0.4636688232421875, -0.44187164306640625, -0.420074462890625, -0.39827728271484375, -0.3764801025390625, -0.35468292236328125, -0.3328857421875, -0.31108856201171875, -0.2892913818359375, -0.26749420166015625, -0.245697021484375, -0.22389984130859375, -0.2021026611328125, -0.18030548095703125, -0.15850830078125, -0.13671112060546875, -0.1149139404296875, -0.09311676025390625, -0.071319580078125, -0.04952239990234375, -0.0277252197265625, -0.00592803955078125, 0.015869140625, 0.03766632080078125, 0.0594635009765625, 0.08126068115234375, 0.103057861328125, 0.12485504150390625, 0.1466522216796875, 0.16844940185546875, 0.19024658203125, 0.21204376220703125, 0.2338409423828125, 0.25563812255859375, 0.277435302734375, 0.29923248291015625, 0.3210296630859375, 0.34282684326171875, 0.3646240234375, 0.38642120361328125, 0.4082183837890625, 0.43001556396484375, 0.451812744140625, 0.47360992431640625, 0.4954071044921875, 0.5172042846679688, 0.53900146484375, 0.5607986450195312, 0.5825958251953125, 0.6043930053710938, 0.626190185546875, 0.6479873657226562, 0.6697845458984375, 0.6915817260742188, 0.71337890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 7.0, 7.0, 7.0, 14.0, 15.0, 18.0, 37.0, 28.0, 25.0, 47.0, 57.0, 52.0, 60.0, 80.0, 71.0, 63.0, 69.0, 58.0, 55.0, 48.0, 34.0, 28.0, 23.0, 23.0, 20.0, 14.0, 12.0, 7.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51416015625, -0.4940032958984375, -0.473846435546875, -0.4536895751953125, -0.43353271484375, -0.4133758544921875, -0.393218994140625, -0.3730621337890625, -0.3529052734375, -0.3327484130859375, -0.312591552734375, -0.2924346923828125, -0.27227783203125, -0.2521209716796875, -0.231964111328125, -0.2118072509765625, -0.191650390625, -0.1714935302734375, -0.151336669921875, -0.1311798095703125, -0.11102294921875, -0.0908660888671875, -0.070709228515625, -0.0505523681640625, -0.0303955078125, -0.0102386474609375, 0.009918212890625, 0.0300750732421875, 0.05023193359375, 0.0703887939453125, 0.090545654296875, 0.1107025146484375, 0.130859375, 0.1510162353515625, 0.171173095703125, 0.1913299560546875, 0.21148681640625, 0.2316436767578125, 0.251800537109375, 0.2719573974609375, 0.2921142578125, 0.3122711181640625, 0.332427978515625, 0.3525848388671875, 0.37274169921875, 0.3928985595703125, 0.413055419921875, 0.4332122802734375, 0.453369140625, 0.4735260009765625, 0.493682861328125, 0.5138397216796875, 0.53399658203125, 0.5541534423828125, 0.574310302734375, 0.5944671630859375, 0.6146240234375, 0.6347808837890625, 0.654937744140625, 0.6750946044921875, 0.69525146484375, 0.7154083251953125, 0.735565185546875, 0.7557220458984375, 0.77587890625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 7.0, 8.0, 24.0, 36.0, 53.0, 52.0, 73.0, 105.0, 116.0, 107.0, 115.0, 87.0, 78.0, 54.0, 35.0, 22.0, 14.0, 11.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.66262674331665, -5.426645755767822, -5.190664768218994, -4.954683303833008, -4.71870231628418, -4.482721328735352, -4.246740341186523, -4.010759353637695, -3.774778127670288, -3.53879714012146, -3.3028159141540527, -3.0668349266052246, -2.8308539390563965, -2.5948727130889893, -2.358891725540161, -2.122910499572754, -1.8869295120239258, -1.650948405265808, -1.4149672985076904, -1.1789863109588623, -0.9430052042007446, -0.707024097442627, -0.47104310989379883, -0.23506200313568115, 0.0009191036224365234, 0.2369001805782318, 0.4728812575340271, 0.7088623046875, 0.9448434114456177, 1.1808245182037354, 1.4168055057525635, 1.6527866125106812, 1.888768196105957, 2.124749183654785, 2.3607304096221924, 2.5967113971710205, 2.8326926231384277, 3.068673610687256, 3.304654598236084, 3.540635585784912, 3.7766168117523193, 4.012598037719727, 4.248579025268555, 4.484560012817383, 4.720541000366211, 4.956521987915039, 5.192502975463867, 5.4284844398498535, 5.664465427398682, 5.90044641494751, 6.136427402496338, 6.372408866882324, 6.608389854431152, 6.8443708419799805, 7.080351829528809, 7.316332817077637, 7.552313804626465, 7.788294792175293, 8.024275779724121, 8.26025676727295, 8.496237754821777, 8.732219696044922, 8.96820068359375, 9.204181671142578, 9.440162658691406]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 7.0, 5.0, 7.0, 17.0, 7.0, 16.0, 18.0, 20.0, 22.0, 27.0, 23.0, 23.0, 25.0, 29.0, 36.0, 33.0, 53.0, 51.0, 41.0, 51.0, 29.0, 35.0, 43.0, 41.0, 30.0, 33.0, 41.0, 23.0, 29.0, 29.0, 25.0, 19.0, 18.0, 14.0, 12.0, 9.0, 5.0, 15.0, 4.0, 5.0, 6.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.800487995147705, -3.6718077659606934, -3.5431272983551025, -3.4144468307495117, -3.2857666015625, -3.1570863723754883, -3.0284059047698975, -2.8997254371643066, -2.771045207977295, -2.642364978790283, -2.5136845111846924, -2.3850040435791016, -2.25632381439209, -2.127643585205078, -1.9989631175994873, -1.870282769203186, -1.7416024208068848, -1.6129220724105835, -1.4842417240142822, -1.355561375617981, -1.2268810272216797, -1.0982006788253784, -0.9695203304290771, -0.8408399820327759, -0.7121596336364746, -0.5834792852401733, -0.45479893684387207, -0.3261185884475708, -0.19743824005126953, -0.06875789165496826, 0.05992245674133301, 0.18860280513763428, 0.31728363037109375, 0.445963978767395, 0.5746443271636963, 0.7033246755599976, 0.8320050239562988, 0.9606853723526001, 1.0893657207489014, 1.2180460691452026, 1.346726417541504, 1.4754067659378052, 1.6040871143341064, 1.7327674627304077, 1.861447811126709, 1.9901281595230103, 2.1188085079193115, 2.2474889755249023, 2.376169204711914, 2.504849433898926, 2.6335299015045166, 2.7622103691101074, 2.890890598297119, 3.019570827484131, 3.1482512950897217, 3.2769317626953125, 3.405611991882324, 3.534292221069336, 3.6629726886749268, 3.7916531562805176, 3.9203333854675293, 4.049013614654541, 4.177694320678711, 4.306374549865723, 4.435054779052734]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 10.0, 7.0, 12.0, 16.0, 17.0, 19.0, 33.0, 47.0, 74.0, 130.0, 246.0, 455.0, 1010.0, 2374.0, 5881.0, 15080.0, 42643.0, 130399.0, 432100.0, 1454178.0, 1462551.0, 443675.0, 133288.0, 44270.0, 15651.0, 5836.0, 2356.0, 998.0, 420.0, 208.0, 100.0, 53.0, 43.0, 29.0, 14.0, 13.0, 15.0, 10.0, 4.0, 4.0, 6.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.0703125, -1.04058837890625, -1.0108642578125, -0.98114013671875, -0.951416015625, -0.92169189453125, -0.8919677734375, -0.86224365234375, -0.83251953125, -0.80279541015625, -0.7730712890625, -0.74334716796875, -0.713623046875, -0.68389892578125, -0.6541748046875, -0.62445068359375, -0.5947265625, -0.56500244140625, -0.5352783203125, -0.50555419921875, -0.475830078125, -0.44610595703125, -0.4163818359375, -0.38665771484375, -0.35693359375, -0.32720947265625, -0.2974853515625, -0.26776123046875, -0.238037109375, -0.20831298828125, -0.1785888671875, -0.14886474609375, -0.119140625, -0.08941650390625, -0.0596923828125, -0.02996826171875, -0.000244140625, 0.02947998046875, 0.0592041015625, 0.08892822265625, 0.11865234375, 0.14837646484375, 0.1781005859375, 0.20782470703125, 0.237548828125, 0.26727294921875, 0.2969970703125, 0.32672119140625, 0.3564453125, 0.38616943359375, 0.4158935546875, 0.44561767578125, 0.475341796875, 0.50506591796875, 0.5347900390625, 0.56451416015625, 0.59423828125, 0.62396240234375, 0.6536865234375, 0.68341064453125, 0.713134765625, 0.74285888671875, 0.7725830078125, 0.80230712890625, 0.83203125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 0.0, 1.0, 4.0, 7.0, 3.0, 9.0, 11.0, 14.0, 5.0, 16.0, 13.0, 27.0, 14.0, 13.0, 19.0, 30.0, 26.0, 38.0, 31.0, 25.0, 43.0, 34.0, 34.0, 36.0, 44.0, 43.0, 41.0, 46.0, 42.0, 42.0, 26.0, 29.0, 27.0, 32.0, 23.0, 21.0, 25.0, 14.0, 19.0, 11.0, 20.0, 6.0, 14.0, 8.0, 6.0, 0.0, 5.0, 0.0, 3.0, 3.0, 2.0, 2.0], "bins": [-0.56982421875, -0.5541801452636719, -0.5385360717773438, -0.5228919982910156, -0.5072479248046875, -0.4916038513183594, -0.47595977783203125, -0.4603157043457031, -0.444671630859375, -0.4290275573730469, -0.41338348388671875, -0.3977394104003906, -0.3820953369140625, -0.3664512634277344, -0.35080718994140625, -0.3351631164550781, -0.31951904296875, -0.3038749694824219, -0.28823089599609375, -0.2725868225097656, -0.2569427490234375, -0.24129867553710938, -0.22565460205078125, -0.21001052856445312, -0.194366455078125, -0.17872238159179688, -0.16307830810546875, -0.14743423461914062, -0.1317901611328125, -0.11614608764648438, -0.10050201416015625, -0.08485794067382812, -0.0692138671875, -0.053569793701171875, -0.03792572021484375, -0.022281646728515625, -0.0066375732421875, 0.009006500244140625, 0.02465057373046875, 0.040294647216796875, 0.055938720703125, 0.07158279418945312, 0.08722686767578125, 0.10287094116210938, 0.1185150146484375, 0.13415908813476562, 0.14980316162109375, 0.16544723510742188, 0.18109130859375, 0.19673538208007812, 0.21237945556640625, 0.22802352905273438, 0.2436676025390625, 0.2593116760253906, 0.27495574951171875, 0.2905998229980469, 0.306243896484375, 0.3218879699707031, 0.33753204345703125, 0.3531761169433594, 0.3688201904296875, 0.3844642639160156, 0.40010833740234375, 0.4157524108886719, 0.431396484375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 10.0, 7.0, 16.0, 29.0, 38.0, 57.0, 76.0, 127.0, 203.0, 321.0, 502.0, 818.0, 1417.0, 2345.0, 4158.0, 7631.0, 14806.0, 29915.0, 64311.0, 142713.0, 322212.0, 710527.0, 1232813.0, 896243.0, 417937.0, 184937.0, 82182.0, 38131.0, 18400.0, 9426.0, 4909.0, 2752.0, 1696.0, 949.0, 599.0, 366.0, 272.0, 179.0, 94.0, 66.0, 23.0, 29.0, 17.0, 11.0, 8.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8876953125, -0.8596572875976562, -0.8316192626953125, -0.8035812377929688, -0.775543212890625, -0.7475051879882812, -0.7194671630859375, -0.6914291381835938, -0.66339111328125, -0.6353530883789062, -0.6073150634765625, -0.5792770385742188, -0.551239013671875, -0.5232009887695312, -0.4951629638671875, -0.46712493896484375, -0.4390869140625, -0.41104888916015625, -0.3830108642578125, -0.35497283935546875, -0.326934814453125, -0.29889678955078125, -0.2708587646484375, -0.24282073974609375, -0.21478271484375, -0.18674468994140625, -0.1587066650390625, -0.13066864013671875, -0.102630615234375, -0.07459259033203125, -0.0465545654296875, -0.01851654052734375, 0.009521484375, 0.03755950927734375, 0.0655975341796875, 0.09363555908203125, 0.121673583984375, 0.14971160888671875, 0.1777496337890625, 0.20578765869140625, 0.23382568359375, 0.26186370849609375, 0.2899017333984375, 0.31793975830078125, 0.345977783203125, 0.37401580810546875, 0.4020538330078125, 0.43009185791015625, 0.4581298828125, 0.48616790771484375, 0.5142059326171875, 0.5422439575195312, 0.570281982421875, 0.5983200073242188, 0.6263580322265625, 0.6543960571289062, 0.68243408203125, 0.7104721069335938, 0.7385101318359375, 0.7665481567382812, 0.794586181640625, 0.8226242065429688, 0.8506622314453125, 0.8787002563476562, 0.90673828125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 5.0, 9.0, 8.0, 7.0, 19.0, 19.0, 19.0, 30.0, 30.0, 46.0, 69.0, 76.0, 99.0, 114.0, 146.0, 204.0, 243.0, 301.0, 369.0, 377.0, 373.0, 332.0, 248.0, 230.0, 162.0, 129.0, 93.0, 70.0, 61.0, 44.0, 32.0, 25.0, 23.0, 12.0, 12.0, 6.0, 10.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.94384765625, -0.9129409790039062, -0.8820343017578125, -0.8511276245117188, -0.820220947265625, -0.7893142700195312, -0.7584075927734375, -0.7275009155273438, -0.69659423828125, -0.6656875610351562, -0.6347808837890625, -0.6038742065429688, -0.572967529296875, -0.5420608520507812, -0.5111541748046875, -0.48024749755859375, -0.4493408203125, -0.41843414306640625, -0.3875274658203125, -0.35662078857421875, -0.325714111328125, -0.29480743408203125, -0.2639007568359375, -0.23299407958984375, -0.20208740234375, -0.17118072509765625, -0.1402740478515625, -0.10936737060546875, -0.078460693359375, -0.04755401611328125, -0.0166473388671875, 0.01425933837890625, 0.045166015625, 0.07607269287109375, 0.1069793701171875, 0.13788604736328125, 0.168792724609375, 0.19969940185546875, 0.2306060791015625, 0.26151275634765625, 0.29241943359375, 0.32332611083984375, 0.3542327880859375, 0.38513946533203125, 0.416046142578125, 0.44695281982421875, 0.4778594970703125, 0.5087661743164062, 0.5396728515625, 0.5705795288085938, 0.6014862060546875, 0.6323928833007812, 0.663299560546875, 0.6942062377929688, 0.7251129150390625, 0.7560195922851562, 0.78692626953125, 0.8178329467773438, 0.8487396240234375, 0.8796463012695312, 0.910552978515625, 0.9414596557617188, 0.9723663330078125, 1.0032730102539062, 1.0341796875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 3.0, 10.0, 13.0, 24.0, 24.0, 53.0, 83.0, 115.0, 115.0, 139.0, 130.0, 98.0, 60.0, 56.0, 41.0, 26.0, 11.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5737380981445312, -3.2795794010162354, -2.9854207038879395, -2.6912622451782227, -2.3971033096313477, -2.102944850921631, -1.808786153793335, -1.514627456665039, -1.2204687595367432, -0.9263100624084473, -0.6321514248847961, -0.337992787361145, -0.04383409023284912, 0.2503246068954468, 0.5444831848144531, 0.838641881942749, 1.132800579071045, 1.4269592761993408, 1.7211179733276367, 2.0152764320373535, 2.3094353675842285, 2.6035938262939453, 2.897752523422241, 3.191911220550537, 3.486069917678833, 3.780228614807129, 4.074387073516846, 4.368546009063721, 4.6627044677734375, 4.9568634033203125, 5.251021862030029, 5.545180320739746, 5.839339256286621, 6.133497714996338, 6.427656650543213, 6.72181510925293, 7.015974044799805, 7.3101325035095215, 7.604290962219238, 7.898449897766113, 8.192608833312988, 8.486767768859863, 8.780925750732422, 9.075084686279297, 9.369243621826172, 9.663402557373047, 9.957560539245605, 10.25171947479248, 10.545877456665039, 10.840036392211914, 11.134194374084473, 11.428353309631348, 11.722512245178223, 12.016671180725098, 12.310829162597656, 12.604988098144531, 12.899147033691406, 13.193305969238281, 13.48746395111084, 13.781622886657715, 14.07578182220459, 14.369940757751465, 14.664098739624023, 14.958257675170898, 15.252416610717773]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 1.0, 2.0, 7.0, 6.0, 10.0, 9.0, 14.0, 17.0, 22.0, 23.0, 23.0, 23.0, 28.0, 43.0, 38.0, 39.0, 46.0, 48.0, 41.0, 52.0, 46.0, 47.0, 71.0, 41.0, 41.0, 48.0, 33.0, 28.0, 19.0, 22.0, 18.0, 16.0, 12.0, 18.0, 18.0, 7.0, 6.0, 4.0, 4.0, 3.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0], "bins": [-5.072872638702393, -4.9396467208862305, -4.806420803070068, -4.673194408416748, -4.539968490600586, -4.406742572784424, -4.273516654968262, -4.1402907371521, -4.0070648193359375, -3.8738389015197754, -3.740612745285034, -3.607386827468872, -3.474160671234131, -3.3409347534179688, -3.2077088356018066, -3.0744829177856445, -2.941256523132324, -2.808030605316162, -2.674804449081421, -2.541578531265259, -2.4083523750305176, -2.2751264572143555, -2.1419005393981934, -2.0086746215820312, -1.87544846534729, -1.7422224283218384, -1.6089963912963867, -1.4757704734802246, -1.342544436454773, -1.2093183994293213, -1.0760924816131592, -0.9428664445877075, -0.8096408843994141, -0.6764148473739624, -0.5431888699531555, -0.40996286273002625, -0.276736855506897, -0.1435108184814453, -0.010284841060638428, 0.12294113636016846, 0.2561671733856201, 0.3893931806087494, 0.5226191878318787, 0.6558451652526855, 0.7890712022781372, 0.9222972393035889, 1.055523157119751, 1.1887491941452026, 1.3219752311706543, 1.455201268196106, 1.5884273052215576, 1.7216532230377197, 1.8548792600631714, 1.988105297088623, 2.121331214904785, 2.2545571327209473, 2.3877832889556885, 2.5210092067718506, 2.654235363006592, 2.787461280822754, 2.920687198638916, 3.0539133548736572, 3.1871392726898193, 3.3203654289245605, 3.4535913467407227]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 8.0, 16.0, 30.0, 50.0, 98.0, 146.0, 248.0, 385.0, 615.0, 1043.0, 1797.0, 2867.0, 4640.0, 7553.0, 12203.0, 19397.0, 32281.0, 55943.0, 103591.0, 181454.0, 227822.0, 171209.0, 95252.0, 51852.0, 30065.0, 18346.0, 11367.0, 7071.0, 4516.0, 2586.0, 1638.0, 956.0, 601.0, 356.0, 213.0, 140.0, 76.0, 49.0, 29.0, 17.0, 8.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75537109375, -0.7278366088867188, -0.7003021240234375, -0.6727676391601562, -0.645233154296875, -0.6176986694335938, -0.5901641845703125, -0.5626296997070312, -0.53509521484375, -0.5075607299804688, -0.4800262451171875, -0.45249176025390625, -0.424957275390625, -0.39742279052734375, -0.3698883056640625, -0.34235382080078125, -0.3148193359375, -0.28728485107421875, -0.2597503662109375, -0.23221588134765625, -0.204681396484375, -0.17714691162109375, -0.1496124267578125, -0.12207794189453125, -0.09454345703125, -0.06700897216796875, -0.0394744873046875, -0.01194000244140625, 0.015594482421875, 0.04312896728515625, 0.0706634521484375, 0.09819793701171875, 0.125732421875, 0.15326690673828125, 0.1808013916015625, 0.20833587646484375, 0.235870361328125, 0.26340484619140625, 0.2909393310546875, 0.31847381591796875, 0.34600830078125, 0.37354278564453125, 0.4010772705078125, 0.42861175537109375, 0.456146240234375, 0.48368072509765625, 0.5112152099609375, 0.5387496948242188, 0.5662841796875, 0.5938186645507812, 0.6213531494140625, 0.6488876342773438, 0.676422119140625, 0.7039566040039062, 0.7314910888671875, 0.7590255737304688, 0.78656005859375, 0.8140945434570312, 0.8416290283203125, 0.8691635131835938, 0.896697998046875, 0.9242324829101562, 0.9517669677734375, 0.9793014526367188, 1.0068359375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 5.0, 7.0, 7.0, 8.0, 8.0, 7.0, 11.0, 10.0, 15.0, 12.0, 14.0, 19.0, 23.0, 19.0, 20.0, 20.0, 26.0, 28.0, 30.0, 27.0, 38.0, 28.0, 46.0, 35.0, 39.0, 34.0, 35.0, 39.0, 35.0, 38.0, 23.0, 28.0, 33.0, 28.0, 26.0, 26.0, 9.0, 18.0, 16.0, 18.0, 17.0, 6.0, 12.0, 11.0, 8.0, 10.0, 7.0, 1.0, 7.0, 2.0, 3.0, 1.0, 3.0], "bins": [-0.4873046875, -0.47342681884765625, -0.4595489501953125, -0.44567108154296875, -0.431793212890625, -0.41791534423828125, -0.4040374755859375, -0.39015960693359375, -0.37628173828125, -0.36240386962890625, -0.3485260009765625, -0.33464813232421875, -0.320770263671875, -0.30689239501953125, -0.2930145263671875, -0.27913665771484375, -0.2652587890625, -0.25138092041015625, -0.2375030517578125, -0.22362518310546875, -0.209747314453125, -0.19586944580078125, -0.1819915771484375, -0.16811370849609375, -0.15423583984375, -0.14035797119140625, -0.1264801025390625, -0.11260223388671875, -0.098724365234375, -0.08484649658203125, -0.0709686279296875, -0.05709075927734375, -0.043212890625, -0.02933502197265625, -0.0154571533203125, -0.00157928466796875, 0.012298583984375, 0.02617645263671875, 0.0400543212890625, 0.05393218994140625, 0.06781005859375, 0.08168792724609375, 0.0955657958984375, 0.10944366455078125, 0.123321533203125, 0.13719940185546875, 0.1510772705078125, 0.16495513916015625, 0.1788330078125, 0.19271087646484375, 0.2065887451171875, 0.22046661376953125, 0.234344482421875, 0.24822235107421875, 0.2621002197265625, 0.27597808837890625, 0.28985595703125, 0.30373382568359375, 0.3176116943359375, 0.33148956298828125, 0.345367431640625, 0.35924530029296875, 0.3731231689453125, 0.38700103759765625, 0.40087890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 4.0, 7.0, 7.0, 10.0, 9.0, 11.0, 18.0, 23.0, 46.0, 30.0, 68.0, 104.0, 174.0, 303.0, 658.0, 1518.0, 3716.0, 10389.0, 31094.0, 100981.0, 398538.0, 366103.0, 90657.0, 28218.0, 9451.0, 3550.0, 1427.0, 655.0, 310.0, 158.0, 95.0, 71.0, 42.0, 33.0, 19.0, 11.0, 11.0, 19.0, 8.0, 2.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9765625, -1.9127197265625, -1.848876953125, -1.7850341796875, -1.72119140625, -1.6573486328125, -1.593505859375, -1.5296630859375, -1.4658203125, -1.4019775390625, -1.338134765625, -1.2742919921875, -1.21044921875, -1.1466064453125, -1.082763671875, -1.0189208984375, -0.955078125, -0.8912353515625, -0.827392578125, -0.7635498046875, -0.69970703125, -0.6358642578125, -0.572021484375, -0.5081787109375, -0.4443359375, -0.3804931640625, -0.316650390625, -0.2528076171875, -0.18896484375, -0.1251220703125, -0.061279296875, 0.0025634765625, 0.06640625, 0.1302490234375, 0.194091796875, 0.2579345703125, 0.32177734375, 0.3856201171875, 0.449462890625, 0.5133056640625, 0.5771484375, 0.6409912109375, 0.704833984375, 0.7686767578125, 0.83251953125, 0.8963623046875, 0.960205078125, 1.0240478515625, 1.087890625, 1.1517333984375, 1.215576171875, 1.2794189453125, 1.34326171875, 1.4071044921875, 1.470947265625, 1.5347900390625, 1.5986328125, 1.6624755859375, 1.726318359375, 1.7901611328125, 1.85400390625, 1.9178466796875, 1.981689453125, 2.0455322265625, 2.109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 8.0, 7.0, 10.0, 14.0, 9.0, 18.0, 19.0, 17.0, 19.0, 25.0, 25.0, 27.0, 34.0, 28.0, 41.0, 34.0, 32.0, 32.0, 49.0, 41.0, 40.0, 52.0, 44.0, 50.0, 34.0, 30.0, 39.0, 31.0, 29.0, 18.0, 24.0, 16.0, 12.0, 30.0, 9.0, 14.0, 8.0, 5.0, 1.0, 4.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0], "bins": [-1.90234375, -1.8513641357421875, -1.800384521484375, -1.7494049072265625, -1.69842529296875, -1.6474456787109375, -1.596466064453125, -1.5454864501953125, -1.4945068359375, -1.4435272216796875, -1.392547607421875, -1.3415679931640625, -1.29058837890625, -1.2396087646484375, -1.188629150390625, -1.1376495361328125, -1.086669921875, -1.0356903076171875, -0.984710693359375, -0.9337310791015625, -0.88275146484375, -0.8317718505859375, -0.780792236328125, -0.7298126220703125, -0.6788330078125, -0.6278533935546875, -0.576873779296875, -0.5258941650390625, -0.47491455078125, -0.4239349365234375, -0.372955322265625, -0.3219757080078125, -0.27099609375, -0.2200164794921875, -0.169036865234375, -0.1180572509765625, -0.06707763671875, -0.0160980224609375, 0.034881591796875, 0.0858612060546875, 0.1368408203125, 0.1878204345703125, 0.238800048828125, 0.2897796630859375, 0.34075927734375, 0.3917388916015625, 0.442718505859375, 0.4936981201171875, 0.544677734375, 0.5956573486328125, 0.646636962890625, 0.6976165771484375, 0.74859619140625, 0.7995758056640625, 0.850555419921875, 0.9015350341796875, 0.9525146484375, 1.0034942626953125, 1.054473876953125, 1.1054534912109375, 1.15643310546875, 1.2074127197265625, 1.258392333984375, 1.3093719482421875, 1.3603515625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 9.0, 11.0, 24.0, 27.0, 49.0, 93.0, 115.0, 219.0, 347.0, 604.0, 1043.0, 1812.0, 3422.0, 6244.0, 11939.0, 23561.0, 50146.0, 130711.0, 351249.0, 287466.0, 97627.0, 40529.0, 19369.0, 10007.0, 5311.0, 2825.0, 1561.0, 939.0, 523.0, 319.0, 185.0, 115.0, 63.0, 36.0, 37.0, 9.0, 5.0, 10.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76171875, -0.7343826293945312, -0.7070465087890625, -0.6797103881835938, -0.652374267578125, -0.6250381469726562, -0.5977020263671875, -0.5703659057617188, -0.54302978515625, -0.5156936645507812, -0.4883575439453125, -0.46102142333984375, -0.433685302734375, -0.40634918212890625, -0.3790130615234375, -0.35167694091796875, -0.3243408203125, -0.29700469970703125, -0.2696685791015625, -0.24233245849609375, -0.214996337890625, -0.18766021728515625, -0.1603240966796875, -0.13298797607421875, -0.10565185546875, -0.07831573486328125, -0.0509796142578125, -0.02364349365234375, 0.003692626953125, 0.03102874755859375, 0.0583648681640625, 0.08570098876953125, 0.113037109375, 0.14037322998046875, 0.1677093505859375, 0.19504547119140625, 0.222381591796875, 0.24971771240234375, 0.2770538330078125, 0.30438995361328125, 0.33172607421875, 0.35906219482421875, 0.3863983154296875, 0.41373443603515625, 0.441070556640625, 0.46840667724609375, 0.4957427978515625, 0.5230789184570312, 0.5504150390625, 0.5777511596679688, 0.6050872802734375, 0.6324234008789062, 0.659759521484375, 0.6870956420898438, 0.7144317626953125, 0.7417678833007812, 0.76910400390625, 0.7964401245117188, 0.8237762451171875, 0.8511123657226562, 0.878448486328125, 0.9057846069335938, 0.9331207275390625, 0.9604568481445312, 0.98779296875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 7.0, 5.0, 8.0, 16.0, 13.0, 15.0, 24.0, 28.0, 53.0, 83.0, 114.0, 165.0, 148.0, 98.0, 61.0, 37.0, 24.0, 18.0, 11.0, 8.0, 12.0, 13.0, 10.0, 6.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002262592315673828, -0.00021934323012828827, -0.00021242722868919373, -0.00020551122725009918, -0.00019859522581100464, -0.0001916792243719101, -0.00018476322293281555, -0.000177847221493721, -0.00017093122005462646, -0.00016401521861553192, -0.00015709921717643738, -0.00015018321573734283, -0.0001432672142982483, -0.00013635121285915375, -0.0001294352114200592, -0.00012251920998096466, -0.00011560320854187012, -0.00010868720710277557, -0.00010177120566368103, -9.485520422458649e-05, -8.793920278549194e-05, -8.10232013463974e-05, -7.410719990730286e-05, -6.719119846820831e-05, -6.027519702911377e-05, -5.3359195590019226e-05, -4.644319415092468e-05, -3.952719271183014e-05, -3.2611191272735596e-05, -2.5695189833641052e-05, -1.877918839454651e-05, -1.1863186955451965e-05, -4.947185516357422e-06, 1.9688159227371216e-06, 8.884817361831665e-06, 1.580081880092621e-05, 2.2716820240020752e-05, 2.9632821679115295e-05, 3.654882311820984e-05, 4.346482455730438e-05, 5.0380825996398926e-05, 5.729682743549347e-05, 6.421282887458801e-05, 7.112883031368256e-05, 7.80448317527771e-05, 8.496083319187164e-05, 9.187683463096619e-05, 9.879283607006073e-05, 0.00010570883750915527, 0.00011262483894824982, 0.00011954084038734436, 0.0001264568418264389, 0.00013337284326553345, 0.000140288844704628, 0.00014720484614372253, 0.00015412084758281708, 0.00016103684902191162, 0.00016795285046100616, 0.0001748688519001007, 0.00018178485333919525, 0.0001887008547782898, 0.00019561685621738434, 0.00020253285765647888, 0.00020944885909557343, 0.00021636486053466797]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 6.0, 10.0, 19.0, 28.0, 50.0, 78.0, 142.0, 241.0, 408.0, 852.0, 1750.0, 3889.0, 8597.0, 21003.0, 54732.0, 185110.0, 488255.0, 190085.0, 55678.0, 21137.0, 8934.0, 3861.0, 1812.0, 824.0, 419.0, 271.0, 128.0, 90.0, 57.0, 28.0, 18.0, 9.0, 11.0, 6.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.064453125, -1.02838134765625, -0.9923095703125, -0.95623779296875, -0.920166015625, -0.88409423828125, -0.8480224609375, -0.81195068359375, -0.77587890625, -0.73980712890625, -0.7037353515625, -0.66766357421875, -0.631591796875, -0.59552001953125, -0.5594482421875, -0.52337646484375, -0.4873046875, -0.45123291015625, -0.4151611328125, -0.37908935546875, -0.343017578125, -0.30694580078125, -0.2708740234375, -0.23480224609375, -0.19873046875, -0.16265869140625, -0.1265869140625, -0.09051513671875, -0.054443359375, -0.01837158203125, 0.0177001953125, 0.05377197265625, 0.08984375, 0.12591552734375, 0.1619873046875, 0.19805908203125, 0.234130859375, 0.27020263671875, 0.3062744140625, 0.34234619140625, 0.37841796875, 0.41448974609375, 0.4505615234375, 0.48663330078125, 0.522705078125, 0.55877685546875, 0.5948486328125, 0.63092041015625, 0.6669921875, 0.70306396484375, 0.7391357421875, 0.77520751953125, 0.811279296875, 0.84735107421875, 0.8834228515625, 0.91949462890625, 0.95556640625, 0.99163818359375, 1.0277099609375, 1.06378173828125, 1.099853515625, 1.13592529296875, 1.1719970703125, 1.20806884765625, 1.244140625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 6.0, 10.0, 8.0, 13.0, 16.0, 27.0, 30.0, 52.0, 73.0, 78.0, 137.0, 132.0, 125.0, 68.0, 62.0, 43.0, 23.0, 23.0, 13.0, 12.0, 14.0, 14.0, 1.0, 6.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1337890625, -1.098663330078125, -1.06353759765625, -1.028411865234375, -0.9932861328125, -0.958160400390625, -0.92303466796875, -0.887908935546875, -0.852783203125, -0.817657470703125, -0.78253173828125, -0.747406005859375, -0.7122802734375, -0.677154541015625, -0.64202880859375, -0.606903076171875, -0.57177734375, -0.536651611328125, -0.50152587890625, -0.466400146484375, -0.4312744140625, -0.396148681640625, -0.36102294921875, -0.325897216796875, -0.290771484375, -0.255645751953125, -0.22052001953125, -0.185394287109375, -0.1502685546875, -0.115142822265625, -0.08001708984375, -0.044891357421875, -0.009765625, 0.025360107421875, 0.06048583984375, 0.095611572265625, 0.1307373046875, 0.165863037109375, 0.20098876953125, 0.236114501953125, 0.271240234375, 0.306365966796875, 0.34149169921875, 0.376617431640625, 0.4117431640625, 0.446868896484375, 0.48199462890625, 0.517120361328125, 0.55224609375, 0.587371826171875, 0.62249755859375, 0.657623291015625, 0.6927490234375, 0.727874755859375, 0.76300048828125, 0.798126220703125, 0.833251953125, 0.868377685546875, 0.90350341796875, 0.938629150390625, 0.9737548828125, 1.008880615234375, 1.04400634765625, 1.079132080078125, 1.1142578125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 30.0, 116.0, 290.0, 337.0, 161.0, 61.0, 9.0, 6.0, 1.0], "bins": [-51.201934814453125, -50.319786071777344, -49.43764114379883, -48.55549240112305, -47.673343658447266, -46.79119873046875, -45.90904998779297, -45.02690124511719, -44.14475631713867, -43.26260757446289, -42.380462646484375, -41.498313903808594, -40.61616516113281, -39.7340202331543, -38.851871490478516, -37.969722747802734, -37.08757781982422, -36.20542907714844, -35.32328414916992, -34.44113540649414, -33.55898666381836, -32.676841735839844, -31.794692993164062, -30.912546157836914, -30.0303955078125, -29.14824867248535, -28.26609992980957, -27.383953094482422, -26.501806259155273, -25.619659423828125, -24.737510681152344, -23.855363845825195, -22.973217010498047, -22.0910701751709, -21.208921432495117, -20.32677459716797, -19.44462776184082, -18.562480926513672, -17.68033218383789, -16.798185348510742, -15.916037559509277, -15.033889770507812, -14.151742935180664, -13.2695951461792, -12.387447357177734, -11.505300521850586, -10.623152732849121, -9.741004943847656, -8.858858108520508, -7.976710796356201, -7.0945634841918945, -6.21241569519043, -5.330268383026123, -4.448121070861816, -3.5659732818603516, -2.683825969696045, -1.8016786575317383, -0.9195312261581421, -0.0373837947845459, 0.8447637557983398, 1.7269110679626465, 2.609058380126953, 3.491206169128418, 4.373353481292725, 5.255500793457031]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 1.0, 7.0, 5.0, 7.0, 15.0, 11.0, 18.0, 14.0, 22.0, 30.0, 27.0, 36.0, 38.0, 41.0, 29.0, 32.0, 60.0, 40.0, 46.0, 49.0, 39.0, 34.0, 44.0, 35.0, 33.0, 39.0, 38.0, 33.0, 42.0, 21.0, 23.0, 15.0, 25.0, 11.0, 13.0, 10.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.403284072875977, -5.234786510467529, -5.066288948059082, -4.897791385650635, -4.7292938232421875, -4.560795783996582, -4.392298698425293, -4.2238006591796875, -4.05530309677124, -3.886805534362793, -3.7183079719543457, -3.5498104095458984, -3.381312608718872, -3.212815046310425, -3.0443174839019775, -2.875819683074951, -2.707322359085083, -2.5388247966766357, -2.3703272342681885, -2.201829433441162, -2.033331871032715, -1.8648343086242676, -1.6963367462158203, -1.5278390645980835, -1.3593415021896362, -1.190843939781189, -1.0223462581634521, -0.8538486957550049, -0.6853510737419128, -0.5168534517288208, -0.34835588932037354, -0.17985820770263672, -0.011360645294189453, 0.1571369618177414, 0.32563456892967224, 0.4941321611404419, 0.6626297831535339, 0.831127405166626, 0.9996249675750732, 1.16812264919281, 1.3366202116012573, 1.5051177740097046, 1.6736154556274414, 1.8421130180358887, 2.010610580444336, 2.179108142852783, 2.3476057052612305, 2.516103506088257, 2.684601068496704, 2.8530986309051514, 3.0215961933135986, 3.190093994140625, 3.3585915565490723, 3.5270891189575195, 3.695586681365967, 3.864084243774414, 4.032581806182861, 4.201079368591309, 4.369576930999756, 4.538074493408203, 4.70657205581665, 4.875069618225098, 5.043567657470703, 5.21206521987915, 5.380562782287598]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 8.0, 4.0, 9.0, 12.0, 18.0, 23.0, 37.0, 38.0, 83.0, 108.0, 201.0, 312.0, 593.0, 1120.0, 2339.0, 4998.0, 10926.0, 25447.0, 64043.0, 170591.0, 485846.0, 1609306.0, 1220142.0, 376882.0, 133499.0, 50493.0, 20748.0, 8669.0, 3914.0, 1834.0, 941.0, 492.0, 236.0, 126.0, 77.0, 57.0, 45.0, 26.0, 15.0, 9.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.1064453125, -1.0756072998046875, -1.044769287109375, -1.0139312744140625, -0.98309326171875, -0.9522552490234375, -0.921417236328125, -0.8905792236328125, -0.8597412109375, -0.8289031982421875, -0.798065185546875, -0.7672271728515625, -0.73638916015625, -0.7055511474609375, -0.674713134765625, -0.6438751220703125, -0.613037109375, -0.5821990966796875, -0.551361083984375, -0.5205230712890625, -0.48968505859375, -0.4588470458984375, -0.428009033203125, -0.3971710205078125, -0.3663330078125, -0.3354949951171875, -0.304656982421875, -0.2738189697265625, -0.24298095703125, -0.2121429443359375, -0.181304931640625, -0.1504669189453125, -0.11962890625, -0.0887908935546875, -0.057952880859375, -0.0271148681640625, 0.00372314453125, 0.0345611572265625, 0.065399169921875, 0.0962371826171875, 0.1270751953125, 0.1579132080078125, 0.188751220703125, 0.2195892333984375, 0.25042724609375, 0.2812652587890625, 0.312103271484375, 0.3429412841796875, 0.373779296875, 0.4046173095703125, 0.435455322265625, 0.4662933349609375, 0.49713134765625, 0.5279693603515625, 0.558807373046875, 0.5896453857421875, 0.6204833984375, 0.6513214111328125, 0.682159423828125, 0.7129974365234375, 0.74383544921875, 0.7746734619140625, 0.805511474609375, 0.8363494873046875, 0.8671875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 12.0, 6.0, 11.0, 5.0, 4.0, 12.0, 13.0, 11.0, 18.0, 13.0, 19.0, 10.0, 18.0, 23.0, 28.0, 16.0, 28.0, 28.0, 26.0, 33.0, 43.0, 28.0, 44.0, 36.0, 48.0, 31.0, 34.0, 28.0, 38.0, 36.0, 36.0, 26.0, 43.0, 13.0, 24.0, 18.0, 21.0, 10.0, 9.0, 15.0, 10.0, 12.0, 14.0, 11.0, 7.0, 9.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.48486328125, -0.46923065185546875, -0.4535980224609375, -0.43796539306640625, -0.422332763671875, -0.40670013427734375, -0.3910675048828125, -0.37543487548828125, -0.35980224609375, -0.34416961669921875, -0.3285369873046875, -0.31290435791015625, -0.297271728515625, -0.28163909912109375, -0.2660064697265625, -0.25037384033203125, -0.2347412109375, -0.21910858154296875, -0.2034759521484375, -0.18784332275390625, -0.172210693359375, -0.15657806396484375, -0.1409454345703125, -0.12531280517578125, -0.10968017578125, -0.09404754638671875, -0.0784149169921875, -0.06278228759765625, -0.047149658203125, -0.03151702880859375, -0.0158843994140625, -0.00025177001953125, 0.015380859375, 0.03101348876953125, 0.0466461181640625, 0.06227874755859375, 0.077911376953125, 0.09354400634765625, 0.1091766357421875, 0.12480926513671875, 0.14044189453125, 0.15607452392578125, 0.1717071533203125, 0.18733978271484375, 0.202972412109375, 0.21860504150390625, 0.2342376708984375, 0.24987030029296875, 0.2655029296875, 0.28113555908203125, 0.2967681884765625, 0.31240081787109375, 0.328033447265625, 0.34366607666015625, 0.3592987060546875, 0.37493133544921875, 0.39056396484375, 0.40619659423828125, 0.4218292236328125, 0.43746185302734375, 0.453094482421875, 0.46872711181640625, 0.4843597412109375, 0.49999237060546875, 0.515625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 7.0, 7.0, 9.0, 6.0, 6.0, 19.0, 13.0, 17.0, 38.0, 40.0, 36.0, 76.0, 132.0, 271.0, 518.0, 1153.0, 3458.0, 12606.0, 57930.0, 335802.0, 2011280.0, 1478882.0, 235335.0, 42140.0, 9633.0, 2873.0, 1002.0, 425.0, 203.0, 104.0, 76.0, 51.0, 29.0, 18.0, 16.0, 6.0, 11.0, 9.0, 6.0, 9.0, 5.0, 3.0, 6.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.552734375, -2.47271728515625, -2.3927001953125, -2.31268310546875, -2.232666015625, -2.15264892578125, -2.0726318359375, -1.99261474609375, -1.91259765625, -1.83258056640625, -1.7525634765625, -1.67254638671875, -1.592529296875, -1.51251220703125, -1.4324951171875, -1.35247802734375, -1.2724609375, -1.19244384765625, -1.1124267578125, -1.03240966796875, -0.952392578125, -0.87237548828125, -0.7923583984375, -0.71234130859375, -0.63232421875, -0.55230712890625, -0.4722900390625, -0.39227294921875, -0.312255859375, -0.23223876953125, -0.1522216796875, -0.07220458984375, 0.0078125, 0.08782958984375, 0.1678466796875, 0.24786376953125, 0.327880859375, 0.40789794921875, 0.4879150390625, 0.56793212890625, 0.64794921875, 0.72796630859375, 0.8079833984375, 0.88800048828125, 0.968017578125, 1.04803466796875, 1.1280517578125, 1.20806884765625, 1.2880859375, 1.36810302734375, 1.4481201171875, 1.52813720703125, 1.608154296875, 1.68817138671875, 1.7681884765625, 1.84820556640625, 1.92822265625, 2.00823974609375, 2.0882568359375, 2.16827392578125, 2.248291015625, 2.32830810546875, 2.4083251953125, 2.48834228515625, 2.568359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 11.0, 19.0, 42.0, 77.0, 148.0, 309.0, 617.0, 1021.0, 874.0, 489.0, 237.0, 127.0, 53.0, 28.0, 13.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.60546875, -4.5148773193359375, -4.424285888671875, -4.3336944580078125, -4.24310302734375, -4.1525115966796875, -4.061920166015625, -3.9713287353515625, -3.8807373046875, -3.7901458740234375, -3.699554443359375, -3.6089630126953125, -3.51837158203125, -3.4277801513671875, -3.337188720703125, -3.2465972900390625, -3.156005859375, -3.0654144287109375, -2.974822998046875, -2.8842315673828125, -2.79364013671875, -2.7030487060546875, -2.612457275390625, -2.5218658447265625, -2.4312744140625, -2.3406829833984375, -2.250091552734375, -2.1595001220703125, -2.06890869140625, -1.9783172607421875, -1.887725830078125, -1.7971343994140625, -1.70654296875, -1.6159515380859375, -1.525360107421875, -1.4347686767578125, -1.34417724609375, -1.2535858154296875, -1.162994384765625, -1.0724029541015625, -0.9818115234375, -0.8912200927734375, -0.800628662109375, -0.7100372314453125, -0.61944580078125, -0.5288543701171875, -0.438262939453125, -0.3476715087890625, -0.257080078125, -0.1664886474609375, -0.075897216796875, 0.0146942138671875, 0.10528564453125, 0.1958770751953125, 0.286468505859375, 0.3770599365234375, 0.4676513671875, 0.5582427978515625, 0.648834228515625, 0.7394256591796875, 0.83001708984375, 0.9206085205078125, 1.011199951171875, 1.1017913818359375, 1.1923828125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 12.0, 17.0, 23.0, 32.0, 64.0, 65.0, 85.0, 110.0, 112.0, 104.0, 86.0, 92.0, 76.0, 41.0, 29.0, 20.0, 15.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.186923027038574, -9.913362503051758, -9.639801025390625, -9.366240501403809, -9.092679023742676, -8.81911849975586, -8.545557022094727, -8.27199649810791, -7.9984354972839355, -7.724874496459961, -7.451313495635986, -7.177752494812012, -6.904191970825195, -6.6306304931640625, -6.357069969177246, -6.0835089683532715, -5.809947967529297, -5.536386966705322, -5.262825965881348, -4.989264965057373, -4.715703964233398, -4.442143440246582, -4.168582439422607, -3.895021438598633, -3.621460437774658, -3.3478994369506836, -3.074338436126709, -2.8007776737213135, -2.527216672897339, -2.2536556720733643, -1.9800947904586792, -1.7065339088439941, -1.4329719543457031, -1.1594109535217285, -0.8858500719070435, -0.6122891306877136, -0.3387281894683838, -0.06516718864440918, 0.20839369297027588, 0.48195457458496094, 0.7555155754089355, 1.0290765762329102, 1.3026374578475952, 1.5761983394622803, 1.8497593402862549, 2.1233203411102295, 2.396881103515625, 2.6704421043395996, 2.944003105163574, 3.217564105987549, 3.4911251068115234, 3.764685869216919, 4.038247108459473, 4.311807632446289, 4.585368633270264, 4.858929634094238, 5.132490634918213, 5.4060516357421875, 5.679612636566162, 5.953173637390137, 6.226734161376953, 6.500295639038086, 6.773856163024902, 7.047417163848877, 7.320978164672852]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 6.0, 6.0, 8.0, 11.0, 9.0, 13.0, 15.0, 16.0, 10.0, 18.0, 20.0, 15.0, 31.0, 24.0, 28.0, 33.0, 35.0, 30.0, 32.0, 32.0, 41.0, 38.0, 26.0, 38.0, 30.0, 37.0, 34.0, 30.0, 31.0, 28.0, 23.0, 33.0, 20.0, 20.0, 17.0, 21.0, 19.0, 18.0, 12.0, 14.0, 15.0, 12.0, 8.0, 9.0, 5.0, 6.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0], "bins": [-3.7600393295288086, -3.64656925201416, -3.5330991744995117, -3.4196293354034424, -3.306159257888794, -3.1926891803741455, -3.079219341278076, -2.9657492637634277, -2.8522791862487793, -2.738809108734131, -2.6253390312194824, -2.511869192123413, -2.3983991146087646, -2.284929037094116, -2.171459197998047, -2.0579891204833984, -1.94451904296875, -1.8310489654541016, -1.7175790071487427, -1.6041090488433838, -1.4906389713287354, -1.377168893814087, -1.263698935508728, -1.1502289772033691, -1.0367588996887207, -0.923288881778717, -0.8098188638687134, -0.6963488459587097, -0.582878828048706, -0.4694088101387024, -0.35593879222869873, -0.24246877431869507, -0.1289987564086914, -0.015528738498687744, 0.09794127941131592, 0.21141129732131958, 0.32488131523132324, 0.4383513331413269, 0.5518213510513306, 0.6652913689613342, 0.7787613868713379, 0.8922314047813416, 1.0057014226913452, 1.119171380996704, 1.2326414585113525, 1.346111536026001, 1.4595814943313599, 1.5730514526367188, 1.6865215301513672, 1.7999916076660156, 1.9134615659713745, 2.0269315242767334, 2.140401601791382, 2.2538716793060303, 2.3673415184020996, 2.480811595916748, 2.5942816734313965, 2.707751750946045, 2.8212218284606934, 2.9346916675567627, 3.048161745071411, 3.1616318225860596, 3.275101661682129, 3.3885717391967773, 3.502041816711426]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 9.0, 17.0, 25.0, 41.0, 93.0, 172.0, 225.0, 315.0, 539.0, 932.0, 1258.0, 1963.0, 3178.0, 4466.0, 6945.0, 9930.0, 15100.0, 22090.0, 33683.0, 54834.0, 104591.0, 204504.0, 244451.0, 144902.0, 71954.0, 41712.0, 26517.0, 17703.0, 12083.0, 8184.0, 5627.0, 3675.0, 2371.0, 1632.0, 1030.0, 677.0, 413.0, 258.0, 163.0, 94.0, 75.0, 35.0, 34.0, 14.0, 16.0, 5.0, 7.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.77978515625, -0.7531051635742188, -0.7264251708984375, -0.6997451782226562, -0.673065185546875, -0.6463851928710938, -0.6197052001953125, -0.5930252075195312, -0.56634521484375, -0.5396652221679688, -0.5129852294921875, -0.48630523681640625, -0.459625244140625, -0.43294525146484375, -0.4062652587890625, -0.37958526611328125, -0.3529052734375, -0.32622528076171875, -0.2995452880859375, -0.27286529541015625, -0.246185302734375, -0.21950531005859375, -0.1928253173828125, -0.16614532470703125, -0.13946533203125, -0.11278533935546875, -0.0861053466796875, -0.05942535400390625, -0.032745361328125, -0.00606536865234375, 0.0206146240234375, 0.04729461669921875, 0.073974609375, 0.10065460205078125, 0.1273345947265625, 0.15401458740234375, 0.180694580078125, 0.20737457275390625, 0.2340545654296875, 0.26073455810546875, 0.28741455078125, 0.31409454345703125, 0.3407745361328125, 0.36745452880859375, 0.394134521484375, 0.42081451416015625, 0.4474945068359375, 0.47417449951171875, 0.5008544921875, 0.5275344848632812, 0.5542144775390625, 0.5808944702148438, 0.607574462890625, 0.6342544555664062, 0.6609344482421875, 0.6876144409179688, 0.71429443359375, 0.7409744262695312, 0.7676544189453125, 0.7943344116210938, 0.821014404296875, 0.8476943969726562, 0.8743743896484375, 0.9010543823242188, 0.927734375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 7.0, 7.0, 1.0, 7.0, 10.0, 11.0, 11.0, 22.0, 22.0, 14.0, 20.0, 23.0, 23.0, 38.0, 22.0, 31.0, 40.0, 37.0, 47.0, 39.0, 45.0, 44.0, 42.0, 42.0, 41.0, 48.0, 37.0, 43.0, 33.0, 37.0, 27.0, 21.0, 13.0, 21.0, 17.0, 11.0, 9.0, 6.0, 10.0, 9.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65087890625, -0.6299591064453125, -0.609039306640625, -0.5881195068359375, -0.56719970703125, -0.5462799072265625, -0.525360107421875, -0.5044403076171875, -0.4835205078125, -0.4626007080078125, -0.441680908203125, -0.4207611083984375, -0.39984130859375, -0.3789215087890625, -0.358001708984375, -0.3370819091796875, -0.316162109375, -0.2952423095703125, -0.274322509765625, -0.2534027099609375, -0.23248291015625, -0.2115631103515625, -0.190643310546875, -0.1697235107421875, -0.1488037109375, -0.1278839111328125, -0.106964111328125, -0.0860443115234375, -0.06512451171875, -0.0442047119140625, -0.023284912109375, -0.0023651123046875, 0.0185546875, 0.0394744873046875, 0.060394287109375, 0.0813140869140625, 0.10223388671875, 0.1231536865234375, 0.144073486328125, 0.1649932861328125, 0.1859130859375, 0.2068328857421875, 0.227752685546875, 0.2486724853515625, 0.26959228515625, 0.2905120849609375, 0.311431884765625, 0.3323516845703125, 0.353271484375, 0.3741912841796875, 0.395111083984375, 0.4160308837890625, 0.43695068359375, 0.4578704833984375, 0.478790283203125, 0.4997100830078125, 0.5206298828125, 0.5415496826171875, 0.562469482421875, 0.5833892822265625, 0.60430908203125, 0.6252288818359375, 0.646148681640625, 0.6670684814453125, 0.68798828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 5.0, 6.0, 7.0, 15.0, 19.0, 25.0, 42.0, 54.0, 65.0, 91.0, 137.0, 303.0, 885.0, 2942.0, 10906.0, 37871.0, 152608.0, 654926.0, 137648.0, 35319.0, 10327.0, 2790.0, 806.0, 320.0, 134.0, 91.0, 46.0, 36.0, 37.0, 26.0, 17.0, 20.0, 11.0, 10.0, 7.0, 0.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.91015625, -2.81768798828125, -2.7252197265625, -2.63275146484375, -2.540283203125, -2.44781494140625, -2.3553466796875, -2.26287841796875, -2.17041015625, -2.07794189453125, -1.9854736328125, -1.89300537109375, -1.800537109375, -1.70806884765625, -1.6156005859375, -1.52313232421875, -1.4306640625, -1.33819580078125, -1.2457275390625, -1.15325927734375, -1.060791015625, -0.96832275390625, -0.8758544921875, -0.78338623046875, -0.69091796875, -0.59844970703125, -0.5059814453125, -0.41351318359375, -0.321044921875, -0.22857666015625, -0.1361083984375, -0.04364013671875, 0.048828125, 0.14129638671875, 0.2337646484375, 0.32623291015625, 0.418701171875, 0.51116943359375, 0.6036376953125, 0.69610595703125, 0.78857421875, 0.88104248046875, 0.9735107421875, 1.06597900390625, 1.158447265625, 1.25091552734375, 1.3433837890625, 1.43585205078125, 1.5283203125, 1.62078857421875, 1.7132568359375, 1.80572509765625, 1.898193359375, 1.99066162109375, 2.0831298828125, 2.17559814453125, 2.26806640625, 2.36053466796875, 2.4530029296875, 2.54547119140625, 2.637939453125, 2.73040771484375, 2.8228759765625, 2.91534423828125, 3.0078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 8.0, 5.0, 5.0, 13.0, 10.0, 20.0, 20.0, 13.0, 19.0, 28.0, 20.0, 30.0, 42.0, 39.0, 47.0, 42.0, 49.0, 46.0, 53.0, 42.0, 42.0, 43.0, 46.0, 44.0, 39.0, 30.0, 35.0, 20.0, 32.0, 26.0, 15.0, 15.0, 10.0, 11.0, 10.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-2.208984375, -2.141265869140625, -2.07354736328125, -2.005828857421875, -1.9381103515625, -1.870391845703125, -1.80267333984375, -1.734954833984375, -1.667236328125, -1.599517822265625, -1.53179931640625, -1.464080810546875, -1.3963623046875, -1.328643798828125, -1.26092529296875, -1.193206787109375, -1.12548828125, -1.057769775390625, -0.99005126953125, -0.922332763671875, -0.8546142578125, -0.786895751953125, -0.71917724609375, -0.651458740234375, -0.583740234375, -0.516021728515625, -0.44830322265625, -0.380584716796875, -0.3128662109375, -0.245147705078125, -0.17742919921875, -0.109710693359375, -0.0419921875, 0.025726318359375, 0.09344482421875, 0.161163330078125, 0.2288818359375, 0.296600341796875, 0.36431884765625, 0.432037353515625, 0.499755859375, 0.567474365234375, 0.63519287109375, 0.702911376953125, 0.7706298828125, 0.838348388671875, 0.90606689453125, 0.973785400390625, 1.04150390625, 1.109222412109375, 1.17694091796875, 1.244659423828125, 1.3123779296875, 1.380096435546875, 1.44781494140625, 1.515533447265625, 1.583251953125, 1.650970458984375, 1.71868896484375, 1.786407470703125, 1.8541259765625, 1.921844482421875, 1.98956298828125, 2.057281494140625, 2.125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 11.0, 14.0, 19.0, 20.0, 30.0, 49.0, 82.0, 110.0, 153.0, 268.0, 398.0, 634.0, 1041.0, 1541.0, 2443.0, 3834.0, 6241.0, 10384.0, 17071.0, 30376.0, 71137.0, 278728.0, 415421.0, 114613.0, 40074.0, 21028.0, 12538.0, 7695.0, 4676.0, 2836.0, 1818.0, 1130.0, 713.0, 502.0, 304.0, 186.0, 145.0, 105.0, 62.0, 36.0, 32.0, 17.0, 19.0, 9.0, 8.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.83837890625, -0.8115005493164062, -0.7846221923828125, -0.7577438354492188, -0.730865478515625, -0.7039871215820312, -0.6771087646484375, -0.6502304077148438, -0.62335205078125, -0.5964736938476562, -0.5695953369140625, -0.5427169799804688, -0.515838623046875, -0.48896026611328125, -0.4620819091796875, -0.43520355224609375, -0.4083251953125, -0.38144683837890625, -0.3545684814453125, -0.32769012451171875, -0.300811767578125, -0.27393341064453125, -0.2470550537109375, -0.22017669677734375, -0.19329833984375, -0.16641998291015625, -0.1395416259765625, -0.11266326904296875, -0.085784912109375, -0.05890655517578125, -0.0320281982421875, -0.00514984130859375, 0.021728515625, 0.04860687255859375, 0.0754852294921875, 0.10236358642578125, 0.129241943359375, 0.15612030029296875, 0.1829986572265625, 0.20987701416015625, 0.23675537109375, 0.26363372802734375, 0.2905120849609375, 0.31739044189453125, 0.344268798828125, 0.37114715576171875, 0.3980255126953125, 0.42490386962890625, 0.4517822265625, 0.47866058349609375, 0.5055389404296875, 0.5324172973632812, 0.559295654296875, 0.5861740112304688, 0.6130523681640625, 0.6399307250976562, 0.66680908203125, 0.6936874389648438, 0.7205657958984375, 0.7474441528320312, 0.774322509765625, 0.8012008666992188, 0.8280792236328125, 0.8549575805664062, 0.8818359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 9.0, 6.0, 14.0, 8.0, 11.0, 20.0, 20.0, 38.0, 38.0, 48.0, 109.0, 169.0, 203.0, 120.0, 48.0, 29.0, 15.0, 16.0, 16.0, 12.0, 4.0, 1.0, 6.0, 1.0, 7.0, 3.0, 1.0, 3.0, 3.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0002658367156982422, -0.0002586543560028076, -0.00025147199630737305, -0.0002442896366119385, -0.0002371072769165039, -0.00022992491722106934, -0.00022274255752563477, -0.0002155601978302002, -0.00020837783813476562, -0.00020119547843933105, -0.00019401311874389648, -0.00018683075904846191, -0.00017964839935302734, -0.00017246603965759277, -0.0001652836799621582, -0.00015810132026672363, -0.00015091896057128906, -0.0001437366008758545, -0.00013655424118041992, -0.00012937188148498535, -0.00012218952178955078, -0.00011500716209411621, -0.00010782480239868164, -0.00010064244270324707, -9.34600830078125e-05, -8.627772331237793e-05, -7.909536361694336e-05, -7.191300392150879e-05, -6.473064422607422e-05, -5.754828453063965e-05, -5.036592483520508e-05, -4.318356513977051e-05, -3.600120544433594e-05, -2.8818845748901367e-05, -2.1636486053466797e-05, -1.4454126358032227e-05, -7.271766662597656e-06, -8.940696716308594e-08, 7.092952728271484e-06, 1.4275312423706055e-05, 2.1457672119140625e-05, 2.8640031814575195e-05, 3.5822391510009766e-05, 4.3004751205444336e-05, 5.0187110900878906e-05, 5.7369470596313477e-05, 6.455183029174805e-05, 7.173418998718262e-05, 7.891654968261719e-05, 8.609890937805176e-05, 9.328126907348633e-05, 0.0001004636287689209, 0.00010764598846435547, 0.00011482834815979004, 0.00012201070785522461, 0.00012919306755065918, 0.00013637542724609375, 0.00014355778694152832, 0.0001507401466369629, 0.00015792250633239746, 0.00016510486602783203, 0.0001722872257232666, 0.00017946958541870117, 0.00018665194511413574, 0.0001938343048095703]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 7.0, 1.0, 5.0, 8.0, 16.0, 11.0, 30.0, 37.0, 73.0, 100.0, 233.0, 462.0, 1058.0, 2472.0, 6463.0, 17323.0, 49254.0, 280547.0, 567938.0, 81621.0, 25237.0, 9312.0, 3598.0, 1465.0, 600.0, 309.0, 161.0, 76.0, 60.0, 32.0, 11.0, 8.0, 10.0, 4.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5673828125, -1.5201568603515625, -1.472930908203125, -1.4257049560546875, -1.37847900390625, -1.3312530517578125, -1.284027099609375, -1.2368011474609375, -1.1895751953125, -1.1423492431640625, -1.095123291015625, -1.0478973388671875, -1.00067138671875, -0.9534454345703125, -0.906219482421875, -0.8589935302734375, -0.811767578125, -0.7645416259765625, -0.717315673828125, -0.6700897216796875, -0.62286376953125, -0.5756378173828125, -0.528411865234375, -0.4811859130859375, -0.4339599609375, -0.3867340087890625, -0.339508056640625, -0.2922821044921875, -0.24505615234375, -0.1978302001953125, -0.150604248046875, -0.1033782958984375, -0.05615234375, -0.0089263916015625, 0.038299560546875, 0.0855255126953125, 0.13275146484375, 0.1799774169921875, 0.227203369140625, 0.2744293212890625, 0.3216552734375, 0.3688812255859375, 0.416107177734375, 0.4633331298828125, 0.51055908203125, 0.5577850341796875, 0.605010986328125, 0.6522369384765625, 0.699462890625, 0.7466888427734375, 0.793914794921875, 0.8411407470703125, 0.88836669921875, 0.9355926513671875, 0.982818603515625, 1.0300445556640625, 1.0772705078125, 1.1244964599609375, 1.171722412109375, 1.2189483642578125, 1.26617431640625, 1.3134002685546875, 1.360626220703125, 1.4078521728515625, 1.455078125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 4.0, 8.0, 14.0, 7.0, 19.0, 28.0, 25.0, 72.0, 141.0, 230.0, 214.0, 95.0, 52.0, 18.0, 19.0, 10.0, 12.0, 6.0, 6.0, 8.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.134765625, -2.0860824584960938, -2.0373992919921875, -1.9887161254882812, -1.940032958984375, -1.8913497924804688, -1.8426666259765625, -1.7939834594726562, -1.74530029296875, -1.6966171264648438, -1.6479339599609375, -1.5992507934570312, -1.550567626953125, -1.5018844604492188, -1.4532012939453125, -1.4045181274414062, -1.3558349609375, -1.3071517944335938, -1.2584686279296875, -1.2097854614257812, -1.161102294921875, -1.1124191284179688, -1.0637359619140625, -1.0150527954101562, -0.96636962890625, -0.9176864624023438, -0.8690032958984375, -0.8203201293945312, -0.771636962890625, -0.7229537963867188, -0.6742706298828125, -0.6255874633789062, -0.576904296875, -0.5282211303710938, -0.4795379638671875, -0.43085479736328125, -0.382171630859375, -0.33348846435546875, -0.2848052978515625, -0.23612213134765625, -0.18743896484375, -0.13875579833984375, -0.0900726318359375, -0.04138946533203125, 0.007293701171875, 0.05597686767578125, 0.1046600341796875, 0.15334320068359375, 0.2020263671875, 0.25070953369140625, 0.2993927001953125, 0.34807586669921875, 0.396759033203125, 0.44544219970703125, 0.4941253662109375, 0.5428085327148438, 0.59149169921875, 0.6401748657226562, 0.6888580322265625, 0.7375411987304688, 0.786224365234375, 0.8349075317382812, 0.8835906982421875, 0.9322738647460938, 0.98095703125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 11.0, 14.0, 27.0, 35.0, 48.0, 64.0, 86.0, 101.0, 121.0, 110.0, 106.0, 80.0, 70.0, 51.0, 37.0, 10.0, 9.0, 9.0, 7.0, 3.0, 0.0, 0.0, 1.0], "bins": [-15.339574813842773, -15.03327751159668, -14.726980209350586, -14.420681953430176, -14.114384651184082, -13.808087348937988, -13.501790046691895, -13.1954927444458, -12.88919448852539, -12.582897186279297, -12.276599884033203, -11.970301628112793, -11.6640043258667, -11.357707023620605, -11.051409721374512, -10.745112419128418, -10.438815116882324, -10.13251781463623, -9.826220512390137, -9.519922256469727, -9.213624954223633, -8.907327651977539, -8.601030349731445, -8.294733047485352, -7.9884352684021, -7.682137966156006, -7.375840187072754, -7.06954288482666, -6.763245582580566, -6.4569478034973145, -6.150650501251221, -5.844352722167969, -5.538055419921875, -5.231758117675781, -4.925460338592529, -4.6191630363464355, -4.312865257263184, -4.00656795501709, -3.700270652770996, -3.3939731121063232, -3.0876755714416504, -2.7813780307769775, -2.4750804901123047, -2.168783187866211, -1.862485647201538, -1.5561881065368652, -1.249890685081482, -0.9435932636260986, -0.6372957229614258, -0.3309982419013977, -0.02470076084136963, 0.28159672021865845, 0.5878942012786865, 0.8941917419433594, 1.2004891633987427, 1.506786584854126, 1.8130841255187988, 2.1193816661834717, 2.4256792068481445, 2.7319765090942383, 3.038274049758911, 3.344571590423584, 3.6508688926696777, 3.9571664333343506, 4.263463973999023]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 3.0, 10.0, 5.0, 11.0, 11.0, 11.0, 17.0, 15.0, 19.0, 26.0, 27.0, 29.0, 39.0, 38.0, 42.0, 36.0, 49.0, 45.0, 41.0, 48.0, 50.0, 47.0, 37.0, 52.0, 33.0, 27.0, 35.0, 32.0, 31.0, 29.0, 21.0, 16.0, 19.0, 15.0, 10.0, 5.0, 6.0, 5.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.193408489227295, -6.000701427459717, -5.8079938888549805, -5.615286827087402, -5.422579765319824, -5.229872226715088, -5.03716516494751, -4.844457626342773, -4.651750564575195, -4.459043502807617, -4.266335964202881, -4.073628902435303, -3.8809216022491455, -3.6882143020629883, -3.49550724029541, -3.302799940109253, -3.1100926399230957, -2.9173853397369385, -2.7246780395507812, -2.531970977783203, -2.339263677597046, -2.1465563774108887, -1.953849196434021, -1.7611420154571533, -1.568434715270996, -1.3757274150848389, -1.1830202341079712, -0.9903129935264587, -0.7976057529449463, -0.6048985123634338, -0.4121912717819214, -0.2194840908050537, -0.02677631378173828, 0.16593092679977417, 0.3586381673812866, 0.5513454079627991, 0.7440526485443115, 0.936759889125824, 1.1294671297073364, 1.322174310684204, 1.5148816108703613, 1.7075889110565186, 1.9002960920333862, 2.093003273010254, 2.285710573196411, 2.4784178733825684, 2.6711249351501465, 2.8638322353363037, 3.056539535522461, 3.249246835708618, 3.4419541358947754, 3.6346611976623535, 3.8273684978485107, 4.020075798034668, 4.212782859802246, 4.405489921569824, 4.5981974601745605, 4.790904521942139, 4.983612060546875, 5.176319122314453, 5.369026184082031, 5.561733722686768, 5.754440784454346, 5.947148323059082, 6.13985538482666]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 12.0, 21.0, 25.0, 58.0, 57.0, 128.0, 187.0, 315.0, 445.0, 848.0, 1421.0, 2503.0, 4724.0, 8800.0, 17299.0, 35382.0, 75552.0, 169680.0, 415948.0, 1358047.0, 1367933.0, 417099.0, 169814.0, 75928.0, 35556.0, 17182.0, 8816.0, 4622.0, 2533.0, 1359.0, 792.0, 467.0, 274.0, 172.0, 106.0, 63.0, 36.0, 22.0, 15.0, 10.0, 8.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0556640625, -1.0255050659179688, -0.9953460693359375, -0.9651870727539062, -0.935028076171875, -0.9048690795898438, -0.8747100830078125, -0.8445510864257812, -0.81439208984375, -0.7842330932617188, -0.7540740966796875, -0.7239151000976562, -0.693756103515625, -0.6635971069335938, -0.6334381103515625, -0.6032791137695312, -0.5731201171875, -0.5429611206054688, -0.5128021240234375, -0.48264312744140625, -0.452484130859375, -0.42232513427734375, -0.3921661376953125, -0.36200714111328125, -0.33184814453125, -0.30168914794921875, -0.2715301513671875, -0.24137115478515625, -0.211212158203125, -0.18105316162109375, -0.1508941650390625, -0.12073516845703125, -0.090576171875, -0.06041717529296875, -0.0302581787109375, -9.918212890625e-05, 0.030059814453125, 0.06021881103515625, 0.0903778076171875, 0.12053680419921875, 0.15069580078125, 0.18085479736328125, 0.2110137939453125, 0.24117279052734375, 0.271331787109375, 0.30149078369140625, 0.3316497802734375, 0.36180877685546875, 0.3919677734375, 0.42212677001953125, 0.4522857666015625, 0.48244476318359375, 0.512603759765625, 0.5427627563476562, 0.5729217529296875, 0.6030807495117188, 0.63323974609375, 0.6633987426757812, 0.6935577392578125, 0.7237167358398438, 0.753875732421875, 0.7840347290039062, 0.8141937255859375, 0.8443527221679688, 0.87451171875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 2.0, 8.0, 2.0, 7.0, 5.0, 8.0, 20.0, 14.0, 10.0, 26.0, 16.0, 30.0, 22.0, 26.0, 30.0, 39.0, 33.0, 27.0, 27.0, 33.0, 43.0, 39.0, 35.0, 47.0, 43.0, 30.0, 33.0, 40.0, 27.0, 29.0, 37.0, 27.0, 26.0, 23.0, 20.0, 16.0, 14.0, 12.0, 13.0, 13.0, 9.0, 7.0, 5.0, 3.0, 3.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.65673828125, -0.6363906860351562, -0.6160430908203125, -0.5956954956054688, -0.575347900390625, -0.5550003051757812, -0.5346527099609375, -0.5143051147460938, -0.49395751953125, -0.47360992431640625, -0.4532623291015625, -0.43291473388671875, -0.412567138671875, -0.39221954345703125, -0.3718719482421875, -0.35152435302734375, -0.3311767578125, -0.31082916259765625, -0.2904815673828125, -0.27013397216796875, -0.249786376953125, -0.22943878173828125, -0.2090911865234375, -0.18874359130859375, -0.16839599609375, -0.14804840087890625, -0.1277008056640625, -0.10735321044921875, -0.087005615234375, -0.06665802001953125, -0.0463104248046875, -0.02596282958984375, -0.005615234375, 0.01473236083984375, 0.0350799560546875, 0.05542755126953125, 0.075775146484375, 0.09612274169921875, 0.1164703369140625, 0.13681793212890625, 0.15716552734375, 0.17751312255859375, 0.1978607177734375, 0.21820831298828125, 0.238555908203125, 0.25890350341796875, 0.2792510986328125, 0.29959869384765625, 0.3199462890625, 0.34029388427734375, 0.3606414794921875, 0.38098907470703125, 0.401336669921875, 0.42168426513671875, 0.4420318603515625, 0.46237945556640625, 0.48272705078125, 0.5030746459960938, 0.5234222412109375, 0.5437698364257812, 0.564117431640625, 0.5844650268554688, 0.6048126220703125, 0.6251602172851562, 0.6455078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 5.0, 7.0, 8.0, 7.0, 10.0, 14.0, 18.0, 26.0, 39.0, 44.0, 59.0, 73.0, 153.0, 191.0, 246.0, 413.0, 683.0, 1071.0, 2018.0, 3747.0, 7385.0, 16870.0, 41267.0, 112131.0, 326853.0, 1091261.0, 1768995.0, 535349.0, 176028.0, 63126.0, 24667.0, 10275.0, 4939.0, 2583.0, 1443.0, 783.0, 467.0, 350.0, 205.0, 132.0, 87.0, 78.0, 55.0, 43.0, 29.0, 12.0, 13.0, 12.0, 10.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-1.990234375, -1.9337158203125, -1.877197265625, -1.8206787109375, -1.76416015625, -1.7076416015625, -1.651123046875, -1.5946044921875, -1.5380859375, -1.4815673828125, -1.425048828125, -1.3685302734375, -1.31201171875, -1.2554931640625, -1.198974609375, -1.1424560546875, -1.0859375, -1.0294189453125, -0.972900390625, -0.9163818359375, -0.85986328125, -0.8033447265625, -0.746826171875, -0.6903076171875, -0.6337890625, -0.5772705078125, -0.520751953125, -0.4642333984375, -0.40771484375, -0.3511962890625, -0.294677734375, -0.2381591796875, -0.181640625, -0.1251220703125, -0.068603515625, -0.0120849609375, 0.04443359375, 0.1009521484375, 0.157470703125, 0.2139892578125, 0.2705078125, 0.3270263671875, 0.383544921875, 0.4400634765625, 0.49658203125, 0.5531005859375, 0.609619140625, 0.6661376953125, 0.72265625, 0.7791748046875, 0.835693359375, 0.8922119140625, 0.94873046875, 1.0052490234375, 1.061767578125, 1.1182861328125, 1.1748046875, 1.2313232421875, 1.287841796875, 1.3443603515625, 1.40087890625, 1.4573974609375, 1.513916015625, 1.5704345703125, 1.626953125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 8.0, 15.0, 19.0, 23.0, 36.0, 50.0, 87.0, 130.0, 220.0, 334.0, 459.0, 818.0, 579.0, 423.0, 282.0, 179.0, 131.0, 91.0, 65.0, 45.0, 16.0, 23.0, 11.0, 9.0, 8.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.443359375, -2.381988525390625, -2.32061767578125, -2.259246826171875, -2.1978759765625, -2.136505126953125, -2.07513427734375, -2.013763427734375, -1.952392578125, -1.891021728515625, -1.82965087890625, -1.768280029296875, -1.7069091796875, -1.645538330078125, -1.58416748046875, -1.522796630859375, -1.46142578125, -1.400054931640625, -1.33868408203125, -1.277313232421875, -1.2159423828125, -1.154571533203125, -1.09320068359375, -1.031829833984375, -0.970458984375, -0.909088134765625, -0.84771728515625, -0.786346435546875, -0.7249755859375, -0.663604736328125, -0.60223388671875, -0.540863037109375, -0.4794921875, -0.418121337890625, -0.35675048828125, -0.295379638671875, -0.2340087890625, -0.172637939453125, -0.11126708984375, -0.049896240234375, 0.011474609375, 0.072845458984375, 0.13421630859375, 0.195587158203125, 0.2569580078125, 0.318328857421875, 0.37969970703125, 0.441070556640625, 0.50244140625, 0.563812255859375, 0.62518310546875, 0.686553955078125, 0.7479248046875, 0.809295654296875, 0.87066650390625, 0.932037353515625, 0.993408203125, 1.054779052734375, 1.11614990234375, 1.177520751953125, 1.2388916015625, 1.300262451171875, 1.36163330078125, 1.423004150390625, 1.484375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 1.0, 9.0, 13.0, 25.0, 28.0, 64.0, 73.0, 94.0, 111.0, 121.0, 124.0, 97.0, 91.0, 59.0, 40.0, 26.0, 13.0, 8.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.29092788696289, -9.970525741577148, -9.65012264251709, -9.329720497131348, -9.009317398071289, -8.688915252685547, -8.368513107299805, -8.048110961914062, -7.727707862854004, -7.4073052406311035, -7.086902618408203, -6.766500473022461, -6.4460978507995605, -6.12569522857666, -5.805293083190918, -5.484890460968018, -5.164487838745117, -4.844085216522217, -4.523682594299316, -4.203280448913574, -3.882877826690674, -3.5624752044677734, -3.242072820663452, -2.921670436859131, -2.6012678146362305, -2.28086519241333, -1.9604628086090088, -1.640060305595398, -1.319657802581787, -0.9992552995681763, -0.6788527965545654, -0.35845041275024414, -0.03804779052734375, 0.2823547124862671, 0.6027572154998779, 0.9231597185134888, 1.2435622215270996, 1.5639647245407104, 1.8843672275543213, 2.2047696113586426, 2.525172233581543, 2.8455748558044434, 3.1659772396087646, 3.486379623413086, 3.8067822456359863, 4.127184867858887, 4.447587013244629, 4.767989635467529, 5.08839225769043, 5.40879487991333, 5.7291975021362305, 6.049599647521973, 6.370002269744873, 6.690404891967773, 7.010807037353516, 7.331209659576416, 7.651612281799316, 7.972014904022217, 8.292417526245117, 8.61281967163086, 8.933221817016602, 9.25362491607666, 9.574027061462402, 9.894430160522461, 10.214832305908203]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 6.0, 5.0, 8.0, 7.0, 7.0, 12.0, 7.0, 9.0, 15.0, 16.0, 21.0, 16.0, 23.0, 23.0, 26.0, 28.0, 51.0, 42.0, 44.0, 45.0, 51.0, 52.0, 43.0, 53.0, 42.0, 44.0, 40.0, 39.0, 32.0, 23.0, 27.0, 20.0, 24.0, 25.0, 15.0, 12.0, 8.0, 10.0, 16.0, 5.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.292178630828857, -4.137743949890137, -3.983309507369995, -3.8288750648498535, -3.674440383911133, -3.520005702972412, -3.3655712604522705, -3.211136817932129, -3.056702136993408, -2.9022674560546875, -2.747833013534546, -2.5933985710144043, -2.4389638900756836, -2.284529209136963, -2.1300947666168213, -1.9756602048873901, -1.821225643157959, -1.6667910814285278, -1.5123565196990967, -1.3579219579696655, -1.2034873962402344, -1.0490528345108032, -0.8946182727813721, -0.7401837110519409, -0.5857491493225098, -0.4313145875930786, -0.27688002586364746, -0.12244546413421631, 0.031989097595214844, 0.186423659324646, 0.34085822105407715, 0.4952927827835083, 0.6497268676757812, 0.8041614294052124, 0.9585959911346436, 1.1130305528640747, 1.2674651145935059, 1.421899676322937, 1.5763342380523682, 1.7307687997817993, 1.8852033615112305, 2.039638042449951, 2.1940724849700928, 2.3485069274902344, 2.502941608428955, 2.657376289367676, 2.8118107318878174, 2.966245174407959, 3.1206798553466797, 3.2751145362854004, 3.429548978805542, 3.5839834213256836, 3.7384181022644043, 3.892852783203125, 4.0472869873046875, 4.201721668243408, 4.356156349182129, 4.51059103012085, 4.66502571105957, 4.819459915161133, 4.9738945960998535, 5.128329277038574, 5.282763481140137, 5.437198162078857, 5.591632843017578]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 10.0, 22.0, 25.0, 41.0, 42.0, 91.0, 108.0, 161.0, 278.0, 421.0, 603.0, 925.0, 1380.0, 2052.0, 3116.0, 4553.0, 6706.0, 9634.0, 14229.0, 20497.0, 30659.0, 46910.0, 76860.0, 131971.0, 193484.0, 183441.0, 119287.0, 70025.0, 42825.0, 28037.0, 19263.0, 13130.0, 9241.0, 6018.0, 4143.0, 2766.0, 1844.0, 1256.0, 771.0, 576.0, 398.0, 236.0, 170.0, 120.0, 73.0, 46.0, 40.0, 22.0, 14.0, 12.0, 14.0, 5.0, 4.0, 1.0, 2.0], "bins": [-0.77978515625, -0.7567825317382812, -0.7337799072265625, -0.7107772827148438, -0.687774658203125, -0.6647720336914062, -0.6417694091796875, -0.6187667846679688, -0.59576416015625, -0.5727615356445312, -0.5497589111328125, -0.5267562866210938, -0.503753662109375, -0.48075103759765625, -0.4577484130859375, -0.43474578857421875, -0.4117431640625, -0.38874053955078125, -0.3657379150390625, -0.34273529052734375, -0.319732666015625, -0.29673004150390625, -0.2737274169921875, -0.25072479248046875, -0.22772216796875, -0.20471954345703125, -0.1817169189453125, -0.15871429443359375, -0.135711669921875, -0.11270904541015625, -0.0897064208984375, -0.06670379638671875, -0.043701171875, -0.02069854736328125, 0.0023040771484375, 0.02530670166015625, 0.048309326171875, 0.07131195068359375, 0.0943145751953125, 0.11731719970703125, 0.14031982421875, 0.16332244873046875, 0.1863250732421875, 0.20932769775390625, 0.232330322265625, 0.25533294677734375, 0.2783355712890625, 0.30133819580078125, 0.3243408203125, 0.34734344482421875, 0.3703460693359375, 0.39334869384765625, 0.416351318359375, 0.43935394287109375, 0.4623565673828125, 0.48535919189453125, 0.50836181640625, 0.5313644409179688, 0.5543670654296875, 0.5773696899414062, 0.600372314453125, 0.6233749389648438, 0.6463775634765625, 0.6693801879882812, 0.6923828125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 11.0, 10.0, 6.0, 14.0, 22.0, 20.0, 16.0, 19.0, 12.0, 25.0, 44.0, 40.0, 36.0, 38.0, 42.0, 41.0, 43.0, 39.0, 43.0, 50.0, 41.0, 43.0, 54.0, 32.0, 35.0, 32.0, 34.0, 23.0, 24.0, 20.0, 19.0, 12.0, 10.0, 8.0, 6.0, 2.0, 4.0, 5.0, 5.0, 5.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.81689453125, -0.791290283203125, -0.76568603515625, -0.740081787109375, -0.7144775390625, -0.688873291015625, -0.66326904296875, -0.637664794921875, -0.612060546875, -0.586456298828125, -0.56085205078125, -0.535247802734375, -0.5096435546875, -0.484039306640625, -0.45843505859375, -0.432830810546875, -0.4072265625, -0.381622314453125, -0.35601806640625, -0.330413818359375, -0.3048095703125, -0.279205322265625, -0.25360107421875, -0.227996826171875, -0.202392578125, -0.176788330078125, -0.15118408203125, -0.125579833984375, -0.0999755859375, -0.074371337890625, -0.04876708984375, -0.023162841796875, 0.00244140625, 0.028045654296875, 0.05364990234375, 0.079254150390625, 0.1048583984375, 0.130462646484375, 0.15606689453125, 0.181671142578125, 0.207275390625, 0.232879638671875, 0.25848388671875, 0.284088134765625, 0.3096923828125, 0.335296630859375, 0.36090087890625, 0.386505126953125, 0.412109375, 0.437713623046875, 0.46331787109375, 0.488922119140625, 0.5145263671875, 0.540130615234375, 0.56573486328125, 0.591339111328125, 0.616943359375, 0.642547607421875, 0.66815185546875, 0.693756103515625, 0.7193603515625, 0.744964599609375, 0.77056884765625, 0.796173095703125, 0.82177734375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 5.0, 6.0, 7.0, 7.0, 9.0, 14.0, 11.0, 19.0, 26.0, 29.0, 33.0, 48.0, 87.0, 112.0, 253.0, 591.0, 1600.0, 6270.0, 30941.0, 178839.0, 660040.0, 137297.0, 24814.0, 5141.0, 1351.0, 461.0, 194.0, 102.0, 76.0, 47.0, 38.0, 15.0, 12.0, 18.0, 14.0, 8.0, 11.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.96875, -2.86053466796875, -2.7523193359375, -2.64410400390625, -2.535888671875, -2.42767333984375, -2.3194580078125, -2.21124267578125, -2.10302734375, -1.99481201171875, -1.8865966796875, -1.77838134765625, -1.670166015625, -1.56195068359375, -1.4537353515625, -1.34552001953125, -1.2373046875, -1.12908935546875, -1.0208740234375, -0.91265869140625, -0.804443359375, -0.69622802734375, -0.5880126953125, -0.47979736328125, -0.37158203125, -0.26336669921875, -0.1551513671875, -0.04693603515625, 0.061279296875, 0.16949462890625, 0.2777099609375, 0.38592529296875, 0.494140625, 0.60235595703125, 0.7105712890625, 0.81878662109375, 0.927001953125, 1.03521728515625, 1.1434326171875, 1.25164794921875, 1.35986328125, 1.46807861328125, 1.5762939453125, 1.68450927734375, 1.792724609375, 1.90093994140625, 2.0091552734375, 2.11737060546875, 2.2255859375, 2.33380126953125, 2.4420166015625, 2.55023193359375, 2.658447265625, 2.76666259765625, 2.8748779296875, 2.98309326171875, 3.09130859375, 3.19952392578125, 3.3077392578125, 3.41595458984375, 3.524169921875, 3.63238525390625, 3.7406005859375, 3.84881591796875, 3.95703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 3.0, 3.0, 11.0, 8.0, 15.0, 13.0, 19.0, 16.0, 22.0, 31.0, 26.0, 43.0, 34.0, 40.0, 36.0, 56.0, 57.0, 43.0, 52.0, 63.0, 39.0, 47.0, 40.0, 34.0, 35.0, 32.0, 24.0, 24.0, 26.0, 23.0, 13.0, 12.0, 15.0, 13.0, 5.0, 7.0, 7.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.560546875, -2.468292236328125, -2.37603759765625, -2.283782958984375, -2.1915283203125, -2.099273681640625, -2.00701904296875, -1.914764404296875, -1.822509765625, -1.730255126953125, -1.63800048828125, -1.545745849609375, -1.4534912109375, -1.361236572265625, -1.26898193359375, -1.176727294921875, -1.08447265625, -0.992218017578125, -0.89996337890625, -0.807708740234375, -0.7154541015625, -0.623199462890625, -0.53094482421875, -0.438690185546875, -0.346435546875, -0.254180908203125, -0.16192626953125, -0.069671630859375, 0.0225830078125, 0.114837646484375, 0.20709228515625, 0.299346923828125, 0.3916015625, 0.483856201171875, 0.57611083984375, 0.668365478515625, 0.7606201171875, 0.852874755859375, 0.94512939453125, 1.037384033203125, 1.129638671875, 1.221893310546875, 1.31414794921875, 1.406402587890625, 1.4986572265625, 1.590911865234375, 1.68316650390625, 1.775421142578125, 1.86767578125, 1.959930419921875, 2.05218505859375, 2.144439697265625, 2.2366943359375, 2.328948974609375, 2.42120361328125, 2.513458251953125, 2.605712890625, 2.697967529296875, 2.79022216796875, 2.882476806640625, 2.9747314453125, 3.066986083984375, 3.15924072265625, 3.251495361328125, 3.34375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 5.0, 6.0, 8.0, 20.0, 23.0, 32.0, 39.0, 49.0, 67.0, 107.0, 209.0, 253.0, 433.0, 652.0, 1127.0, 2079.0, 3938.0, 8123.0, 16665.0, 35404.0, 78711.0, 252811.0, 410784.0, 135512.0, 52590.0, 24590.0, 11732.0, 5791.0, 2924.0, 1533.0, 826.0, 519.0, 315.0, 224.0, 141.0, 98.0, 60.0, 49.0, 36.0, 29.0, 17.0, 14.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.98828125, -0.9602508544921875, -0.932220458984375, -0.9041900634765625, -0.87615966796875, -0.8481292724609375, -0.820098876953125, -0.7920684814453125, -0.7640380859375, -0.7360076904296875, -0.707977294921875, -0.6799468994140625, -0.65191650390625, -0.6238861083984375, -0.595855712890625, -0.5678253173828125, -0.539794921875, -0.5117645263671875, -0.483734130859375, -0.4557037353515625, -0.42767333984375, -0.3996429443359375, -0.371612548828125, -0.3435821533203125, -0.3155517578125, -0.2875213623046875, -0.259490966796875, -0.2314605712890625, -0.20343017578125, -0.1753997802734375, -0.147369384765625, -0.1193389892578125, -0.09130859375, -0.0632781982421875, -0.035247802734375, -0.0072174072265625, 0.02081298828125, 0.0488433837890625, 0.076873779296875, 0.1049041748046875, 0.1329345703125, 0.1609649658203125, 0.188995361328125, 0.2170257568359375, 0.24505615234375, 0.2730865478515625, 0.301116943359375, 0.3291473388671875, 0.357177734375, 0.3852081298828125, 0.413238525390625, 0.4412689208984375, 0.46929931640625, 0.4973297119140625, 0.525360107421875, 0.5533905029296875, 0.5814208984375, 0.6094512939453125, 0.637481689453125, 0.6655120849609375, 0.69354248046875, 0.7215728759765625, 0.749603271484375, 0.7776336669921875, 0.8056640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 6.0, 4.0, 5.0, 8.0, 11.0, 10.0, 5.0, 15.0, 21.0, 17.0, 32.0, 49.0, 71.0, 89.0, 118.0, 153.0, 103.0, 70.0, 52.0, 25.0, 19.0, 19.0, 13.0, 12.0, 11.0, 9.0, 9.0, 7.0, 9.0, 4.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014543533325195312, -0.00013988465070724487, -0.00013433396816253662, -0.00012878328561782837, -0.00012323260307312012, -0.00011768192052841187, -0.00011213123798370361, -0.00010658055543899536, -0.00010102987289428711, -9.547919034957886e-05, -8.99285078048706e-05, -8.437782526016235e-05, -7.88271427154541e-05, -7.327646017074585e-05, -6.77257776260376e-05, -6.217509508132935e-05, -5.6624412536621094e-05, -5.107372999191284e-05, -4.552304744720459e-05, -3.997236490249634e-05, -3.4421682357788086e-05, -2.8870999813079834e-05, -2.3320317268371582e-05, -1.776963472366333e-05, -1.2218952178955078e-05, -6.668269634246826e-06, -1.1175870895385742e-06, 4.433095455169678e-06, 9.98377799987793e-06, 1.553446054458618e-05, 2.1085143089294434e-05, 2.6635825634002686e-05, 3.218650817871094e-05, 3.773719072341919e-05, 4.328787326812744e-05, 4.883855581283569e-05, 5.4389238357543945e-05, 5.99399209022522e-05, 6.549060344696045e-05, 7.10412859916687e-05, 7.659196853637695e-05, 8.21426510810852e-05, 8.769333362579346e-05, 9.324401617050171e-05, 9.879469871520996e-05, 0.00010434538125991821, 0.00010989606380462646, 0.00011544674634933472, 0.00012099742889404297, 0.00012654811143875122, 0.00013209879398345947, 0.00013764947652816772, 0.00014320015907287598, 0.00014875084161758423, 0.00015430152416229248, 0.00015985220670700073, 0.00016540288925170898, 0.00017095357179641724, 0.0001765042543411255, 0.00018205493688583374, 0.000187605619430542, 0.00019315630197525024, 0.0001987069845199585, 0.00020425766706466675, 0.000209808349609375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 7.0, 14.0, 10.0, 25.0, 35.0, 42.0, 79.0, 96.0, 183.0, 355.0, 937.0, 3236.0, 14349.0, 73658.0, 562948.0, 332170.0, 46983.0, 9635.0, 2309.0, 769.0, 281.0, 157.0, 103.0, 60.0, 44.0, 26.0, 17.0, 9.0, 11.0, 9.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1640625, -1.10546875, -1.046875, -0.98828125, -0.9296875, -0.87109375, -0.8125, -0.75390625, -0.6953125, -0.63671875, -0.578125, -0.51953125, -0.4609375, -0.40234375, -0.34375, -0.28515625, -0.2265625, -0.16796875, -0.109375, -0.05078125, 0.0078125, 0.06640625, 0.125, 0.18359375, 0.2421875, 0.30078125, 0.359375, 0.41796875, 0.4765625, 0.53515625, 0.59375, 0.65234375, 0.7109375, 0.76953125, 0.828125, 0.88671875, 0.9453125, 1.00390625, 1.0625, 1.12109375, 1.1796875, 1.23828125, 1.296875, 1.35546875, 1.4140625, 1.47265625, 1.53125, 1.58984375, 1.6484375, 1.70703125, 1.765625, 1.82421875, 1.8828125, 1.94140625, 2.0, 2.05859375, 2.1171875, 2.17578125, 2.234375, 2.29296875, 2.3515625, 2.41015625, 2.46875, 2.52734375, 2.5859375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 3.0, 5.0, 6.0, 8.0, 6.0, 14.0, 10.0, 19.0, 14.0, 17.0, 20.0, 28.0, 43.0, 67.0, 74.0, 88.0, 81.0, 114.0, 78.0, 78.0, 40.0, 33.0, 35.0, 16.0, 17.0, 15.0, 13.0, 8.0, 10.0, 8.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85595703125, -0.8297500610351562, -0.8035430908203125, -0.7773361206054688, -0.751129150390625, -0.7249221801757812, -0.6987152099609375, -0.6725082397460938, -0.64630126953125, -0.6200942993164062, -0.5938873291015625, -0.5676803588867188, -0.541473388671875, -0.5152664184570312, -0.4890594482421875, -0.46285247802734375, -0.4366455078125, -0.41043853759765625, -0.3842315673828125, -0.35802459716796875, -0.331817626953125, -0.30561065673828125, -0.2794036865234375, -0.25319671630859375, -0.22698974609375, -0.20078277587890625, -0.1745758056640625, -0.14836883544921875, -0.122161865234375, -0.09595489501953125, -0.0697479248046875, -0.04354095458984375, -0.017333984375, 0.00887298583984375, 0.0350799560546875, 0.06128692626953125, 0.087493896484375, 0.11370086669921875, 0.1399078369140625, 0.16611480712890625, 0.19232177734375, 0.21852874755859375, 0.2447357177734375, 0.27094268798828125, 0.297149658203125, 0.32335662841796875, 0.3495635986328125, 0.37577056884765625, 0.4019775390625, 0.42818450927734375, 0.4543914794921875, 0.48059844970703125, 0.506805419921875, 0.5330123901367188, 0.5592193603515625, 0.5854263305664062, 0.61163330078125, 0.6378402709960938, 0.6640472412109375, 0.6902542114257812, 0.716461181640625, 0.7426681518554688, 0.7688751220703125, 0.7950820922851562, 0.8212890625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 18.0, 69.0, 193.0, 324.0, 272.0, 85.0, 32.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.42273998260498, -13.508069038391113, -12.593398094177246, -11.678727149963379, -10.764056205749512, -9.849384307861328, -8.934713363647461, -8.020042419433594, -7.105371952056885, -6.190701007843018, -5.27603006362915, -4.361358642578125, -3.446687936782837, -2.5320167541503906, -1.6173458099365234, -0.7026748657226562, 0.21199607849121094, 1.1266670227050781, 2.0413379669189453, 2.9560091495513916, 3.870680093765259, 4.785351276397705, 5.700022220611572, 6.6146931648254395, 7.529364109039307, 8.444035530090332, 9.3587064743042, 10.273377418518066, 11.188048362731934, 12.1027193069458, 13.017390251159668, 13.932061195373535, 14.846731185913086, 15.761402130126953, 16.67607307434082, 17.590744018554688, 18.505414962768555, 19.420085906982422, 20.33475685119629, 21.249427795410156, 22.164098739624023, 23.07876968383789, 23.993440628051758, 24.908111572265625, 25.822782516479492, 26.73745346069336, 27.652124404907227, 28.566795349121094, 29.481468200683594, 30.39613914489746, 31.310810089111328, 32.22548294067383, 33.14015197753906, 34.05482482910156, 34.9694938659668, 35.8841667175293, 36.79883575439453, 37.71350860595703, 38.628177642822266, 39.542850494384766, 40.45751953125, 41.3721923828125, 42.286861419677734, 43.201534271240234, 44.11620330810547]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 4.0, 3.0, 5.0, 2.0, 2.0, 4.0, 7.0, 13.0, 10.0, 13.0, 12.0, 17.0, 24.0, 21.0, 38.0, 26.0, 30.0, 41.0, 46.0, 45.0, 49.0, 44.0, 41.0, 27.0, 39.0, 44.0, 38.0, 33.0, 38.0, 48.0, 25.0, 31.0, 31.0, 19.0, 17.0, 29.0, 15.0, 13.0, 11.0, 13.0, 9.0, 9.0, 8.0, 4.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.444147109985352, -6.227850914001465, -6.011554718017578, -5.795258522033691, -5.578962326049805, -5.362666130065918, -5.1463704109191895, -4.930074214935303, -4.713778018951416, -4.497481822967529, -4.281185626983643, -4.064889430999756, -3.8485934734344482, -3.6322972774505615, -3.416001319885254, -3.199705123901367, -2.9834089279174805, -2.7671127319335938, -2.550816535949707, -2.3345205783843994, -2.1182243824005127, -1.901928186416626, -1.6856321096420288, -1.4693360328674316, -1.253039836883545, -1.0367436408996582, -0.820447564125061, -0.6041514277458191, -0.38785529136657715, -0.17155909538269043, 0.04473698139190674, 0.2610330581665039, 0.4773292541503906, 0.6936253905296326, 0.9099215269088745, 1.1262176036834717, 1.3425137996673584, 1.5588099956512451, 1.7751060724258423, 1.9914021492004395, 2.207698345184326, 2.423994541168213, 2.6402907371520996, 2.8565866947174072, 3.072882890701294, 3.2891790866851807, 3.5054750442504883, 3.721771240234375, 3.9380674362182617, 4.154363632202148, 4.370659828186035, 4.586956024169922, 4.803252220153809, 5.019548416137695, 5.235844135284424, 5.4521403312683105, 5.668436527252197, 5.884732723236084, 6.101028919219971, 6.317325115203857, 6.533620834350586, 6.749917030334473, 6.966213226318359, 7.182509422302246, 7.398805618286133]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 7.0, 14.0, 17.0, 26.0, 34.0, 64.0, 91.0, 151.0, 223.0, 359.0, 597.0, 915.0, 1585.0, 2629.0, 4717.0, 8200.0, 14677.0, 27019.0, 51233.0, 99864.0, 204367.0, 464770.0, 1208673.0, 1217416.0, 468342.0, 205634.0, 100381.0, 51226.0, 27110.0, 14462.0, 8192.0, 4578.0, 2611.0, 1473.0, 987.0, 611.0, 345.0, 227.0, 149.0, 93.0, 61.0, 33.0, 37.0, 20.0, 15.0, 16.0, 8.0, 7.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.8876953125, -0.8581085205078125, -0.828521728515625, -0.7989349365234375, -0.76934814453125, -0.7397613525390625, -0.710174560546875, -0.6805877685546875, -0.6510009765625, -0.6214141845703125, -0.591827392578125, -0.5622406005859375, -0.53265380859375, -0.5030670166015625, -0.473480224609375, -0.4438934326171875, -0.414306640625, -0.3847198486328125, -0.355133056640625, -0.3255462646484375, -0.29595947265625, -0.2663726806640625, -0.236785888671875, -0.2071990966796875, -0.1776123046875, -0.1480255126953125, -0.118438720703125, -0.0888519287109375, -0.05926513671875, -0.0296783447265625, -9.1552734375e-05, 0.0294952392578125, 0.05908203125, 0.0886688232421875, 0.118255615234375, 0.1478424072265625, 0.17742919921875, 0.2070159912109375, 0.236602783203125, 0.2661895751953125, 0.2957763671875, 0.3253631591796875, 0.354949951171875, 0.3845367431640625, 0.41412353515625, 0.4437103271484375, 0.473297119140625, 0.5028839111328125, 0.532470703125, 0.5620574951171875, 0.591644287109375, 0.6212310791015625, 0.65081787109375, 0.6804046630859375, 0.709991455078125, 0.7395782470703125, 0.7691650390625, 0.7987518310546875, 0.828338623046875, 0.8579254150390625, 0.88751220703125, 0.9170989990234375, 0.946685791015625, 0.9762725830078125, 1.005859375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 7.0, 9.0, 9.0, 9.0, 11.0, 16.0, 13.0, 17.0, 32.0, 24.0, 24.0, 19.0, 41.0, 49.0, 35.0, 44.0, 44.0, 34.0, 45.0, 46.0, 46.0, 36.0, 48.0, 42.0, 31.0, 33.0, 27.0, 29.0, 28.0, 32.0, 17.0, 18.0, 18.0, 13.0, 8.0, 6.0, 14.0, 7.0, 1.0, 4.0, 5.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.85888671875, -0.8330917358398438, -0.8072967529296875, -0.7815017700195312, -0.755706787109375, -0.7299118041992188, -0.7041168212890625, -0.6783218383789062, -0.65252685546875, -0.6267318725585938, -0.6009368896484375, -0.5751419067382812, -0.549346923828125, -0.5235519409179688, -0.4977569580078125, -0.47196197509765625, -0.4461669921875, -0.42037200927734375, -0.3945770263671875, -0.36878204345703125, -0.342987060546875, -0.31719207763671875, -0.2913970947265625, -0.26560211181640625, -0.23980712890625, -0.21401214599609375, -0.1882171630859375, -0.16242218017578125, -0.136627197265625, -0.11083221435546875, -0.0850372314453125, -0.05924224853515625, -0.033447265625, -0.00765228271484375, 0.0181427001953125, 0.04393768310546875, 0.069732666015625, 0.09552764892578125, 0.1213226318359375, 0.14711761474609375, 0.17291259765625, 0.19870758056640625, 0.2245025634765625, 0.25029754638671875, 0.276092529296875, 0.30188751220703125, 0.3276824951171875, 0.35347747802734375, 0.3792724609375, 0.40506744384765625, 0.4308624267578125, 0.45665740966796875, 0.482452392578125, 0.5082473754882812, 0.5340423583984375, 0.5598373413085938, 0.58563232421875, 0.6114273071289062, 0.6372222900390625, 0.6630172729492188, 0.688812255859375, 0.7146072387695312, 0.7404022216796875, 0.7661972045898438, 0.7919921875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 2.0, 8.0, 4.0, 8.0, 12.0, 15.0, 16.0, 26.0, 35.0, 41.0, 45.0, 72.0, 89.0, 128.0, 188.0, 349.0, 670.0, 1344.0, 3566.0, 11174.0, 43805.0, 216824.0, 1466514.0, 2067597.0, 301218.0, 58366.0, 14195.0, 4467.0, 1603.0, 760.0, 402.0, 214.0, 140.0, 100.0, 62.0, 49.0, 31.0, 32.0, 18.0, 23.0, 21.0, 13.0, 10.0, 10.0, 6.0, 9.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.2109375, -3.11676025390625, -3.0225830078125, -2.92840576171875, -2.834228515625, -2.74005126953125, -2.6458740234375, -2.55169677734375, -2.45751953125, -2.36334228515625, -2.2691650390625, -2.17498779296875, -2.080810546875, -1.98663330078125, -1.8924560546875, -1.79827880859375, -1.7041015625, -1.60992431640625, -1.5157470703125, -1.42156982421875, -1.327392578125, -1.23321533203125, -1.1390380859375, -1.04486083984375, -0.95068359375, -0.85650634765625, -0.7623291015625, -0.66815185546875, -0.573974609375, -0.47979736328125, -0.3856201171875, -0.29144287109375, -0.197265625, -0.10308837890625, -0.0089111328125, 0.08526611328125, 0.179443359375, 0.27362060546875, 0.3677978515625, 0.46197509765625, 0.55615234375, 0.65032958984375, 0.7445068359375, 0.83868408203125, 0.932861328125, 1.02703857421875, 1.1212158203125, 1.21539306640625, 1.3095703125, 1.40374755859375, 1.4979248046875, 1.59210205078125, 1.686279296875, 1.78045654296875, 1.8746337890625, 1.96881103515625, 2.06298828125, 2.15716552734375, 2.2513427734375, 2.34552001953125, 2.439697265625, 2.53387451171875, 2.6280517578125, 2.72222900390625, 2.81640625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 13.0, 28.0, 63.0, 118.0, 248.0, 557.0, 1133.0, 1007.0, 474.0, 212.0, 112.0, 40.0, 27.0, 14.0, 6.0, 10.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.05859375, -5.9205322265625, -5.782470703125, -5.6444091796875, -5.50634765625, -5.3682861328125, -5.230224609375, -5.0921630859375, -4.9541015625, -4.8160400390625, -4.677978515625, -4.5399169921875, -4.40185546875, -4.2637939453125, -4.125732421875, -3.9876708984375, -3.849609375, -3.7115478515625, -3.573486328125, -3.4354248046875, -3.29736328125, -3.1593017578125, -3.021240234375, -2.8831787109375, -2.7451171875, -2.6070556640625, -2.468994140625, -2.3309326171875, -2.19287109375, -2.0548095703125, -1.916748046875, -1.7786865234375, -1.640625, -1.5025634765625, -1.364501953125, -1.2264404296875, -1.08837890625, -0.9503173828125, -0.812255859375, -0.6741943359375, -0.5361328125, -0.3980712890625, -0.260009765625, -0.1219482421875, 0.01611328125, 0.1541748046875, 0.292236328125, 0.4302978515625, 0.568359375, 0.7064208984375, 0.844482421875, 0.9825439453125, 1.12060546875, 1.2586669921875, 1.396728515625, 1.5347900390625, 1.6728515625, 1.8109130859375, 1.948974609375, 2.0870361328125, 2.22509765625, 2.3631591796875, 2.501220703125, 2.6392822265625, 2.77734375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 21.0, 27.0, 32.0, 23.0, 39.0, 71.0, 74.0, 76.0, 92.0, 90.0, 84.0, 76.0, 61.0, 60.0, 42.0, 48.0, 19.0, 15.0, 11.0, 12.0, 8.0, 5.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.539953231811523, -13.22022533416748, -12.900497436523438, -12.580769538879395, -12.261041641235352, -11.941313743591309, -11.621585845947266, -11.301858901977539, -10.98213005065918, -10.662402153015137, -10.342674255371094, -10.02294635772705, -9.703218460083008, -9.383490562438965, -9.063762664794922, -8.744035720825195, -8.424307823181152, -8.10457992553711, -7.784852027893066, -7.465124130249023, -7.1453962326049805, -6.8256683349609375, -6.505940914154053, -6.18621301651001, -5.866485118865967, -5.546757221221924, -5.227029323577881, -4.907301425933838, -4.587574005126953, -4.26784610748291, -3.948118209838867, -3.628390312194824, -3.3086633682250977, -2.9889354705810547, -2.6692075729370117, -2.349479913711548, -2.029752016067505, -1.710024118423462, -1.3902963399887085, -1.070568561553955, -0.7508406639099121, -0.4311128258705139, -0.11138498783111572, 0.20834285020828247, 0.5280706882476807, 0.8477985858917236, 1.167526364326477, 1.4872541427612305, 1.8069820404052734, 2.1267099380493164, 2.4464378356933594, 2.7661654949188232, 3.085893392562866, 3.405621290206909, 3.725348949432373, 4.045076847076416, 4.364804744720459, 4.684532642364502, 5.004260540008545, 5.323988437652588, 5.643715858459473, 5.963443756103516, 6.283171653747559, 6.602899551391602, 6.9226274490356445]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 7.0, 4.0, 13.0, 14.0, 7.0, 15.0, 20.0, 17.0, 26.0, 28.0, 19.0, 23.0, 38.0, 43.0, 40.0, 30.0, 36.0, 39.0, 53.0, 46.0, 46.0, 48.0, 46.0, 45.0, 47.0, 30.0, 25.0, 25.0, 34.0, 19.0, 19.0, 26.0, 21.0, 7.0, 6.0, 13.0, 7.0, 11.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.441129684448242, -7.210515975952148, -6.979902744293213, -6.749289512634277, -6.518675804138184, -6.28806209564209, -6.057448863983154, -5.826835632324219, -5.596221923828125, -5.365608215332031, -5.134994983673096, -4.90438175201416, -4.673768043518066, -4.443154335021973, -4.212541103363037, -3.9819276332855225, -3.751314163208008, -3.520700693130493, -3.2900872230529785, -3.059473752975464, -2.828860282897949, -2.5982468128204346, -2.36763334274292, -2.1370198726654053, -1.9064064025878906, -1.675792932510376, -1.4451794624328613, -1.2145659923553467, -0.983952522277832, -0.7533390522003174, -0.5227255821228027, -0.2921121120452881, -0.06149864196777344, 0.1691148281097412, 0.39972829818725586, 0.6303417682647705, 0.8609552383422852, 1.0915687084197998, 1.3221821784973145, 1.552795648574829, 1.7834091186523438, 2.0140225887298584, 2.244636058807373, 2.4752495288848877, 2.7058629989624023, 2.936476469039917, 3.1670899391174316, 3.3977034091949463, 3.628316879272461, 3.8589303493499756, 4.08954381942749, 4.320157051086426, 4.5507707595825195, 4.781384468078613, 5.011997699737549, 5.242610931396484, 5.473224639892578, 5.703838348388672, 5.934451580047607, 6.165064811706543, 6.395678520202637, 6.6262922286987305, 6.856905460357666, 7.087518692016602, 7.318132400512695]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 6.0, 1.0, 3.0, 1.0, 4.0, 3.0, 10.0, 19.0, 14.0, 31.0, 35.0, 59.0, 99.0, 130.0, 204.0, 251.0, 425.0, 595.0, 851.0, 1260.0, 1823.0, 2621.0, 3756.0, 5552.0, 8063.0, 11710.0, 17295.0, 25865.0, 40089.0, 63891.0, 105791.0, 166926.0, 196776.0, 145360.0, 89355.0, 54707.0, 34388.0, 22406.0, 14989.0, 10280.0, 7099.0, 5014.0, 3391.0, 2269.0, 1580.0, 1082.0, 811.0, 529.0, 373.0, 256.0, 156.0, 111.0, 78.0, 72.0, 39.0, 28.0, 18.0, 10.0, 6.0, 5.0, 1.0, 1.0, 1.0], "bins": [-1.16015625, -1.1253509521484375, -1.090545654296875, -1.0557403564453125, -1.02093505859375, -0.9861297607421875, -0.951324462890625, -0.9165191650390625, -0.8817138671875, -0.8469085693359375, -0.812103271484375, -0.7772979736328125, -0.74249267578125, -0.7076873779296875, -0.672882080078125, -0.6380767822265625, -0.603271484375, -0.5684661865234375, -0.533660888671875, -0.4988555908203125, -0.46405029296875, -0.4292449951171875, -0.394439697265625, -0.3596343994140625, -0.3248291015625, -0.2900238037109375, -0.255218505859375, -0.2204132080078125, -0.18560791015625, -0.1508026123046875, -0.115997314453125, -0.0811920166015625, -0.04638671875, -0.0115814208984375, 0.023223876953125, 0.0580291748046875, 0.09283447265625, 0.1276397705078125, 0.162445068359375, 0.1972503662109375, 0.2320556640625, 0.2668609619140625, 0.301666259765625, 0.3364715576171875, 0.37127685546875, 0.4060821533203125, 0.440887451171875, 0.4756927490234375, 0.510498046875, 0.5453033447265625, 0.580108642578125, 0.6149139404296875, 0.64971923828125, 0.6845245361328125, 0.719329833984375, 0.7541351318359375, 0.7889404296875, 0.8237457275390625, 0.858551025390625, 0.8933563232421875, 0.92816162109375, 0.9629669189453125, 0.997772216796875, 1.0325775146484375, 1.0673828125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 8.0, 1.0, 11.0, 5.0, 5.0, 13.0, 6.0, 23.0, 17.0, 15.0, 24.0, 24.0, 30.0, 32.0, 29.0, 34.0, 34.0, 43.0, 40.0, 41.0, 37.0, 34.0, 57.0, 33.0, 39.0, 43.0, 26.0, 35.0, 29.0, 26.0, 28.0, 34.0, 21.0, 15.0, 12.0, 13.0, 19.0, 15.0, 8.0, 14.0, 6.0, 8.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.98779296875, -0.9585494995117188, -0.9293060302734375, -0.9000625610351562, -0.870819091796875, -0.8415756225585938, -0.8123321533203125, -0.7830886840820312, -0.75384521484375, -0.7246017456054688, -0.6953582763671875, -0.6661148071289062, -0.636871337890625, -0.6076278686523438, -0.5783843994140625, -0.5491409301757812, -0.5198974609375, -0.49065399169921875, -0.4614105224609375, -0.43216705322265625, -0.402923583984375, -0.37368011474609375, -0.3444366455078125, -0.31519317626953125, -0.28594970703125, -0.25670623779296875, -0.2274627685546875, -0.19821929931640625, -0.168975830078125, -0.13973236083984375, -0.1104888916015625, -0.08124542236328125, -0.052001953125, -0.02275848388671875, 0.0064849853515625, 0.03572845458984375, 0.064971923828125, 0.09421539306640625, 0.1234588623046875, 0.15270233154296875, 0.18194580078125, 0.21118927001953125, 0.2404327392578125, 0.26967620849609375, 0.298919677734375, 0.32816314697265625, 0.3574066162109375, 0.38665008544921875, 0.4158935546875, 0.44513702392578125, 0.4743804931640625, 0.5036239624023438, 0.532867431640625, 0.5621109008789062, 0.5913543701171875, 0.6205978393554688, 0.64984130859375, 0.6790847778320312, 0.7083282470703125, 0.7375717163085938, 0.766815185546875, 0.7960586547851562, 0.8253021240234375, 0.8545455932617188, 0.8837890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 2.0, 6.0, 7.0, 11.0, 23.0, 25.0, 41.0, 57.0, 97.0, 105.0, 230.0, 479.0, 1071.0, 3258.0, 12746.0, 49887.0, 229737.0, 546659.0, 155414.0, 35514.0, 9041.0, 2425.0, 826.0, 339.0, 186.0, 128.0, 87.0, 44.0, 30.0, 28.0, 15.0, 14.0, 8.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.44921875, -4.323455810546875, -4.19769287109375, -4.071929931640625, -3.9461669921875, -3.820404052734375, -3.69464111328125, -3.568878173828125, -3.443115234375, -3.317352294921875, -3.19158935546875, -3.065826416015625, -2.9400634765625, -2.814300537109375, -2.68853759765625, -2.562774658203125, -2.43701171875, -2.311248779296875, -2.18548583984375, -2.059722900390625, -1.9339599609375, -1.808197021484375, -1.68243408203125, -1.556671142578125, -1.430908203125, -1.305145263671875, -1.17938232421875, -1.053619384765625, -0.9278564453125, -0.802093505859375, -0.67633056640625, -0.550567626953125, -0.4248046875, -0.299041748046875, -0.17327880859375, -0.047515869140625, 0.0782470703125, 0.204010009765625, 0.32977294921875, 0.455535888671875, 0.581298828125, 0.707061767578125, 0.83282470703125, 0.958587646484375, 1.0843505859375, 1.210113525390625, 1.33587646484375, 1.461639404296875, 1.58740234375, 1.713165283203125, 1.83892822265625, 1.964691162109375, 2.0904541015625, 2.216217041015625, 2.34197998046875, 2.467742919921875, 2.593505859375, 2.719268798828125, 2.84503173828125, 2.970794677734375, 3.0965576171875, 3.222320556640625, 3.34808349609375, 3.473846435546875, 3.599609375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 4.0, 2.0, 4.0, 4.0, 4.0, 8.0, 12.0, 13.0, 21.0, 17.0, 23.0, 17.0, 34.0, 36.0, 36.0, 40.0, 50.0, 54.0, 38.0, 48.0, 52.0, 46.0, 49.0, 42.0, 47.0, 45.0, 37.0, 34.0, 29.0, 19.0, 25.0, 21.0, 19.0, 16.0, 14.0, 14.0, 4.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.927734375, -3.792327880859375, -3.65692138671875, -3.521514892578125, -3.3861083984375, -3.250701904296875, -3.11529541015625, -2.979888916015625, -2.844482421875, -2.709075927734375, -2.57366943359375, -2.438262939453125, -2.3028564453125, -2.167449951171875, -2.03204345703125, -1.896636962890625, -1.76123046875, -1.625823974609375, -1.49041748046875, -1.355010986328125, -1.2196044921875, -1.084197998046875, -0.94879150390625, -0.813385009765625, -0.677978515625, -0.542572021484375, -0.40716552734375, -0.271759033203125, -0.1363525390625, -0.000946044921875, 0.13446044921875, 0.269866943359375, 0.4052734375, 0.540679931640625, 0.67608642578125, 0.811492919921875, 0.9468994140625, 1.082305908203125, 1.21771240234375, 1.353118896484375, 1.488525390625, 1.623931884765625, 1.75933837890625, 1.894744873046875, 2.0301513671875, 2.165557861328125, 2.30096435546875, 2.436370849609375, 2.57177734375, 2.707183837890625, 2.84259033203125, 2.977996826171875, 3.1134033203125, 3.248809814453125, 3.38421630859375, 3.519622802734375, 3.655029296875, 3.790435791015625, 3.92584228515625, 4.061248779296875, 4.1966552734375, 4.332061767578125, 4.46746826171875, 4.602874755859375, 4.73828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 2.0, 13.0, 7.0, 20.0, 19.0, 33.0, 24.0, 66.0, 75.0, 154.0, 217.0, 354.0, 673.0, 1437.0, 3537.0, 9492.0, 28188.0, 90631.0, 327764.0, 410399.0, 119590.0, 35775.0, 12047.0, 4394.0, 1728.0, 822.0, 428.0, 221.0, 159.0, 91.0, 60.0, 46.0, 33.0, 13.0, 15.0, 9.0, 3.0, 5.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.45703125, -1.41302490234375, -1.3690185546875, -1.32501220703125, -1.281005859375, -1.23699951171875, -1.1929931640625, -1.14898681640625, -1.10498046875, -1.06097412109375, -1.0169677734375, -0.97296142578125, -0.928955078125, -0.88494873046875, -0.8409423828125, -0.79693603515625, -0.7529296875, -0.70892333984375, -0.6649169921875, -0.62091064453125, -0.576904296875, -0.53289794921875, -0.4888916015625, -0.44488525390625, -0.40087890625, -0.35687255859375, -0.3128662109375, -0.26885986328125, -0.224853515625, -0.18084716796875, -0.1368408203125, -0.09283447265625, -0.048828125, -0.00482177734375, 0.0391845703125, 0.08319091796875, 0.127197265625, 0.17120361328125, 0.2152099609375, 0.25921630859375, 0.30322265625, 0.34722900390625, 0.3912353515625, 0.43524169921875, 0.479248046875, 0.52325439453125, 0.5672607421875, 0.61126708984375, 0.6552734375, 0.69927978515625, 0.7432861328125, 0.78729248046875, 0.831298828125, 0.87530517578125, 0.9193115234375, 0.96331787109375, 1.00732421875, 1.05133056640625, 1.0953369140625, 1.13934326171875, 1.183349609375, 1.22735595703125, 1.2713623046875, 1.31536865234375, 1.359375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 10.0, 8.0, 4.0, 10.0, 11.0, 6.0, 20.0, 27.0, 32.0, 37.0, 77.0, 97.0, 154.0, 167.0, 107.0, 67.0, 46.0, 36.0, 25.0, 23.0, 18.0, 8.0, 8.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023555755615234375, -0.0002248510718345642, -0.00021414458751678467, -0.00020343810319900513, -0.00019273161888122559, -0.00018202513456344604, -0.0001713186502456665, -0.00016061216592788696, -0.00014990568161010742, -0.00013919919729232788, -0.00012849271297454834, -0.0001177862286567688, -0.00010707974433898926, -9.637326002120972e-05, -8.566677570343018e-05, -7.496029138565063e-05, -6.42538070678711e-05, -5.354732275009155e-05, -4.284083843231201e-05, -3.213435411453247e-05, -2.142786979675293e-05, -1.0721385478973389e-05, -1.4901161193847656e-08, 1.0691583156585693e-05, 2.1398067474365234e-05, 3.2104551792144775e-05, 4.2811036109924316e-05, 5.351752042770386e-05, 6.42240047454834e-05, 7.493048906326294e-05, 8.563697338104248e-05, 9.634345769882202e-05, 0.00010704994201660156, 0.0001177564263343811, 0.00012846291065216064, 0.00013916939496994019, 0.00014987587928771973, 0.00016058236360549927, 0.0001712888479232788, 0.00018199533224105835, 0.0001927018165588379, 0.00020340830087661743, 0.00021411478519439697, 0.00022482126951217651, 0.00023552775382995605, 0.0002462342381477356, 0.00025694072246551514, 0.0002676472067832947, 0.0002783536911010742, 0.00028906017541885376, 0.0002997666597366333, 0.00031047314405441284, 0.0003211796283721924, 0.0003318861126899719, 0.00034259259700775146, 0.000353299081325531, 0.00036400556564331055, 0.0003747120499610901, 0.00038541853427886963, 0.00039612501859664917, 0.0004068315029144287, 0.00041753798723220825, 0.0004282444715499878, 0.00043895095586776733, 0.0004496574401855469]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 9.0, 10.0, 13.0, 19.0, 31.0, 42.0, 52.0, 126.0, 231.0, 434.0, 907.0, 2375.0, 6238.0, 17937.0, 55313.0, 181218.0, 444516.0, 233618.0, 70214.0, 22406.0, 7719.0, 2897.0, 1121.0, 484.0, 232.0, 134.0, 85.0, 54.0, 25.0, 21.0, 16.0, 20.0, 9.0, 8.0, 4.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2473297119140625, -1.206573486328125, -1.1658172607421875, -1.12506103515625, -1.0843048095703125, -1.043548583984375, -1.0027923583984375, -0.9620361328125, -0.9212799072265625, -0.880523681640625, -0.8397674560546875, -0.79901123046875, -0.7582550048828125, -0.717498779296875, -0.6767425537109375, -0.635986328125, -0.5952301025390625, -0.554473876953125, -0.5137176513671875, -0.47296142578125, -0.4322052001953125, -0.391448974609375, -0.3506927490234375, -0.3099365234375, -0.2691802978515625, -0.228424072265625, -0.1876678466796875, -0.14691162109375, -0.1061553955078125, -0.065399169921875, -0.0246429443359375, 0.01611328125, 0.0568695068359375, 0.097625732421875, 0.1383819580078125, 0.17913818359375, 0.2198944091796875, 0.260650634765625, 0.3014068603515625, 0.3421630859375, 0.3829193115234375, 0.423675537109375, 0.4644317626953125, 0.50518798828125, 0.5459442138671875, 0.586700439453125, 0.6274566650390625, 0.668212890625, 0.7089691162109375, 0.749725341796875, 0.7904815673828125, 0.83123779296875, 0.8719940185546875, 0.912750244140625, 0.9535064697265625, 0.9942626953125, 1.0350189208984375, 1.075775146484375, 1.1165313720703125, 1.15728759765625, 1.1980438232421875, 1.238800048828125, 1.2795562744140625, 1.3203125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 5.0, 9.0, 6.0, 7.0, 21.0, 23.0, 18.0, 21.0, 39.0, 46.0, 63.0, 109.0, 109.0, 107.0, 82.0, 79.0, 57.0, 45.0, 32.0, 32.0, 24.0, 14.0, 8.0, 11.0, 10.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1982421875, -1.1555938720703125, -1.112945556640625, -1.0702972412109375, -1.02764892578125, -0.9850006103515625, -0.942352294921875, -0.8997039794921875, -0.8570556640625, -0.8144073486328125, -0.771759033203125, -0.7291107177734375, -0.68646240234375, -0.6438140869140625, -0.601165771484375, -0.5585174560546875, -0.515869140625, -0.4732208251953125, -0.430572509765625, -0.3879241943359375, -0.34527587890625, -0.3026275634765625, -0.259979248046875, -0.2173309326171875, -0.1746826171875, -0.1320343017578125, -0.089385986328125, -0.0467376708984375, -0.00408935546875, 0.0385589599609375, 0.081207275390625, 0.1238555908203125, 0.16650390625, 0.2091522216796875, 0.251800537109375, 0.2944488525390625, 0.33709716796875, 0.3797454833984375, 0.422393798828125, 0.4650421142578125, 0.5076904296875, 0.5503387451171875, 0.592987060546875, 0.6356353759765625, 0.67828369140625, 0.7209320068359375, 0.763580322265625, 0.8062286376953125, 0.848876953125, 0.8915252685546875, 0.934173583984375, 0.9768218994140625, 1.01947021484375, 1.0621185302734375, 1.104766845703125, 1.1474151611328125, 1.1900634765625, 1.2327117919921875, 1.275360107421875, 1.3180084228515625, 1.36065673828125, 1.4033050537109375, 1.445953369140625, 1.4886016845703125, 1.53125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 10.0, 23.0, 46.0, 72.0, 137.0, 188.0, 189.0, 158.0, 103.0, 50.0, 20.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-33.88689422607422, -33.05841064453125, -32.229923248291016, -31.401437759399414, -30.572952270507812, -29.74446678161621, -28.91598129272461, -28.087495803833008, -27.259010314941406, -26.430524826049805, -25.602039337158203, -24.7735538482666, -23.945068359375, -23.1165828704834, -22.288097381591797, -21.459611892700195, -20.631126403808594, -19.802640914916992, -18.97415542602539, -18.14566993713379, -17.317184448242188, -16.488698959350586, -15.660213470458984, -14.831727981567383, -14.003242492675781, -13.17475700378418, -12.346271514892578, -11.517786026000977, -10.689300537109375, -9.860815048217773, -9.032329559326172, -8.20384407043457, -7.375360488891602, -6.546875, -5.718389511108398, -4.889904022216797, -4.061418533325195, -3.2329330444335938, -2.404447555541992, -1.5759620666503906, -0.7474765777587891, 0.0810089111328125, 0.9094944000244141, 1.7379798889160156, 2.566465377807617, 3.3949508666992188, 4.22343635559082, 5.051921844482422, 5.880407333374023, 6.708892822265625, 7.537378311157227, 8.365863800048828, 9.19434928894043, 10.022834777832031, 10.851320266723633, 11.679805755615234, 12.508291244506836, 13.336776733398438, 14.165262222290039, 14.99374771118164, 15.822233200073242, 16.650718688964844, 17.479204177856445, 18.307689666748047, 19.13617515563965]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 8.0, 6.0, 11.0, 9.0, 8.0, 6.0, 9.0, 13.0, 18.0, 9.0, 21.0, 34.0, 18.0, 27.0, 32.0, 37.0, 39.0, 48.0, 48.0, 55.0, 43.0, 48.0, 46.0, 47.0, 40.0, 37.0, 34.0, 30.0, 31.0, 20.0, 30.0, 23.0, 14.0, 19.0, 25.0, 17.0, 11.0, 5.0, 8.0, 7.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.066290855407715, -11.652278900146484, -11.238265991210938, -10.824254035949707, -10.410242080688477, -9.996230125427246, -9.582218170166016, -9.168205261230469, -8.754193305969238, -8.340181350708008, -7.926168918609619, -7.5121564865112305, -7.09814453125, -6.6841325759887695, -6.270120143890381, -5.856107711791992, -5.442095756530762, -5.028083801269531, -4.614071369171143, -4.200058937072754, -3.7860469818115234, -3.372034788131714, -2.9580225944519043, -2.5440104007720947, -2.129998207092285, -1.7159860134124756, -1.301973819732666, -0.8879616260528564, -0.4739494323730469, -0.059937238693237305, 0.35407495498657227, 0.7680871486663818, 1.182098388671875, 1.5961105823516846, 2.010122776031494, 2.4241349697113037, 2.8381471633911133, 3.252159357070923, 3.6661715507507324, 4.080183982849121, 4.494195938110352, 4.908207893371582, 5.322220325469971, 5.736232757568359, 6.15024471282959, 6.56425666809082, 6.978269100189209, 7.392281532287598, 7.806293487548828, 8.220305442810059, 8.634317398071289, 9.048330307006836, 9.462342262268066, 9.876354217529297, 10.290367126464844, 10.704379081726074, 11.118391036987305, 11.532402992248535, 11.946414947509766, 12.360427856445312, 12.774439811706543, 13.188451766967773, 13.60246467590332, 14.01647663116455, 14.430488586425781]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 8.0, 16.0, 17.0, 30.0, 45.0, 72.0, 102.0, 166.0, 261.0, 455.0, 768.0, 1152.0, 1953.0, 3364.0, 5757.0, 10452.0, 19352.0, 36869.0, 71688.0, 149888.0, 343327.0, 893925.0, 1506206.0, 649631.0, 257906.0, 116945.0, 57394.0, 29775.0, 15939.0, 8729.0, 4924.0, 2867.0, 1686.0, 972.0, 613.0, 375.0, 231.0, 137.0, 109.0, 66.0, 34.0, 25.0, 11.0, 16.0, 9.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.10546875, -1.0701904296875, -1.034912109375, -0.9996337890625, -0.96435546875, -0.9290771484375, -0.893798828125, -0.8585205078125, -0.8232421875, -0.7879638671875, -0.752685546875, -0.7174072265625, -0.68212890625, -0.6468505859375, -0.611572265625, -0.5762939453125, -0.541015625, -0.5057373046875, -0.470458984375, -0.4351806640625, -0.39990234375, -0.3646240234375, -0.329345703125, -0.2940673828125, -0.2587890625, -0.2235107421875, -0.188232421875, -0.1529541015625, -0.11767578125, -0.0823974609375, -0.047119140625, -0.0118408203125, 0.0234375, 0.0587158203125, 0.093994140625, 0.1292724609375, 0.16455078125, 0.1998291015625, 0.235107421875, 0.2703857421875, 0.3056640625, 0.3409423828125, 0.376220703125, 0.4114990234375, 0.44677734375, 0.4820556640625, 0.517333984375, 0.5526123046875, 0.587890625, 0.6231689453125, 0.658447265625, 0.6937255859375, 0.72900390625, 0.7642822265625, 0.799560546875, 0.8348388671875, 0.8701171875, 0.9053955078125, 0.940673828125, 0.9759521484375, 1.01123046875, 1.0465087890625, 1.081787109375, 1.1170654296875, 1.15234375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 8.0, 7.0, 11.0, 16.0, 20.0, 23.0, 22.0, 18.0, 23.0, 38.0, 36.0, 52.0, 37.0, 39.0, 46.0, 69.0, 60.0, 49.0, 47.0, 39.0, 30.0, 50.0, 37.0, 35.0, 32.0, 22.0, 19.0, 15.0, 20.0, 15.0, 18.0, 9.0, 7.0, 10.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2666015625, -1.2223358154296875, -1.178070068359375, -1.1338043212890625, -1.08953857421875, -1.0452728271484375, -1.001007080078125, -0.9567413330078125, -0.9124755859375, -0.8682098388671875, -0.823944091796875, -0.7796783447265625, -0.73541259765625, -0.6911468505859375, -0.646881103515625, -0.6026153564453125, -0.558349609375, -0.5140838623046875, -0.469818115234375, -0.4255523681640625, -0.38128662109375, -0.3370208740234375, -0.292755126953125, -0.2484893798828125, -0.2042236328125, -0.1599578857421875, -0.115692138671875, -0.0714263916015625, -0.02716064453125, 0.0171051025390625, 0.061370849609375, 0.1056365966796875, 0.14990234375, 0.1941680908203125, 0.238433837890625, 0.2826995849609375, 0.32696533203125, 0.3712310791015625, 0.415496826171875, 0.4597625732421875, 0.5040283203125, 0.5482940673828125, 0.592559814453125, 0.6368255615234375, 0.68109130859375, 0.7253570556640625, 0.769622802734375, 0.8138885498046875, 0.858154296875, 0.9024200439453125, 0.946685791015625, 0.9909515380859375, 1.03521728515625, 1.0794830322265625, 1.123748779296875, 1.1680145263671875, 1.2122802734375, 1.2565460205078125, 1.300811767578125, 1.3450775146484375, 1.38934326171875, 1.4336090087890625, 1.477874755859375, 1.5221405029296875, 1.56640625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 7.0, 4.0, 20.0, 26.0, 28.0, 49.0, 78.0, 147.0, 207.0, 309.0, 542.0, 839.0, 1555.0, 2667.0, 4750.0, 8924.0, 16995.0, 33630.0, 69133.0, 147944.0, 350736.0, 983454.0, 1539548.0, 599467.0, 230305.0, 101961.0, 49149.0, 24248.0, 12417.0, 6518.0, 3527.0, 2021.0, 1253.0, 712.0, 420.0, 251.0, 139.0, 102.0, 72.0, 52.0, 32.0, 17.0, 14.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.443359375, -1.392303466796875, -1.34124755859375, -1.290191650390625, -1.2391357421875, -1.188079833984375, -1.13702392578125, -1.085968017578125, -1.034912109375, -0.983856201171875, -0.93280029296875, -0.881744384765625, -0.8306884765625, -0.779632568359375, -0.72857666015625, -0.677520751953125, -0.62646484375, -0.575408935546875, -0.52435302734375, -0.473297119140625, -0.4222412109375, -0.371185302734375, -0.32012939453125, -0.269073486328125, -0.218017578125, -0.166961669921875, -0.11590576171875, -0.064849853515625, -0.0137939453125, 0.037261962890625, 0.08831787109375, 0.139373779296875, 0.1904296875, 0.241485595703125, 0.29254150390625, 0.343597412109375, 0.3946533203125, 0.445709228515625, 0.49676513671875, 0.547821044921875, 0.598876953125, 0.649932861328125, 0.70098876953125, 0.752044677734375, 0.8031005859375, 0.854156494140625, 0.90521240234375, 0.956268310546875, 1.00732421875, 1.058380126953125, 1.10943603515625, 1.160491943359375, 1.2115478515625, 1.262603759765625, 1.31365966796875, 1.364715576171875, 1.415771484375, 1.466827392578125, 1.51788330078125, 1.568939208984375, 1.6199951171875, 1.671051025390625, 1.72210693359375, 1.773162841796875, 1.82421875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 9.0, 8.0, 6.0, 15.0, 17.0, 18.0, 39.0, 42.0, 70.0, 78.0, 114.0, 148.0, 230.0, 324.0, 539.0, 670.0, 534.0, 407.0, 255.0, 153.0, 86.0, 93.0, 49.0, 42.0, 26.0, 20.0, 14.0, 17.0, 10.0, 5.0, 8.0, 8.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.96484375, -2.8817138671875, -2.798583984375, -2.7154541015625, -2.63232421875, -2.5491943359375, -2.466064453125, -2.3829345703125, -2.2998046875, -2.2166748046875, -2.133544921875, -2.0504150390625, -1.96728515625, -1.8841552734375, -1.801025390625, -1.7178955078125, -1.634765625, -1.5516357421875, -1.468505859375, -1.3853759765625, -1.30224609375, -1.2191162109375, -1.135986328125, -1.0528564453125, -0.9697265625, -0.8865966796875, -0.803466796875, -0.7203369140625, -0.63720703125, -0.5540771484375, -0.470947265625, -0.3878173828125, -0.3046875, -0.2215576171875, -0.138427734375, -0.0552978515625, 0.02783203125, 0.1109619140625, 0.194091796875, 0.2772216796875, 0.3603515625, 0.4434814453125, 0.526611328125, 0.6097412109375, 0.69287109375, 0.7760009765625, 0.859130859375, 0.9422607421875, 1.025390625, 1.1085205078125, 1.191650390625, 1.2747802734375, 1.35791015625, 1.4410400390625, 1.524169921875, 1.6072998046875, 1.6904296875, 1.7735595703125, 1.856689453125, 1.9398193359375, 2.02294921875, 2.1060791015625, 2.189208984375, 2.2723388671875, 2.35546875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 10.0, 9.0, 14.0, 36.0, 38.0, 61.0, 79.0, 102.0, 114.0, 126.0, 103.0, 109.0, 74.0, 42.0, 34.0, 26.0, 9.0, 7.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.861881256103516, -14.406631469726562, -13.951382637023926, -13.496132850646973, -13.04088306427002, -12.585634231567383, -12.13038444519043, -11.675134658813477, -11.219884872436523, -10.76463508605957, -10.309386253356934, -9.85413646697998, -9.398886680603027, -8.94363784790039, -8.488388061523438, -8.033138275146484, -7.5778889656066895, -7.1226396560668945, -6.667389869689941, -6.2121405601501465, -5.756890773773193, -5.301641464233398, -4.846391677856445, -4.39114236831665, -3.9358928203582764, -3.4806432723999023, -3.0253937244415283, -2.5701441764831543, -2.1148948669433594, -1.6596453189849854, -1.2043957710266113, -0.7491462230682373, -0.2938966751098633, 0.16135284304618835, 0.61660236120224, 1.0718518495559692, 1.5271013975143433, 1.9823508262634277, 2.4376003742218018, 2.892849922180176, 3.34809947013855, 3.803349018096924, 4.258598327636719, 4.713848114013672, 5.169097423553467, 5.624346733093262, 6.079596519470215, 6.534846305847168, 6.990095615386963, 7.445344924926758, 7.900594711303711, 8.355844497680664, 8.8110933303833, 9.266343116760254, 9.721592903137207, 10.176841735839844, 10.632091522216797, 11.08734130859375, 11.542590141296387, 11.99783992767334, 12.453089714050293, 12.90833854675293, 13.363588333129883, 13.818838119506836, 14.274087905883789]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 7.0, 5.0, 6.0, 14.0, 15.0, 18.0, 16.0, 18.0, 21.0, 27.0, 32.0, 30.0, 34.0, 41.0, 43.0, 54.0, 52.0, 41.0, 44.0, 52.0, 45.0, 50.0, 42.0, 33.0, 35.0, 30.0, 23.0, 25.0, 18.0, 23.0, 23.0, 16.0, 21.0, 8.0, 8.0, 5.0, 4.0, 6.0, 5.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.679339408874512, -9.3921537399292, -9.104968070983887, -8.817782402038574, -8.530596733093262, -8.24341106414795, -7.956225395202637, -7.669039726257324, -7.381854057312012, -7.094668388366699, -6.807482719421387, -6.520297050476074, -6.233111381530762, -5.945925712585449, -5.658740043640137, -5.371554374694824, -5.08436918258667, -4.797183513641357, -4.509997844696045, -4.222812175750732, -3.93562650680542, -3.6484408378601074, -3.361255407333374, -3.0740697383880615, -2.786884069442749, -2.4996984004974365, -2.212512731552124, -1.925327181816101, -1.6381415128707886, -1.350955843925476, -1.0637702941894531, -0.7765846252441406, -0.4893989562988281, -0.202213317155838, 0.0849723219871521, 0.3721579313278198, 0.6593436002731323, 0.9465292692184448, 1.2337148189544678, 1.5209004878997803, 1.8080861568450928, 2.0952718257904053, 2.3824574947357178, 2.669642925262451, 2.9568285942077637, 3.244014263153076, 3.5311999320983887, 3.818385601043701, 4.105571269989014, 4.392756938934326, 4.679942607879639, 4.967128276824951, 5.254313945770264, 5.541499614715576, 5.8286848068237305, 6.115870475769043, 6.4030561447143555, 6.690241813659668, 6.9774274826049805, 7.264613151550293, 7.5517988204956055, 7.838984489440918, 8.12617015838623, 8.413355827331543, 8.700541496276855]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 8.0, 11.0, 17.0, 20.0, 29.0, 61.0, 75.0, 101.0, 157.0, 241.0, 336.0, 534.0, 785.0, 1123.0, 1701.0, 2628.0, 3758.0, 5798.0, 8869.0, 13858.0, 21847.0, 36680.0, 66825.0, 140074.0, 271254.0, 227883.0, 106132.0, 53707.0, 30833.0, 18466.0, 11699.0, 7816.0, 5024.0, 3357.0, 2271.0, 1469.0, 1045.0, 682.0, 482.0, 309.0, 186.0, 154.0, 83.0, 57.0, 34.0, 22.0, 23.0, 12.0, 12.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.3466796875, -1.3043670654296875, -1.262054443359375, -1.2197418212890625, -1.17742919921875, -1.1351165771484375, -1.092803955078125, -1.0504913330078125, -1.0081787109375, -0.9658660888671875, -0.923553466796875, -0.8812408447265625, -0.83892822265625, -0.7966156005859375, -0.754302978515625, -0.7119903564453125, -0.669677734375, -0.6273651123046875, -0.585052490234375, -0.5427398681640625, -0.50042724609375, -0.4581146240234375, -0.415802001953125, -0.3734893798828125, -0.3311767578125, -0.2888641357421875, -0.246551513671875, -0.2042388916015625, -0.16192626953125, -0.1196136474609375, -0.077301025390625, -0.0349884033203125, 0.00732421875, 0.0496368408203125, 0.091949462890625, 0.1342620849609375, 0.17657470703125, 0.2188873291015625, 0.261199951171875, 0.3035125732421875, 0.3458251953125, 0.3881378173828125, 0.430450439453125, 0.4727630615234375, 0.51507568359375, 0.5573883056640625, 0.599700927734375, 0.6420135498046875, 0.684326171875, 0.7266387939453125, 0.768951416015625, 0.8112640380859375, 0.85357666015625, 0.8958892822265625, 0.938201904296875, 0.9805145263671875, 1.0228271484375, 1.0651397705078125, 1.107452392578125, 1.1497650146484375, 1.19207763671875, 1.2343902587890625, 1.276702880859375, 1.3190155029296875, 1.361328125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 8.0, 15.0, 13.0, 19.0, 17.0, 15.0, 27.0, 30.0, 26.0, 34.0, 34.0, 33.0, 38.0, 50.0, 31.0, 56.0, 52.0, 47.0, 32.0, 56.0, 51.0, 53.0, 35.0, 32.0, 27.0, 28.0, 24.0, 29.0, 16.0, 14.0, 14.0, 10.0, 13.0, 7.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2265625, -1.1873321533203125, -1.148101806640625, -1.1088714599609375, -1.06964111328125, -1.0304107666015625, -0.991180419921875, -0.9519500732421875, -0.9127197265625, -0.8734893798828125, -0.834259033203125, -0.7950286865234375, -0.75579833984375, -0.7165679931640625, -0.677337646484375, -0.6381072998046875, -0.598876953125, -0.5596466064453125, -0.520416259765625, -0.4811859130859375, -0.44195556640625, -0.4027252197265625, -0.363494873046875, -0.3242645263671875, -0.2850341796875, -0.2458038330078125, -0.206573486328125, -0.1673431396484375, -0.12811279296875, -0.0888824462890625, -0.049652099609375, -0.0104217529296875, 0.02880859375, 0.0680389404296875, 0.107269287109375, 0.1464996337890625, 0.18572998046875, 0.2249603271484375, 0.264190673828125, 0.3034210205078125, 0.3426513671875, 0.3818817138671875, 0.421112060546875, 0.4603424072265625, 0.49957275390625, 0.5388031005859375, 0.578033447265625, 0.6172637939453125, 0.656494140625, 0.6957244873046875, 0.734954833984375, 0.7741851806640625, 0.81341552734375, 0.8526458740234375, 0.891876220703125, 0.9311065673828125, 0.9703369140625, 1.0095672607421875, 1.048797607421875, 1.0880279541015625, 1.12725830078125, 1.1664886474609375, 1.205718994140625, 1.2449493408203125, 1.2841796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 5.0, 11.0, 6.0, 15.0, 14.0, 30.0, 34.0, 50.0, 78.0, 126.0, 209.0, 384.0, 771.0, 1658.0, 3664.0, 8014.0, 17766.0, 40265.0, 104780.0, 356839.0, 342729.0, 100560.0, 38810.0, 17039.0, 7799.0, 3585.0, 1545.0, 768.0, 395.0, 214.0, 115.0, 81.0, 46.0, 35.0, 39.0, 20.0, 12.0, 9.0, 9.0, 7.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.48046875, -2.407470703125, -2.33447265625, -2.261474609375, -2.1884765625, -2.115478515625, -2.04248046875, -1.969482421875, -1.896484375, -1.823486328125, -1.75048828125, -1.677490234375, -1.6044921875, -1.531494140625, -1.45849609375, -1.385498046875, -1.3125, -1.239501953125, -1.16650390625, -1.093505859375, -1.0205078125, -0.947509765625, -0.87451171875, -0.801513671875, -0.728515625, -0.655517578125, -0.58251953125, -0.509521484375, -0.4365234375, -0.363525390625, -0.29052734375, -0.217529296875, -0.14453125, -0.071533203125, 0.00146484375, 0.074462890625, 0.1474609375, 0.220458984375, 0.29345703125, 0.366455078125, 0.439453125, 0.512451171875, 0.58544921875, 0.658447265625, 0.7314453125, 0.804443359375, 0.87744140625, 0.950439453125, 1.0234375, 1.096435546875, 1.16943359375, 1.242431640625, 1.3154296875, 1.388427734375, 1.46142578125, 1.534423828125, 1.607421875, 1.680419921875, 1.75341796875, 1.826416015625, 1.8994140625, 1.972412109375, 2.04541015625, 2.118408203125, 2.19140625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 12.0, 8.0, 13.0, 19.0, 12.0, 23.0, 25.0, 25.0, 32.0, 27.0, 27.0, 33.0, 40.0, 35.0, 50.0, 48.0, 43.0, 50.0, 40.0, 51.0, 40.0, 50.0, 30.0, 32.0, 37.0, 26.0, 14.0, 29.0, 29.0, 20.0, 12.0, 15.0, 11.0, 6.0, 8.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.43359375, -3.326873779296875, -3.22015380859375, -3.113433837890625, -3.0067138671875, -2.899993896484375, -2.79327392578125, -2.686553955078125, -2.579833984375, -2.473114013671875, -2.36639404296875, -2.259674072265625, -2.1529541015625, -2.046234130859375, -1.93951416015625, -1.832794189453125, -1.72607421875, -1.619354248046875, -1.51263427734375, -1.405914306640625, -1.2991943359375, -1.192474365234375, -1.08575439453125, -0.979034423828125, -0.872314453125, -0.765594482421875, -0.65887451171875, -0.552154541015625, -0.4454345703125, -0.338714599609375, -0.23199462890625, -0.125274658203125, -0.0185546875, 0.088165283203125, 0.19488525390625, 0.301605224609375, 0.4083251953125, 0.515045166015625, 0.62176513671875, 0.728485107421875, 0.835205078125, 0.941925048828125, 1.04864501953125, 1.155364990234375, 1.2620849609375, 1.368804931640625, 1.47552490234375, 1.582244873046875, 1.68896484375, 1.795684814453125, 1.90240478515625, 2.009124755859375, 2.1158447265625, 2.222564697265625, 2.32928466796875, 2.436004638671875, 2.542724609375, 2.649444580078125, 2.75616455078125, 2.862884521484375, 2.9696044921875, 3.076324462890625, 3.18304443359375, 3.289764404296875, 3.396484375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 6.0, 23.0, 25.0, 32.0, 59.0, 81.0, 105.0, 197.0, 285.0, 511.0, 768.0, 1351.0, 2343.0, 3823.0, 6581.0, 11411.0, 19262.0, 32139.0, 53658.0, 93824.0, 188325.0, 268672.0, 162666.0, 83137.0, 48591.0, 28818.0, 17017.0, 10132.0, 6027.0, 3410.0, 2026.0, 1215.0, 719.0, 485.0, 277.0, 177.0, 121.0, 79.0, 44.0, 37.0, 25.0, 15.0, 11.0, 11.0, 11.0, 6.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.56494140625, -0.5480270385742188, -0.5311126708984375, -0.5141983032226562, -0.497283935546875, -0.48036956787109375, -0.4634552001953125, -0.44654083251953125, -0.42962646484375, -0.41271209716796875, -0.3957977294921875, -0.37888336181640625, -0.361968994140625, -0.34505462646484375, -0.3281402587890625, -0.31122589111328125, -0.2943115234375, -0.27739715576171875, -0.2604827880859375, -0.24356842041015625, -0.226654052734375, -0.20973968505859375, -0.1928253173828125, -0.17591094970703125, -0.15899658203125, -0.14208221435546875, -0.1251678466796875, -0.10825347900390625, -0.091339111328125, -0.07442474365234375, -0.0575103759765625, -0.04059600830078125, -0.023681640625, -0.00676727294921875, 0.0101470947265625, 0.02706146240234375, 0.043975830078125, 0.06089019775390625, 0.0778045654296875, 0.09471893310546875, 0.11163330078125, 0.12854766845703125, 0.1454620361328125, 0.16237640380859375, 0.179290771484375, 0.19620513916015625, 0.2131195068359375, 0.23003387451171875, 0.2469482421875, 0.26386260986328125, 0.2807769775390625, 0.29769134521484375, 0.314605712890625, 0.33152008056640625, 0.3484344482421875, 0.36534881591796875, 0.38226318359375, 0.39917755126953125, 0.4160919189453125, 0.43300628662109375, 0.449920654296875, 0.46683502197265625, 0.4837493896484375, 0.5006637573242188, 0.517578125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 6.0, 13.0, 8.0, 11.0, 5.0, 12.0, 4.0, 16.0, 19.0, 29.0, 30.0, 50.0, 47.0, 95.0, 105.0, 119.0, 107.0, 79.0, 58.0, 31.0, 33.0, 25.0, 20.0, 9.0, 11.0, 10.0, 8.0, 4.0, 3.0, 1.0, 1.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0001919269561767578, -0.00018578767776489258, -0.00017964839935302734, -0.0001735091209411621, -0.00016736984252929688, -0.00016123056411743164, -0.0001550912857055664, -0.00014895200729370117, -0.00014281272888183594, -0.0001366734504699707, -0.00013053417205810547, -0.00012439489364624023, -0.000118255615234375, -0.00011211633682250977, -0.00010597705841064453, -9.98377799987793e-05, -9.369850158691406e-05, -8.755922317504883e-05, -8.14199447631836e-05, -7.528066635131836e-05, -6.914138793945312e-05, -6.300210952758789e-05, -5.6862831115722656e-05, -5.072355270385742e-05, -4.458427429199219e-05, -3.844499588012695e-05, -3.230571746826172e-05, -2.6166439056396484e-05, -2.002716064453125e-05, -1.3887882232666016e-05, -7.748603820800781e-06, -1.6093254089355469e-06, 4.5299530029296875e-06, 1.0669231414794922e-05, 1.6808509826660156e-05, 2.294778823852539e-05, 2.9087066650390625e-05, 3.522634506225586e-05, 4.1365623474121094e-05, 4.750490188598633e-05, 5.364418029785156e-05, 5.97834587097168e-05, 6.592273712158203e-05, 7.206201553344727e-05, 7.82012939453125e-05, 8.434057235717773e-05, 9.047985076904297e-05, 9.66191291809082e-05, 0.00010275840759277344, 0.00010889768600463867, 0.0001150369644165039, 0.00012117624282836914, 0.00012731552124023438, 0.0001334547996520996, 0.00013959407806396484, 0.00014573335647583008, 0.0001518726348876953, 0.00015801191329956055, 0.00016415119171142578, 0.00017029047012329102, 0.00017642974853515625, 0.00018256902694702148, 0.00018870830535888672, 0.00019484758377075195, 0.0002009868621826172]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 9.0, 6.0, 6.0, 8.0, 14.0, 18.0, 28.0, 46.0, 68.0, 81.0, 118.0, 188.0, 285.0, 420.0, 790.0, 1478.0, 2961.0, 6461.0, 14092.0, 31717.0, 72266.0, 172485.0, 337242.0, 233506.0, 96352.0, 42113.0, 18887.0, 8610.0, 3974.0, 1835.0, 970.0, 549.0, 317.0, 197.0, 135.0, 107.0, 52.0, 48.0, 45.0, 26.0, 16.0, 11.0, 10.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.7939453125, -0.7696456909179688, -0.7453460693359375, -0.7210464477539062, -0.696746826171875, -0.6724472045898438, -0.6481475830078125, -0.6238479614257812, -0.59954833984375, -0.5752487182617188, -0.5509490966796875, -0.5266494750976562, -0.502349853515625, -0.47805023193359375, -0.4537506103515625, -0.42945098876953125, -0.4051513671875, -0.38085174560546875, -0.3565521240234375, -0.33225250244140625, -0.307952880859375, -0.28365325927734375, -0.2593536376953125, -0.23505401611328125, -0.21075439453125, -0.18645477294921875, -0.1621551513671875, -0.13785552978515625, -0.113555908203125, -0.08925628662109375, -0.0649566650390625, -0.04065704345703125, -0.016357421875, 0.00794219970703125, 0.0322418212890625, 0.05654144287109375, 0.080841064453125, 0.10514068603515625, 0.1294403076171875, 0.15373992919921875, 0.17803955078125, 0.20233917236328125, 0.2266387939453125, 0.25093841552734375, 0.275238037109375, 0.29953765869140625, 0.3238372802734375, 0.34813690185546875, 0.3724365234375, 0.39673614501953125, 0.4210357666015625, 0.44533538818359375, 0.469635009765625, 0.49393463134765625, 0.5182342529296875, 0.5425338745117188, 0.56683349609375, 0.5911331176757812, 0.6154327392578125, 0.6397323608398438, 0.664031982421875, 0.6883316040039062, 0.7126312255859375, 0.7369308471679688, 0.76123046875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 7.0, 3.0, 6.0, 13.0, 8.0, 11.0, 9.0, 12.0, 21.0, 19.0, 25.0, 22.0, 36.0, 39.0, 36.0, 41.0, 56.0, 44.0, 72.0, 67.0, 71.0, 51.0, 57.0, 47.0, 36.0, 32.0, 23.0, 27.0, 26.0, 14.0, 18.0, 16.0, 9.0, 6.0, 9.0, 1.0, 7.0, 2.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.7802734375, -0.7599029541015625, -0.739532470703125, -0.7191619873046875, -0.69879150390625, -0.6784210205078125, -0.658050537109375, -0.6376800537109375, -0.6173095703125, -0.5969390869140625, -0.576568603515625, -0.5561981201171875, -0.53582763671875, -0.5154571533203125, -0.495086669921875, -0.4747161865234375, -0.454345703125, -0.4339752197265625, -0.413604736328125, -0.3932342529296875, -0.37286376953125, -0.3524932861328125, -0.332122802734375, -0.3117523193359375, -0.2913818359375, -0.2710113525390625, -0.250640869140625, -0.2302703857421875, -0.20989990234375, -0.1895294189453125, -0.169158935546875, -0.1487884521484375, -0.12841796875, -0.1080474853515625, -0.087677001953125, -0.0673065185546875, -0.04693603515625, -0.0265655517578125, -0.006195068359375, 0.0141754150390625, 0.0345458984375, 0.0549163818359375, 0.075286865234375, 0.0956573486328125, 0.11602783203125, 0.1363983154296875, 0.156768798828125, 0.1771392822265625, 0.197509765625, 0.2178802490234375, 0.238250732421875, 0.2586212158203125, 0.27899169921875, 0.2993621826171875, 0.319732666015625, 0.3401031494140625, 0.3604736328125, 0.3808441162109375, 0.401214599609375, 0.4215850830078125, 0.44195556640625, 0.4623260498046875, 0.482696533203125, 0.5030670166015625, 0.5234375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 6.0, 6.0, 21.0, 29.0, 32.0, 46.0, 94.0, 79.0, 104.0, 124.0, 120.0, 85.0, 72.0, 57.0, 36.0, 36.0, 19.0, 16.0, 7.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.694219589233398, -11.348403930664062, -11.00258731842041, -10.656771659851074, -10.310956001281738, -9.965139389038086, -9.61932373046875, -9.273508071899414, -8.927691459655762, -8.581875801086426, -8.236059188842773, -7.8902435302734375, -7.544427394866943, -7.198611259460449, -6.852795600891113, -6.506979465484619, -6.161163806915283, -5.815347671508789, -5.469532012939453, -5.123715877532959, -4.777899742126465, -4.432084083557129, -4.086267948150635, -3.7404518127441406, -3.3946359157562256, -3.0488200187683105, -2.7030038833618164, -2.3571879863739014, -2.0113720893859863, -1.6655559539794922, -1.3197400569915771, -0.973923921585083, -0.628108024597168, -0.28229203820228577, 0.06352394819259644, 0.40933990478515625, 0.7551559209823608, 1.1009719371795654, 1.4467878341674805, 1.7926039695739746, 2.1384198665618896, 2.4842357635498047, 2.830051898956299, 3.175867795944214, 3.521683692932129, 3.867499828338623, 4.213315963745117, 4.559131622314453, 4.904947757720947, 5.250763893127441, 5.596579551696777, 5.9423956871032715, 6.288211822509766, 6.634027481079102, 6.979843616485596, 7.32565975189209, 7.671475410461426, 8.017291069030762, 8.363107681274414, 8.70892333984375, 9.054738998413086, 9.400555610656738, 9.746371269226074, 10.092187881469727, 10.438003540039062]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 5.0, 4.0, 8.0, 7.0, 7.0, 4.0, 11.0, 10.0, 17.0, 14.0, 20.0, 24.0, 25.0, 27.0, 19.0, 33.0, 40.0, 45.0, 23.0, 43.0, 44.0, 40.0, 51.0, 40.0, 39.0, 28.0, 31.0, 31.0, 38.0, 31.0, 26.0, 19.0, 29.0, 18.0, 26.0, 18.0, 16.0, 18.0, 4.0, 12.0, 10.0, 11.0, 11.0, 11.0, 3.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.756222724914551, -7.521072864532471, -7.285923004150391, -7.0507731437683105, -6.8156232833862305, -6.58047342300415, -6.34532356262207, -6.11017370223999, -5.87502384185791, -5.63987398147583, -5.40472412109375, -5.16957426071167, -4.93442440032959, -4.69927453994751, -4.46412467956543, -4.22897481918335, -3.9938247203826904, -3.7586748600006104, -3.5235249996185303, -3.28837513923645, -3.05322527885437, -2.818075180053711, -2.582925319671631, -2.347775459289551, -2.1126255989074707, -1.8774757385253906, -1.6423258781433105, -1.4071760177612305, -1.1720261573791504, -0.9368761777877808, -0.7017263174057007, -0.4665764570236206, -0.23142671585083008, 0.003723159432411194, 0.23887303471565247, 0.47402292490005493, 0.709172785282135, 0.9443227052688599, 1.17947256565094, 1.41462242603302, 1.6497722864151, 1.8849221467971802, 2.12007212638855, 2.35522198677063, 2.59037184715271, 2.82552170753479, 3.06067156791687, 3.29582142829895, 3.5309712886810303, 3.7661211490631104, 4.0012712478637695, 4.23642110824585, 4.47157096862793, 4.70672082901001, 4.94187068939209, 5.17702054977417, 5.41217041015625, 5.64732027053833, 5.88247013092041, 6.11761999130249, 6.35276985168457, 6.58791971206665, 6.8230695724487305, 7.0582194328308105, 7.293369293212891]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 6.0, 7.0, 9.0, 24.0, 28.0, 33.0, 58.0, 62.0, 104.0, 186.0, 339.0, 648.0, 1036.0, 2093.0, 4145.0, 8247.0, 17250.0, 37554.0, 85775.0, 214766.0, 692623.0, 2012857.0, 735779.0, 219563.0, 87331.0, 38400.0, 17883.0, 8411.0, 4181.0, 2133.0, 1157.0, 653.0, 334.0, 224.0, 141.0, 78.0, 50.0, 37.0, 28.0, 15.0, 10.0, 12.0, 8.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3359375, -1.289093017578125, -1.24224853515625, -1.195404052734375, -1.1485595703125, -1.101715087890625, -1.05487060546875, -1.008026123046875, -0.961181640625, -0.914337158203125, -0.86749267578125, -0.820648193359375, -0.7738037109375, -0.726959228515625, -0.68011474609375, -0.633270263671875, -0.58642578125, -0.539581298828125, -0.49273681640625, -0.445892333984375, -0.3990478515625, -0.352203369140625, -0.30535888671875, -0.258514404296875, -0.211669921875, -0.164825439453125, -0.11798095703125, -0.071136474609375, -0.0242919921875, 0.022552490234375, 0.06939697265625, 0.116241455078125, 0.1630859375, 0.209930419921875, 0.25677490234375, 0.303619384765625, 0.3504638671875, 0.397308349609375, 0.44415283203125, 0.490997314453125, 0.537841796875, 0.584686279296875, 0.63153076171875, 0.678375244140625, 0.7252197265625, 0.772064208984375, 0.81890869140625, 0.865753173828125, 0.91259765625, 0.959442138671875, 1.00628662109375, 1.053131103515625, 1.0999755859375, 1.146820068359375, 1.19366455078125, 1.240509033203125, 1.287353515625, 1.334197998046875, 1.38104248046875, 1.427886962890625, 1.4747314453125, 1.521575927734375, 1.56842041015625, 1.615264892578125, 1.662109375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 7.0, 7.0, 17.0, 7.0, 18.0, 8.0, 14.0, 26.0, 21.0, 27.0, 23.0, 28.0, 24.0, 30.0, 36.0, 37.0, 45.0, 37.0, 52.0, 48.0, 35.0, 37.0, 45.0, 36.0, 38.0, 40.0, 39.0, 23.0, 28.0, 23.0, 18.0, 9.0, 16.0, 17.0, 12.0, 12.0, 7.0, 8.0, 7.0, 13.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.8955078125, -0.8654022216796875, -0.835296630859375, -0.8051910400390625, -0.77508544921875, -0.7449798583984375, -0.714874267578125, -0.6847686767578125, -0.6546630859375, -0.6245574951171875, -0.594451904296875, -0.5643463134765625, -0.53424072265625, -0.5041351318359375, -0.474029541015625, -0.4439239501953125, -0.413818359375, -0.3837127685546875, -0.353607177734375, -0.3235015869140625, -0.29339599609375, -0.2632904052734375, -0.233184814453125, -0.2030792236328125, -0.1729736328125, -0.1428680419921875, -0.112762451171875, -0.0826568603515625, -0.05255126953125, -0.0224456787109375, 0.007659912109375, 0.0377655029296875, 0.06787109375, 0.0979766845703125, 0.128082275390625, 0.1581878662109375, 0.18829345703125, 0.2183990478515625, 0.248504638671875, 0.2786102294921875, 0.3087158203125, 0.3388214111328125, 0.368927001953125, 0.3990325927734375, 0.42913818359375, 0.4592437744140625, 0.489349365234375, 0.5194549560546875, 0.549560546875, 0.5796661376953125, 0.609771728515625, 0.6398773193359375, 0.66998291015625, 0.7000885009765625, 0.730194091796875, 0.7602996826171875, 0.7904052734375, 0.8205108642578125, 0.850616455078125, 0.8807220458984375, 0.91082763671875, 0.9409332275390625, 0.971038818359375, 1.0011444091796875, 1.03125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 11.0, 11.0, 12.0, 16.0, 33.0, 57.0, 73.0, 110.0, 168.0, 297.0, 413.0, 716.0, 1266.0, 1864.0, 3289.0, 5327.0, 8969.0, 15548.0, 26578.0, 47598.0, 85771.0, 164250.0, 348701.0, 899606.0, 1438591.0, 606553.0, 254802.0, 126348.0, 67008.0, 37959.0, 21555.0, 12470.0, 7200.0, 4374.0, 2574.0, 1585.0, 950.0, 590.0, 370.0, 237.0, 134.0, 100.0, 68.0, 46.0, 28.0, 16.0, 19.0, 7.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.2919921875, -1.2519989013671875, -1.212005615234375, -1.1720123291015625, -1.13201904296875, -1.0920257568359375, -1.052032470703125, -1.0120391845703125, -0.9720458984375, -0.9320526123046875, -0.892059326171875, -0.8520660400390625, -0.81207275390625, -0.7720794677734375, -0.732086181640625, -0.6920928955078125, -0.652099609375, -0.6121063232421875, -0.572113037109375, -0.5321197509765625, -0.49212646484375, -0.4521331787109375, -0.412139892578125, -0.3721466064453125, -0.3321533203125, -0.2921600341796875, -0.252166748046875, -0.2121734619140625, -0.17218017578125, -0.1321868896484375, -0.092193603515625, -0.0522003173828125, -0.01220703125, 0.0277862548828125, 0.067779541015625, 0.1077728271484375, 0.14776611328125, 0.1877593994140625, 0.227752685546875, 0.2677459716796875, 0.3077392578125, 0.3477325439453125, 0.387725830078125, 0.4277191162109375, 0.46771240234375, 0.5077056884765625, 0.547698974609375, 0.5876922607421875, 0.627685546875, 0.6676788330078125, 0.707672119140625, 0.7476654052734375, 0.78765869140625, 0.8276519775390625, 0.867645263671875, 0.9076385498046875, 0.9476318359375, 0.9876251220703125, 1.027618408203125, 1.0676116943359375, 1.10760498046875, 1.1475982666015625, 1.187591552734375, 1.2275848388671875, 1.267578125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 6.0, 7.0, 11.0, 14.0, 14.0, 21.0, 17.0, 29.0, 36.0, 54.0, 58.0, 69.0, 70.0, 140.0, 156.0, 208.0, 311.0, 380.0, 537.0, 505.0, 393.0, 268.0, 185.0, 118.0, 93.0, 80.0, 61.0, 47.0, 37.0, 32.0, 17.0, 18.0, 13.0, 14.0, 7.0, 8.0, 14.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-2.009765625, -1.952056884765625, -1.89434814453125, -1.836639404296875, -1.7789306640625, -1.721221923828125, -1.66351318359375, -1.605804443359375, -1.548095703125, -1.490386962890625, -1.43267822265625, -1.374969482421875, -1.3172607421875, -1.259552001953125, -1.20184326171875, -1.144134521484375, -1.08642578125, -1.028717041015625, -0.97100830078125, -0.913299560546875, -0.8555908203125, -0.797882080078125, -0.74017333984375, -0.682464599609375, -0.624755859375, -0.567047119140625, -0.50933837890625, -0.451629638671875, -0.3939208984375, -0.336212158203125, -0.27850341796875, -0.220794677734375, -0.1630859375, -0.105377197265625, -0.04766845703125, 0.010040283203125, 0.0677490234375, 0.125457763671875, 0.18316650390625, 0.240875244140625, 0.298583984375, 0.356292724609375, 0.41400146484375, 0.471710205078125, 0.5294189453125, 0.587127685546875, 0.64483642578125, 0.702545166015625, 0.76025390625, 0.817962646484375, 0.87567138671875, 0.933380126953125, 0.9910888671875, 1.048797607421875, 1.10650634765625, 1.164215087890625, 1.221923828125, 1.279632568359375, 1.33734130859375, 1.395050048828125, 1.4527587890625, 1.510467529296875, 1.56817626953125, 1.625885009765625, 1.68359375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 10.0, 3.0, 14.0, 18.0, 28.0, 32.0, 50.0, 47.0, 60.0, 82.0, 83.0, 106.0, 94.0, 81.0, 83.0, 51.0, 54.0, 27.0, 25.0, 17.0, 16.0, 9.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.151763916015625, -7.824233055114746, -7.496702671051025, -7.1691718101501465, -6.841640949249268, -6.514110565185547, -6.186579704284668, -5.859048843383789, -5.53151798248291, -5.203987121582031, -4.8764567375183105, -4.548925876617432, -4.221395015716553, -3.893864393234253, -3.566333770751953, -3.238802909851074, -2.9112725257873535, -2.5837419033050537, -2.256211042404175, -1.928680419921875, -1.6011496782302856, -1.2736189365386963, -0.9460883140563965, -0.6185574531555176, -0.2910268306732178, 0.036503881216049194, 0.36403459310531616, 0.6915652751922607, 1.01909601688385, 1.3466267585754395, 1.6741573810577393, 2.001688241958618, 2.329218864440918, 2.6567494869232178, 2.9842803478240967, 3.3118109703063965, 3.6393418312072754, 3.966872453689575, 4.294403076171875, 4.621933937072754, 4.949464797973633, 5.276995658874512, 5.604526042938232, 5.932056903839111, 6.25958776473999, 6.587118148803711, 6.91464900970459, 7.242179870605469, 7.5697102546691895, 7.897241115570068, 8.224771499633789, 8.552302360534668, 8.879833221435547, 9.207364082336426, 9.534894943237305, 9.862424850463867, 10.189955711364746, 10.517486572265625, 10.845017433166504, 11.172548294067383, 11.500078201293945, 11.827609062194824, 12.155139923095703, 12.482670783996582, 12.810201644897461]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 4.0, 4.0, 4.0, 7.0, 12.0, 10.0, 13.0, 13.0, 15.0, 25.0, 38.0, 31.0, 25.0, 33.0, 44.0, 43.0, 37.0, 55.0, 42.0, 47.0, 42.0, 45.0, 40.0, 45.0, 38.0, 32.0, 38.0, 35.0, 35.0, 30.0, 19.0, 24.0, 14.0, 16.0, 7.0, 10.0, 4.0, 5.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.754355430603027, -6.549143314361572, -6.343930721282959, -6.138718605041504, -5.933506011962891, -5.7282938957214355, -5.5230817794799805, -5.317869186401367, -5.112657070159912, -4.907444953918457, -4.702232360839844, -4.497020244598389, -4.291807651519775, -4.08659553527832, -3.881383180618286, -3.676170825958252, -3.4709584712982178, -3.2657461166381836, -3.0605337619781494, -2.8553214073181152, -2.65010929107666, -2.444896936416626, -2.239684581756592, -2.0344724655151367, -1.829259991645813, -1.6240476369857788, -1.4188354015350342, -1.213623046875, -1.0084106922149658, -0.8031984567642212, -0.597986102104187, -0.3927738666534424, -0.1875615119934082, 0.017650797963142395, 0.222863107919693, 0.4280754327774048, 0.6332877278327942, 0.8385000228881836, 1.0437123775482178, 1.2489246129989624, 1.4541369676589966, 1.6593493223190308, 1.8645615577697754, 2.0697739124298096, 2.2749862670898438, 2.480198383331299, 2.685410976409912, 2.890623092651367, 3.0958354473114014, 3.3010478019714355, 3.5062601566314697, 3.711472511291504, 3.916684627532959, 4.121896743774414, 4.327109336853027, 4.532321453094482, 4.737534046173096, 4.942746162414551, 5.147958755493164, 5.353170871734619, 5.558383464813232, 5.7635955810546875, 5.968808174133301, 6.174020290374756, 6.379232406616211]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 9.0, 12.0, 11.0, 35.0, 33.0, 65.0, 98.0, 132.0, 188.0, 260.0, 398.0, 608.0, 857.0, 1260.0, 1636.0, 2498.0, 3549.0, 5067.0, 7872.0, 12158.0, 19490.0, 32902.0, 59491.0, 109475.0, 191343.0, 228953.0, 160671.0, 87399.0, 47278.0, 26658.0, 16017.0, 10477.0, 6920.0, 4527.0, 3153.0, 2183.0, 1510.0, 1068.0, 681.0, 511.0, 332.0, 243.0, 152.0, 104.0, 94.0, 34.0, 35.0, 38.0, 29.0, 11.0, 13.0, 3.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.03125, -0.998321533203125, -0.96539306640625, -0.932464599609375, -0.8995361328125, -0.866607666015625, -0.83367919921875, -0.800750732421875, -0.767822265625, -0.734893798828125, -0.70196533203125, -0.669036865234375, -0.6361083984375, -0.603179931640625, -0.57025146484375, -0.537322998046875, -0.50439453125, -0.471466064453125, -0.43853759765625, -0.405609130859375, -0.3726806640625, -0.339752197265625, -0.30682373046875, -0.273895263671875, -0.240966796875, -0.208038330078125, -0.17510986328125, -0.142181396484375, -0.1092529296875, -0.076324462890625, -0.04339599609375, -0.010467529296875, 0.0224609375, 0.055389404296875, 0.08831787109375, 0.121246337890625, 0.1541748046875, 0.187103271484375, 0.22003173828125, 0.252960205078125, 0.285888671875, 0.318817138671875, 0.35174560546875, 0.384674072265625, 0.4176025390625, 0.450531005859375, 0.48345947265625, 0.516387939453125, 0.54931640625, 0.582244873046875, 0.61517333984375, 0.648101806640625, 0.6810302734375, 0.713958740234375, 0.74688720703125, 0.779815673828125, 0.812744140625, 0.845672607421875, 0.87860107421875, 0.911529541015625, 0.9444580078125, 0.977386474609375, 1.01031494140625, 1.043243408203125, 1.076171875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 8.0, 7.0, 9.0, 9.0, 21.0, 18.0, 19.0, 25.0, 19.0, 20.0, 30.0, 39.0, 45.0, 44.0, 38.0, 50.0, 47.0, 38.0, 36.0, 46.0, 35.0, 30.0, 40.0, 32.0, 38.0, 29.0, 27.0, 23.0, 34.0, 26.0, 16.0, 16.0, 20.0, 13.0, 8.0, 11.0, 5.0, 4.0, 5.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.94580078125, -0.9147109985351562, -0.8836212158203125, -0.8525314331054688, -0.821441650390625, -0.7903518676757812, -0.7592620849609375, -0.7281723022460938, -0.69708251953125, -0.6659927368164062, -0.6349029541015625, -0.6038131713867188, -0.572723388671875, -0.5416336059570312, -0.5105438232421875, -0.47945404052734375, -0.4483642578125, -0.41727447509765625, -0.3861846923828125, -0.35509490966796875, -0.324005126953125, -0.29291534423828125, -0.2618255615234375, -0.23073577880859375, -0.19964599609375, -0.16855621337890625, -0.1374664306640625, -0.10637664794921875, -0.075286865234375, -0.04419708251953125, -0.0131072998046875, 0.01798248291015625, 0.049072265625, 0.08016204833984375, 0.1112518310546875, 0.14234161376953125, 0.173431396484375, 0.20452117919921875, 0.2356109619140625, 0.26670074462890625, 0.29779052734375, 0.32888031005859375, 0.3599700927734375, 0.39105987548828125, 0.422149658203125, 0.45323944091796875, 0.4843292236328125, 0.5154190063476562, 0.5465087890625, 0.5775985717773438, 0.6086883544921875, 0.6397781372070312, 0.670867919921875, 0.7019577026367188, 0.7330474853515625, 0.7641372680664062, 0.79522705078125, 0.8263168334960938, 0.8574066162109375, 0.8884963989257812, 0.919586181640625, 0.9506759643554688, 0.9817657470703125, 1.0128555297851562, 1.0439453125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 8.0, 8.0, 24.0, 25.0, 44.0, 59.0, 111.0, 225.0, 511.0, 1465.0, 4475.0, 15503.0, 61289.0, 318991.0, 498711.0, 111364.0, 24927.0, 7143.0, 2245.0, 790.0, 293.0, 143.0, 79.0, 44.0, 25.0, 22.0, 7.0, 8.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.406158447265625, -2.31427001953125, -2.222381591796875, -2.1304931640625, -2.038604736328125, -1.94671630859375, -1.854827880859375, -1.762939453125, -1.671051025390625, -1.57916259765625, -1.487274169921875, -1.3953857421875, -1.303497314453125, -1.21160888671875, -1.119720458984375, -1.02783203125, -0.935943603515625, -0.84405517578125, -0.752166748046875, -0.6602783203125, -0.568389892578125, -0.47650146484375, -0.384613037109375, -0.292724609375, -0.200836181640625, -0.10894775390625, -0.017059326171875, 0.0748291015625, 0.166717529296875, 0.25860595703125, 0.350494384765625, 0.4423828125, 0.534271240234375, 0.62615966796875, 0.718048095703125, 0.8099365234375, 0.901824951171875, 0.99371337890625, 1.085601806640625, 1.177490234375, 1.269378662109375, 1.36126708984375, 1.453155517578125, 1.5450439453125, 1.636932373046875, 1.72882080078125, 1.820709228515625, 1.91259765625, 2.004486083984375, 2.09637451171875, 2.188262939453125, 2.2801513671875, 2.372039794921875, 2.46392822265625, 2.555816650390625, 2.647705078125, 2.739593505859375, 2.83148193359375, 2.923370361328125, 3.0152587890625, 3.107147216796875, 3.19903564453125, 3.290924072265625, 3.3828125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 2.0, 9.0, 5.0, 4.0, 5.0, 11.0, 12.0, 14.0, 12.0, 10.0, 14.0, 26.0, 28.0, 20.0, 25.0, 33.0, 23.0, 23.0, 31.0, 35.0, 46.0, 37.0, 41.0, 38.0, 26.0, 48.0, 47.0, 40.0, 32.0, 33.0, 32.0, 23.0, 23.0, 28.0, 18.0, 20.0, 22.0, 14.0, 13.0, 15.0, 6.0, 8.0, 9.0, 8.0, 9.0, 7.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.234375, -2.16046142578125, -2.0865478515625, -2.01263427734375, -1.938720703125, -1.86480712890625, -1.7908935546875, -1.71697998046875, -1.64306640625, -1.56915283203125, -1.4952392578125, -1.42132568359375, -1.347412109375, -1.27349853515625, -1.1995849609375, -1.12567138671875, -1.0517578125, -0.97784423828125, -0.9039306640625, -0.83001708984375, -0.756103515625, -0.68218994140625, -0.6082763671875, -0.53436279296875, -0.46044921875, -0.38653564453125, -0.3126220703125, -0.23870849609375, -0.164794921875, -0.09088134765625, -0.0169677734375, 0.05694580078125, 0.130859375, 0.20477294921875, 0.2786865234375, 0.35260009765625, 0.426513671875, 0.50042724609375, 0.5743408203125, 0.64825439453125, 0.72216796875, 0.79608154296875, 0.8699951171875, 0.94390869140625, 1.017822265625, 1.09173583984375, 1.1656494140625, 1.23956298828125, 1.3134765625, 1.38739013671875, 1.4613037109375, 1.53521728515625, 1.609130859375, 1.68304443359375, 1.7569580078125, 1.83087158203125, 1.90478515625, 1.97869873046875, 2.0526123046875, 2.12652587890625, 2.200439453125, 2.27435302734375, 2.3482666015625, 2.42218017578125, 2.49609375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 12.0, 14.0, 31.0, 63.0, 113.0, 225.0, 419.0, 770.0, 1547.0, 3053.0, 5793.0, 11366.0, 22702.0, 48369.0, 121523.0, 299560.0, 307634.0, 127334.0, 50064.0, 23461.0, 11953.0, 6138.0, 3120.0, 1586.0, 794.0, 418.0, 203.0, 111.0, 68.0, 30.0, 25.0, 15.0, 16.0, 5.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62109375, -0.5989303588867188, -0.5767669677734375, -0.5546035766601562, -0.532440185546875, -0.5102767944335938, -0.4881134033203125, -0.46595001220703125, -0.44378662109375, -0.42162322998046875, -0.3994598388671875, -0.37729644775390625, -0.355133056640625, -0.33296966552734375, -0.3108062744140625, -0.28864288330078125, -0.2664794921875, -0.24431610107421875, -0.2221527099609375, -0.19998931884765625, -0.177825927734375, -0.15566253662109375, -0.1334991455078125, -0.11133575439453125, -0.08917236328125, -0.06700897216796875, -0.0448455810546875, -0.02268218994140625, -0.000518798828125, 0.02164459228515625, 0.0438079833984375, 0.06597137451171875, 0.088134765625, 0.11029815673828125, 0.1324615478515625, 0.15462493896484375, 0.176788330078125, 0.19895172119140625, 0.2211151123046875, 0.24327850341796875, 0.26544189453125, 0.28760528564453125, 0.3097686767578125, 0.33193206787109375, 0.354095458984375, 0.37625885009765625, 0.3984222412109375, 0.42058563232421875, 0.4427490234375, 0.46491241455078125, 0.4870758056640625, 0.5092391967773438, 0.531402587890625, 0.5535659790039062, 0.5757293701171875, 0.5978927612304688, 0.62005615234375, 0.6422195434570312, 0.6643829345703125, 0.6865463256835938, 0.708709716796875, 0.7308731079101562, 0.7530364990234375, 0.7751998901367188, 0.79736328125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 7.0, 4.0, 4.0, 6.0, 9.0, 7.0, 14.0, 23.0, 10.0, 22.0, 20.0, 33.0, 55.0, 87.0, 102.0, 115.0, 111.0, 96.0, 65.0, 42.0, 37.0, 22.0, 12.0, 14.0, 14.0, 10.0, 8.0, 5.0, 3.0, 2.0, 2.0, 9.0, 7.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00015020370483398438, -0.0001445971429347992, -0.00013899058103561401, -0.00013338401913642883, -0.00012777745723724365, -0.00012217089533805847, -0.00011656433343887329, -0.00011095777153968811, -0.00010535120964050293, -9.974464774131775e-05, -9.413808584213257e-05, -8.853152394294739e-05, -8.292496204376221e-05, -7.731840014457703e-05, -7.171183824539185e-05, -6.610527634620667e-05, -6.0498714447021484e-05, -5.4892152547836304e-05, -4.928559064865112e-05, -4.367902874946594e-05, -3.807246685028076e-05, -3.246590495109558e-05, -2.68593430519104e-05, -2.125278115272522e-05, -1.564621925354004e-05, -1.0039657354354858e-05, -4.433095455169678e-06, 1.173466444015503e-06, 6.780028343200684e-06, 1.2386590242385864e-05, 1.7993152141571045e-05, 2.3599714040756226e-05, 2.9206275939941406e-05, 3.481283783912659e-05, 4.041939973831177e-05, 4.602596163749695e-05, 5.163252353668213e-05, 5.723908543586731e-05, 6.284564733505249e-05, 6.845220923423767e-05, 7.405877113342285e-05, 7.966533303260803e-05, 8.527189493179321e-05, 9.08784568309784e-05, 9.648501873016357e-05, 0.00010209158062934875, 0.00010769814252853394, 0.00011330470442771912, 0.0001189112663269043, 0.00012451782822608948, 0.00013012439012527466, 0.00013573095202445984, 0.00014133751392364502, 0.0001469440758228302, 0.00015255063772201538, 0.00015815719962120056, 0.00016376376152038574, 0.00016937032341957092, 0.0001749768853187561, 0.00018058344721794128, 0.00018619000911712646, 0.00019179657101631165, 0.00019740313291549683, 0.000203009694814682, 0.0002086162567138672]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 6.0, 4.0, 5.0, 17.0, 12.0, 14.0, 25.0, 55.0, 98.0, 138.0, 309.0, 486.0, 931.0, 1998.0, 4004.0, 8754.0, 18865.0, 43250.0, 107832.0, 261976.0, 325439.0, 161609.0, 63293.0, 26394.0, 11980.0, 5629.0, 2642.0, 1299.0, 621.0, 355.0, 199.0, 122.0, 69.0, 44.0, 25.0, 26.0, 12.0, 10.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.77880859375, -0.7546310424804688, -0.7304534912109375, -0.7062759399414062, -0.682098388671875, -0.6579208374023438, -0.6337432861328125, -0.6095657348632812, -0.58538818359375, -0.5612106323242188, -0.5370330810546875, -0.5128555297851562, -0.488677978515625, -0.46450042724609375, -0.4403228759765625, -0.41614532470703125, -0.3919677734375, -0.36779022216796875, -0.3436126708984375, -0.31943511962890625, -0.295257568359375, -0.27108001708984375, -0.2469024658203125, -0.22272491455078125, -0.19854736328125, -0.17436981201171875, -0.1501922607421875, -0.12601470947265625, -0.101837158203125, -0.07765960693359375, -0.0534820556640625, -0.02930450439453125, -0.005126953125, 0.01905059814453125, 0.0432281494140625, 0.06740570068359375, 0.091583251953125, 0.11576080322265625, 0.1399383544921875, 0.16411590576171875, 0.18829345703125, 0.21247100830078125, 0.2366485595703125, 0.26082611083984375, 0.285003662109375, 0.30918121337890625, 0.3333587646484375, 0.35753631591796875, 0.3817138671875, 0.40589141845703125, 0.4300689697265625, 0.45424652099609375, 0.478424072265625, 0.5026016235351562, 0.5267791748046875, 0.5509567260742188, 0.57513427734375, 0.5993118286132812, 0.6234893798828125, 0.6476669311523438, 0.671844482421875, 0.6960220336914062, 0.7201995849609375, 0.7443771362304688, 0.7685546875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 10.0, 9.0, 10.0, 14.0, 15.0, 19.0, 15.0, 25.0, 32.0, 31.0, 55.0, 55.0, 73.0, 84.0, 75.0, 67.0, 67.0, 47.0, 63.0, 33.0, 29.0, 30.0, 21.0, 18.0, 11.0, 16.0, 9.0, 9.0, 6.0, 7.0, 5.0, 9.0, 2.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.611328125, -0.5888519287109375, -0.566375732421875, -0.5438995361328125, -0.52142333984375, -0.4989471435546875, -0.476470947265625, -0.4539947509765625, -0.4315185546875, -0.4090423583984375, -0.386566162109375, -0.3640899658203125, -0.34161376953125, -0.3191375732421875, -0.296661376953125, -0.2741851806640625, -0.251708984375, -0.2292327880859375, -0.206756591796875, -0.1842803955078125, -0.16180419921875, -0.1393280029296875, -0.116851806640625, -0.0943756103515625, -0.0718994140625, -0.0494232177734375, -0.026947021484375, -0.0044708251953125, 0.01800537109375, 0.0404815673828125, 0.062957763671875, 0.0854339599609375, 0.10791015625, 0.1303863525390625, 0.152862548828125, 0.1753387451171875, 0.19781494140625, 0.2202911376953125, 0.242767333984375, 0.2652435302734375, 0.2877197265625, 0.3101959228515625, 0.332672119140625, 0.3551483154296875, 0.37762451171875, 0.4001007080078125, 0.422576904296875, 0.4450531005859375, 0.467529296875, 0.4900054931640625, 0.512481689453125, 0.5349578857421875, 0.55743408203125, 0.5799102783203125, 0.602386474609375, 0.6248626708984375, 0.6473388671875, 0.6698150634765625, 0.692291259765625, 0.7147674560546875, 0.73724365234375, 0.7597198486328125, 0.782196044921875, 0.8046722412109375, 0.8271484375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 9.0, 10.0, 23.0, 65.0, 103.0, 149.0, 180.0, 187.0, 132.0, 79.0, 32.0, 17.0, 9.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.308792114257812, -13.811792373657227, -13.31479263305664, -12.817791938781738, -12.320792198181152, -11.823792457580566, -11.326791763305664, -10.829792022705078, -10.332792282104492, -9.835792541503906, -9.33879280090332, -8.841792106628418, -8.344792366027832, -7.847792625427246, -7.350792407989502, -6.853792190551758, -6.356792449951172, -5.859792709350586, -5.362792491912842, -4.865792274475098, -4.368792533874512, -3.8717925548553467, -3.3747925758361816, -2.8777925968170166, -2.3807926177978516, -1.8837926387786865, -1.3867926597595215, -0.8897926807403564, -0.3927927017211914, 0.10420727729797363, 0.6012072563171387, 1.0982072353363037, 1.5952072143554688, 2.092207193374634, 2.589207172393799, 3.086207151412964, 3.583207130432129, 4.080206871032715, 4.577207088470459, 5.074207305908203, 5.571207046508789, 6.068206787109375, 6.565207004547119, 7.062207221984863, 7.559206962585449, 8.056206703186035, 8.553207397460938, 9.050207138061523, 9.54720687866211, 10.044206619262695, 10.541206359863281, 11.038207054138184, 11.53520679473877, 12.032206535339355, 12.529207229614258, 13.026206970214844, 13.52320671081543, 14.020206451416016, 14.517206192016602, 15.014206886291504, 15.51120662689209, 16.008207321166992, 16.505207061767578, 17.002206802368164, 17.49920654296875]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 2.0, 2.0, 6.0, 12.0, 6.0, 8.0, 12.0, 7.0, 12.0, 10.0, 19.0, 22.0, 13.0, 31.0, 27.0, 42.0, 31.0, 38.0, 42.0, 43.0, 38.0, 36.0, 36.0, 36.0, 40.0, 49.0, 29.0, 25.0, 34.0, 37.0, 23.0, 35.0, 31.0, 24.0, 21.0, 23.0, 17.0, 16.0, 9.0, 13.0, 10.0, 5.0, 9.0, 5.0, 7.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.051413536071777, -5.8567118644714355, -5.6620097160339355, -5.467308044433594, -5.272605895996094, -5.077904224395752, -4.88320255279541, -4.68850040435791, -4.493798732757568, -4.299097061157227, -4.104394912719727, -3.9096932411193848, -3.714991331100464, -3.520289421081543, -3.325587749481201, -3.1308858394622803, -2.9361839294433594, -2.7414820194244385, -2.5467801094055176, -2.352078437805176, -2.157376527786255, -1.962674617767334, -1.7679728269577026, -1.5732710361480713, -1.3785691261291504, -1.1838672161102295, -0.9891654253005981, -0.794463574886322, -0.5997617244720459, -0.4050598740577698, -0.21035802364349365, -0.015656232833862305, 0.1790456771850586, 0.3737475275993347, 0.5684493780136108, 0.763151228427887, 0.9578530788421631, 1.152554988861084, 1.3472567796707153, 1.5419585704803467, 1.7366604804992676, 1.9313623905181885, 2.1260643005371094, 2.320765972137451, 2.515467882156372, 2.710169792175293, 2.9048714637756348, 3.0995733737945557, 3.2942752838134766, 3.4889771938323975, 3.6836791038513184, 3.87838077545166, 4.07308292388916, 4.267784595489502, 4.462486267089844, 4.657188415527344, 4.8518900871276855, 5.046591758728027, 5.241293907165527, 5.435995578765869, 5.630697250366211, 5.825399398803711, 6.020101070404053, 6.2148027420043945, 6.4095048904418945]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 1.0, 6.0, 5.0, 13.0, 19.0, 30.0, 33.0, 60.0, 106.0, 135.0, 206.0, 362.0, 556.0, 1023.0, 1945.0, 3831.0, 8228.0, 18230.0, 41868.0, 99840.0, 259328.0, 820482.0, 1805784.0, 730682.0, 236225.0, 92466.0, 38994.0, 17351.0, 8045.0, 3804.0, 1928.0, 1109.0, 594.0, 351.0, 234.0, 137.0, 83.0, 53.0, 38.0, 32.0, 22.0, 14.0, 9.0, 8.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.515625, -1.46893310546875, -1.4222412109375, -1.37554931640625, -1.328857421875, -1.28216552734375, -1.2354736328125, -1.18878173828125, -1.14208984375, -1.09539794921875, -1.0487060546875, -1.00201416015625, -0.955322265625, -0.90863037109375, -0.8619384765625, -0.81524658203125, -0.7685546875, -0.72186279296875, -0.6751708984375, -0.62847900390625, -0.581787109375, -0.53509521484375, -0.4884033203125, -0.44171142578125, -0.39501953125, -0.34832763671875, -0.3016357421875, -0.25494384765625, -0.208251953125, -0.16156005859375, -0.1148681640625, -0.06817626953125, -0.021484375, 0.02520751953125, 0.0718994140625, 0.11859130859375, 0.165283203125, 0.21197509765625, 0.2586669921875, 0.30535888671875, 0.35205078125, 0.39874267578125, 0.4454345703125, 0.49212646484375, 0.538818359375, 0.58551025390625, 0.6322021484375, 0.67889404296875, 0.7255859375, 0.77227783203125, 0.8189697265625, 0.86566162109375, 0.912353515625, 0.95904541015625, 1.0057373046875, 1.05242919921875, 1.09912109375, 1.14581298828125, 1.1925048828125, 1.23919677734375, 1.285888671875, 1.33258056640625, 1.3792724609375, 1.42596435546875, 1.47265625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 9.0, 13.0, 7.0, 15.0, 11.0, 25.0, 24.0, 24.0, 21.0, 27.0, 31.0, 31.0, 41.0, 35.0, 32.0, 52.0, 40.0, 51.0, 47.0, 38.0, 41.0, 38.0, 36.0, 38.0, 35.0, 29.0, 34.0, 22.0, 21.0, 21.0, 12.0, 21.0, 16.0, 12.0, 3.0, 11.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.82275390625, -0.7930679321289062, -0.7633819580078125, -0.7336959838867188, -0.704010009765625, -0.6743240356445312, -0.6446380615234375, -0.6149520874023438, -0.58526611328125, -0.5555801391601562, -0.5258941650390625, -0.49620819091796875, -0.466522216796875, -0.43683624267578125, -0.4071502685546875, -0.37746429443359375, -0.3477783203125, -0.31809234619140625, -0.2884063720703125, -0.25872039794921875, -0.229034423828125, -0.19934844970703125, -0.1696624755859375, -0.13997650146484375, -0.11029052734375, -0.08060455322265625, -0.0509185791015625, -0.02123260498046875, 0.008453369140625, 0.03813934326171875, 0.0678253173828125, 0.09751129150390625, 0.127197265625, 0.15688323974609375, 0.1865692138671875, 0.21625518798828125, 0.245941162109375, 0.27562713623046875, 0.3053131103515625, 0.33499908447265625, 0.36468505859375, 0.39437103271484375, 0.4240570068359375, 0.45374298095703125, 0.483428955078125, 0.5131149291992188, 0.5428009033203125, 0.5724868774414062, 0.6021728515625, 0.6318588256835938, 0.6615447998046875, 0.6912307739257812, 0.720916748046875, 0.7506027221679688, 0.7802886962890625, 0.8099746704101562, 0.83966064453125, 0.8693466186523438, 0.8990325927734375, 0.9287185668945312, 0.958404541015625, 0.9880905151367188, 1.0177764892578125, 1.0474624633789062, 1.0771484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 11.0, 16.0, 37.0, 31.0, 50.0, 75.0, 137.0, 202.0, 323.0, 577.0, 971.0, 1747.0, 3341.0, 6418.0, 12427.0, 25023.0, 51779.0, 112425.0, 261391.0, 720789.0, 1698726.0, 787760.0, 280606.0, 119965.0, 54759.0, 26334.0, 13261.0, 6869.0, 3760.0, 1951.0, 1043.0, 591.0, 320.0, 210.0, 110.0, 82.0, 63.0, 32.0, 21.0, 12.0, 13.0, 7.0, 7.0, 1.0, 2.0, 3.0, 2.0], "bins": [-1.66796875, -1.62353515625, -1.5791015625, -1.53466796875, -1.490234375, -1.44580078125, -1.4013671875, -1.35693359375, -1.3125, -1.26806640625, -1.2236328125, -1.17919921875, -1.134765625, -1.09033203125, -1.0458984375, -1.00146484375, -0.95703125, -0.91259765625, -0.8681640625, -0.82373046875, -0.779296875, -0.73486328125, -0.6904296875, -0.64599609375, -0.6015625, -0.55712890625, -0.5126953125, -0.46826171875, -0.423828125, -0.37939453125, -0.3349609375, -0.29052734375, -0.24609375, -0.20166015625, -0.1572265625, -0.11279296875, -0.068359375, -0.02392578125, 0.0205078125, 0.06494140625, 0.109375, 0.15380859375, 0.1982421875, 0.24267578125, 0.287109375, 0.33154296875, 0.3759765625, 0.42041015625, 0.46484375, 0.50927734375, 0.5537109375, 0.59814453125, 0.642578125, 0.68701171875, 0.7314453125, 0.77587890625, 0.8203125, 0.86474609375, 0.9091796875, 0.95361328125, 0.998046875, 1.04248046875, 1.0869140625, 1.13134765625, 1.17578125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 6.0, 12.0, 11.0, 23.0, 21.0, 26.0, 39.0, 40.0, 68.0, 87.0, 143.0, 165.0, 246.0, 335.0, 495.0, 547.0, 523.0, 336.0, 262.0, 173.0, 123.0, 98.0, 70.0, 47.0, 34.0, 27.0, 29.0, 20.0, 13.0, 19.0, 7.0, 5.0, 8.0, 7.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.4140625, -2.348114013671875, -2.28216552734375, -2.216217041015625, -2.1502685546875, -2.084320068359375, -2.01837158203125, -1.952423095703125, -1.886474609375, -1.820526123046875, -1.75457763671875, -1.688629150390625, -1.6226806640625, -1.556732177734375, -1.49078369140625, -1.424835205078125, -1.35888671875, -1.292938232421875, -1.22698974609375, -1.161041259765625, -1.0950927734375, -1.029144287109375, -0.96319580078125, -0.897247314453125, -0.831298828125, -0.765350341796875, -0.69940185546875, -0.633453369140625, -0.5675048828125, -0.501556396484375, -0.43560791015625, -0.369659423828125, -0.3037109375, -0.237762451171875, -0.17181396484375, -0.105865478515625, -0.0399169921875, 0.026031494140625, 0.09197998046875, 0.157928466796875, 0.223876953125, 0.289825439453125, 0.35577392578125, 0.421722412109375, 0.4876708984375, 0.553619384765625, 0.61956787109375, 0.685516357421875, 0.75146484375, 0.817413330078125, 0.88336181640625, 0.949310302734375, 1.0152587890625, 1.081207275390625, 1.14715576171875, 1.213104248046875, 1.279052734375, 1.345001220703125, 1.41094970703125, 1.476898193359375, 1.5428466796875, 1.608795166015625, 1.67474365234375, 1.740692138671875, 1.806640625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 12.0, 15.0, 19.0, 25.0, 34.0, 57.0, 56.0, 66.0, 99.0, 97.0, 103.0, 101.0, 77.0, 62.0, 48.0, 42.0, 24.0, 22.0, 10.0, 6.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.232515335083008, -10.881206512451172, -10.529897689819336, -10.1785888671875, -9.827279090881348, -9.475970268249512, -9.124661445617676, -8.77335262298584, -8.422042846679688, -8.070734024047852, -7.719424724578857, -7.3681159019470215, -7.016806602478027, -6.665497779846191, -6.3141889572143555, -5.9628801345825195, -5.611571311950684, -5.260262489318848, -4.9089531898498535, -4.557644367218018, -4.206335067749023, -3.8550262451171875, -3.5037174224853516, -3.1524083614349365, -2.8010993003845215, -2.4497902393341064, -2.0984811782836914, -1.7471723556518555, -1.3958632946014404, -1.0445542335510254, -0.6932454109191895, -0.3419363498687744, 0.009372711181640625, 0.3606817126274109, 0.7119907140731812, 1.0632996559143066, 1.4146087169647217, 1.7659177780151367, 2.1172266006469727, 2.4685356616973877, 2.8198447227478027, 3.1711537837982178, 3.522462844848633, 3.8737716674804688, 4.225080490112305, 4.576389789581299, 4.927698612213135, 5.279007911682129, 5.630316734313965, 5.981625556945801, 6.332934856414795, 6.684243679046631, 7.035552978515625, 7.386861801147461, 7.738170623779297, 8.089479446411133, 8.440788269042969, 8.792097091674805, 9.14340591430664, 9.494714736938477, 9.846024513244629, 10.197333335876465, 10.5486421585083, 10.899950981140137, 11.251260757446289]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 5.0, 2.0, 6.0, 10.0, 8.0, 13.0, 10.0, 12.0, 21.0, 19.0, 23.0, 24.0, 30.0, 37.0, 36.0, 36.0, 49.0, 48.0, 32.0, 43.0, 46.0, 35.0, 35.0, 51.0, 43.0, 36.0, 31.0, 34.0, 30.0, 23.0, 26.0, 30.0, 22.0, 22.0, 10.0, 13.0, 12.0, 8.0, 7.0, 2.0, 3.0, 5.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9807820320129395, -5.779944896697998, -5.579108238220215, -5.378271102905273, -5.177433967590332, -4.976596832275391, -4.775760173797607, -4.574923038482666, -4.374086380004883, -4.173249244689941, -3.972412347793579, -3.771575450897217, -3.5707383155822754, -3.369901418685913, -3.169064521789551, -2.9682273864746094, -2.767390251159668, -2.5665533542633057, -2.3657162189483643, -2.164879322052002, -1.96404230594635, -1.7632052898406982, -1.562368392944336, -1.361531376838684, -1.1606943607330322, -0.9598573446273804, -0.7590203881263733, -0.5581834316253662, -0.35734641551971436, -0.1565093994140625, 0.044327497482299805, 0.24516451358795166, 0.4460010528564453, 0.6468380689620972, 0.8476750254631042, 1.0485119819641113, 1.2493489980697632, 1.450186014175415, 1.6510229110717773, 1.8518599271774292, 2.052696943283081, 2.2535338401794434, 2.4543709754943848, 2.655207872390747, 2.8560447692871094, 3.056881904602051, 3.257718801498413, 3.4585556983947754, 3.659392833709717, 3.860229730606079, 4.061066627502441, 4.261903762817383, 4.462740898132324, 4.663578033447266, 4.864414691925049, 5.06525182723999, 5.266088485717773, 5.466925621032715, 5.667762279510498, 5.8685994148254395, 6.069436550140381, 6.270273208618164, 6.4711103439331055, 6.671947479248047, 6.872784614562988]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 4.0, 12.0, 16.0, 33.0, 58.0, 77.0, 121.0, 152.0, 243.0, 358.0, 546.0, 763.0, 1125.0, 1564.0, 2142.0, 3157.0, 4452.0, 6301.0, 9007.0, 14322.0, 24028.0, 48862.0, 121135.0, 282289.0, 285176.0, 124068.0, 49718.0, 24274.0, 14148.0, 9186.0, 6128.0, 4481.0, 3123.0, 2280.0, 1634.0, 1141.0, 795.0, 520.0, 374.0, 240.0, 151.0, 100.0, 77.0, 49.0, 37.0, 33.0, 19.0, 9.0, 9.0, 8.0, 5.0, 1.0, 2.0, 3.0], "bins": [-1.6689453125, -1.619873046875, -1.57080078125, -1.521728515625, -1.47265625, -1.423583984375, -1.37451171875, -1.325439453125, -1.2763671875, -1.227294921875, -1.17822265625, -1.129150390625, -1.080078125, -1.031005859375, -0.98193359375, -0.932861328125, -0.8837890625, -0.834716796875, -0.78564453125, -0.736572265625, -0.6875, -0.638427734375, -0.58935546875, -0.540283203125, -0.4912109375, -0.442138671875, -0.39306640625, -0.343994140625, -0.294921875, -0.245849609375, -0.19677734375, -0.147705078125, -0.0986328125, -0.049560546875, -0.00048828125, 0.048583984375, 0.09765625, 0.146728515625, 0.19580078125, 0.244873046875, 0.2939453125, 0.343017578125, 0.39208984375, 0.441162109375, 0.490234375, 0.539306640625, 0.58837890625, 0.637451171875, 0.6865234375, 0.735595703125, 0.78466796875, 0.833740234375, 0.8828125, 0.931884765625, 0.98095703125, 1.030029296875, 1.0791015625, 1.128173828125, 1.17724609375, 1.226318359375, 1.275390625, 1.324462890625, 1.37353515625, 1.422607421875, 1.4716796875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 6.0, 7.0, 10.0, 8.0, 9.0, 10.0, 16.0, 26.0, 14.0, 20.0, 19.0, 26.0, 18.0, 42.0, 35.0, 25.0, 35.0, 42.0, 40.0, 34.0, 45.0, 35.0, 41.0, 46.0, 33.0, 44.0, 40.0, 32.0, 24.0, 27.0, 17.0, 18.0, 16.0, 13.0, 19.0, 23.0, 10.0, 14.0, 12.0, 9.0, 12.0, 4.0, 6.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.892578125, -0.8657302856445312, -0.8388824462890625, -0.8120346069335938, -0.785186767578125, -0.7583389282226562, -0.7314910888671875, -0.7046432495117188, -0.67779541015625, -0.6509475708007812, -0.6240997314453125, -0.5972518920898438, -0.570404052734375, -0.5435562133789062, -0.5167083740234375, -0.48986053466796875, -0.4630126953125, -0.43616485595703125, -0.4093170166015625, -0.38246917724609375, -0.355621337890625, -0.32877349853515625, -0.3019256591796875, -0.27507781982421875, -0.24822998046875, -0.22138214111328125, -0.1945343017578125, -0.16768646240234375, -0.140838623046875, -0.11399078369140625, -0.0871429443359375, -0.06029510498046875, -0.033447265625, -0.00659942626953125, 0.0202484130859375, 0.04709625244140625, 0.073944091796875, 0.10079193115234375, 0.1276397705078125, 0.15448760986328125, 0.18133544921875, 0.20818328857421875, 0.2350311279296875, 0.26187896728515625, 0.288726806640625, 0.31557464599609375, 0.3424224853515625, 0.36927032470703125, 0.3961181640625, 0.42296600341796875, 0.4498138427734375, 0.47666168212890625, 0.503509521484375, 0.5303573608398438, 0.5572052001953125, 0.5840530395507812, 0.61090087890625, 0.6377487182617188, 0.6645965576171875, 0.6914443969726562, 0.718292236328125, 0.7451400756835938, 0.7719879150390625, 0.7988357543945312, 0.82568359375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 13.0, 11.0, 11.0, 13.0, 21.0, 34.0, 42.0, 64.0, 78.0, 143.0, 257.0, 520.0, 1031.0, 2042.0, 4486.0, 9521.0, 21194.0, 54452.0, 196069.0, 490297.0, 179737.0, 50780.0, 20191.0, 9180.0, 4200.0, 2045.0, 948.0, 464.0, 238.0, 142.0, 97.0, 68.0, 48.0, 40.0, 20.0, 21.0, 7.0, 6.0, 11.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.421112060546875, -2.34417724609375, -2.267242431640625, -2.1903076171875, -2.113372802734375, -2.03643798828125, -1.959503173828125, -1.882568359375, -1.805633544921875, -1.72869873046875, -1.651763916015625, -1.5748291015625, -1.497894287109375, -1.42095947265625, -1.344024658203125, -1.26708984375, -1.190155029296875, -1.11322021484375, -1.036285400390625, -0.9593505859375, -0.882415771484375, -0.80548095703125, -0.728546142578125, -0.651611328125, -0.574676513671875, -0.49774169921875, -0.420806884765625, -0.3438720703125, -0.266937255859375, -0.19000244140625, -0.113067626953125, -0.0361328125, 0.040802001953125, 0.11773681640625, 0.194671630859375, 0.2716064453125, 0.348541259765625, 0.42547607421875, 0.502410888671875, 0.579345703125, 0.656280517578125, 0.73321533203125, 0.810150146484375, 0.8870849609375, 0.964019775390625, 1.04095458984375, 1.117889404296875, 1.19482421875, 1.271759033203125, 1.34869384765625, 1.425628662109375, 1.5025634765625, 1.579498291015625, 1.65643310546875, 1.733367919921875, 1.810302734375, 1.887237548828125, 1.96417236328125, 2.041107177734375, 2.1180419921875, 2.194976806640625, 2.27191162109375, 2.348846435546875, 2.42578125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 9.0, 8.0, 10.0, 15.0, 14.0, 18.0, 22.0, 19.0, 26.0, 31.0, 31.0, 37.0, 36.0, 27.0, 45.0, 45.0, 40.0, 51.0, 38.0, 45.0, 30.0, 43.0, 54.0, 45.0, 32.0, 30.0, 20.0, 29.0, 16.0, 20.0, 12.0, 12.0, 11.0, 18.0, 8.0, 8.0, 8.0, 7.0, 7.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-2.951171875, -2.871490478515625, -2.79180908203125, -2.712127685546875, -2.6324462890625, -2.552764892578125, -2.47308349609375, -2.393402099609375, -2.313720703125, -2.234039306640625, -2.15435791015625, -2.074676513671875, -1.9949951171875, -1.915313720703125, -1.83563232421875, -1.755950927734375, -1.67626953125, -1.596588134765625, -1.51690673828125, -1.437225341796875, -1.3575439453125, -1.277862548828125, -1.19818115234375, -1.118499755859375, -1.038818359375, -0.959136962890625, -0.87945556640625, -0.799774169921875, -0.7200927734375, -0.640411376953125, -0.56072998046875, -0.481048583984375, -0.4013671875, -0.321685791015625, -0.24200439453125, -0.162322998046875, -0.0826416015625, -0.002960205078125, 0.07672119140625, 0.156402587890625, 0.236083984375, 0.315765380859375, 0.39544677734375, 0.475128173828125, 0.5548095703125, 0.634490966796875, 0.71417236328125, 0.793853759765625, 0.87353515625, 0.953216552734375, 1.03289794921875, 1.112579345703125, 1.1922607421875, 1.271942138671875, 1.35162353515625, 1.431304931640625, 1.510986328125, 1.590667724609375, 1.67034912109375, 1.750030517578125, 1.8297119140625, 1.909393310546875, 1.98907470703125, 2.068756103515625, 2.1484375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 9.0, 9.0, 13.0, 26.0, 45.0, 72.0, 142.0, 246.0, 427.0, 757.0, 1380.0, 2473.0, 4355.0, 7671.0, 14918.0, 33418.0, 99307.0, 345834.0, 363281.0, 105334.0, 35199.0, 15382.0, 8059.0, 4496.0, 2471.0, 1431.0, 770.0, 446.0, 240.0, 139.0, 82.0, 40.0, 36.0, 10.0, 14.0, 9.0, 3.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8408203125, -0.8153610229492188, -0.7899017333984375, -0.7644424438476562, -0.738983154296875, -0.7135238647460938, -0.6880645751953125, -0.6626052856445312, -0.63714599609375, -0.6116867065429688, -0.5862274169921875, -0.5607681274414062, -0.535308837890625, -0.5098495483398438, -0.4843902587890625, -0.45893096923828125, -0.4334716796875, -0.40801239013671875, -0.3825531005859375, -0.35709381103515625, -0.331634521484375, -0.30617523193359375, -0.2807159423828125, -0.25525665283203125, -0.22979736328125, -0.20433807373046875, -0.1788787841796875, -0.15341949462890625, -0.127960205078125, -0.10250091552734375, -0.0770416259765625, -0.05158233642578125, -0.026123046875, -0.00066375732421875, 0.0247955322265625, 0.05025482177734375, 0.075714111328125, 0.10117340087890625, 0.1266326904296875, 0.15209197998046875, 0.17755126953125, 0.20301055908203125, 0.2284698486328125, 0.25392913818359375, 0.279388427734375, 0.30484771728515625, 0.3303070068359375, 0.35576629638671875, 0.3812255859375, 0.40668487548828125, 0.4321441650390625, 0.45760345458984375, 0.483062744140625, 0.5085220336914062, 0.5339813232421875, 0.5594406127929688, 0.58489990234375, 0.6103591918945312, 0.6358184814453125, 0.6612777709960938, 0.686737060546875, 0.7121963500976562, 0.7376556396484375, 0.7631149291992188, 0.78857421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 2.0, 1.0, 3.0, 9.0, 21.0, 12.0, 24.0, 30.0, 55.0, 101.0, 176.0, 207.0, 138.0, 73.0, 45.0, 32.0, 7.0, 10.0, 11.0, 7.0, 3.0, 5.0, 4.0, 3.0, 3.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002340078353881836, -0.00022436119616031647, -0.00021471455693244934, -0.00020506791770458221, -0.0001954212784767151, -0.00018577463924884796, -0.00017612800002098083, -0.0001664813607931137, -0.00015683472156524658, -0.00014718808233737946, -0.00013754144310951233, -0.0001278948038816452, -0.00011824816465377808, -0.00010860152542591095, -9.895488619804382e-05, -8.93082469701767e-05, -7.966160774230957e-05, -7.001496851444244e-05, -6.036832928657532e-05, -5.072169005870819e-05, -4.1075050830841064e-05, -3.142841160297394e-05, -2.178177237510681e-05, -1.2135133147239685e-05, -2.4884939193725586e-06, 7.158145308494568e-06, 1.6804784536361694e-05, 2.645142376422882e-05, 3.609806299209595e-05, 4.5744702219963074e-05, 5.53913414478302e-05, 6.503798067569733e-05, 7.468461990356445e-05, 8.433125913143158e-05, 9.39778983592987e-05, 0.00010362453758716583, 0.00011327117681503296, 0.00012291781604290009, 0.0001325644552707672, 0.00014221109449863434, 0.00015185773372650146, 0.0001615043729543686, 0.00017115101218223572, 0.00018079765141010284, 0.00019044429063796997, 0.0002000909298658371, 0.00020973756909370422, 0.00021938420832157135, 0.00022903084754943848, 0.0002386774867773056, 0.00024832412600517273, 0.00025797076523303986, 0.000267617404460907, 0.0002772640436887741, 0.00028691068291664124, 0.00029655732214450836, 0.0003062039613723755, 0.0003158506006002426, 0.00032549723982810974, 0.00033514387905597687, 0.000344790518283844, 0.0003544371575117111, 0.00036408379673957825, 0.0003737304359674454, 0.0003833770751953125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 6.0, 5.0, 5.0, 13.0, 9.0, 27.0, 26.0, 30.0, 60.0, 79.0, 158.0, 250.0, 390.0, 734.0, 1325.0, 2620.0, 5020.0, 10453.0, 24435.0, 66821.0, 201070.0, 381461.0, 227099.0, 76056.0, 27036.0, 11504.0, 5478.0, 2907.0, 1557.0, 800.0, 456.0, 263.0, 132.0, 83.0, 64.0, 40.0, 19.0, 19.0, 15.0, 7.0, 7.0, 2.0, 6.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64404296875, -0.6206741333007812, -0.5973052978515625, -0.5739364624023438, -0.550567626953125, -0.5271987915039062, -0.5038299560546875, -0.48046112060546875, -0.45709228515625, -0.43372344970703125, -0.4103546142578125, -0.38698577880859375, -0.363616943359375, -0.34024810791015625, -0.3168792724609375, -0.29351043701171875, -0.2701416015625, -0.24677276611328125, -0.2234039306640625, -0.20003509521484375, -0.176666259765625, -0.15329742431640625, -0.1299285888671875, -0.10655975341796875, -0.08319091796875, -0.05982208251953125, -0.0364532470703125, -0.01308441162109375, 0.010284423828125, 0.03365325927734375, 0.0570220947265625, 0.08039093017578125, 0.103759765625, 0.12712860107421875, 0.1504974365234375, 0.17386627197265625, 0.197235107421875, 0.22060394287109375, 0.2439727783203125, 0.26734161376953125, 0.29071044921875, 0.31407928466796875, 0.3374481201171875, 0.36081695556640625, 0.384185791015625, 0.40755462646484375, 0.4309234619140625, 0.45429229736328125, 0.4776611328125, 0.5010299682617188, 0.5243988037109375, 0.5477676391601562, 0.571136474609375, 0.5945053100585938, 0.6178741455078125, 0.6412429809570312, 0.66461181640625, 0.6879806518554688, 0.7113494873046875, 0.7347183227539062, 0.758087158203125, 0.7814559936523438, 0.8048248291015625, 0.8281936645507812, 0.8515625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 3.0, 5.0, 7.0, 7.0, 9.0, 15.0, 24.0, 26.0, 56.0, 45.0, 73.0, 81.0, 100.0, 81.0, 77.0, 94.0, 71.0, 59.0, 40.0, 23.0, 25.0, 11.0, 18.0, 8.0, 6.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.775390625, -0.7516021728515625, -0.727813720703125, -0.7040252685546875, -0.68023681640625, -0.6564483642578125, -0.632659912109375, -0.6088714599609375, -0.5850830078125, -0.5612945556640625, -0.537506103515625, -0.5137176513671875, -0.48992919921875, -0.4661407470703125, -0.442352294921875, -0.4185638427734375, -0.394775390625, -0.3709869384765625, -0.347198486328125, -0.3234100341796875, -0.29962158203125, -0.2758331298828125, -0.252044677734375, -0.2282562255859375, -0.2044677734375, -0.1806793212890625, -0.156890869140625, -0.1331024169921875, -0.10931396484375, -0.0855255126953125, -0.061737060546875, -0.0379486083984375, -0.01416015625, 0.0096282958984375, 0.033416748046875, 0.0572052001953125, 0.08099365234375, 0.1047821044921875, 0.128570556640625, 0.1523590087890625, 0.1761474609375, 0.1999359130859375, 0.223724365234375, 0.2475128173828125, 0.27130126953125, 0.2950897216796875, 0.318878173828125, 0.3426666259765625, 0.366455078125, 0.3902435302734375, 0.414031982421875, 0.4378204345703125, 0.46160888671875, 0.4853973388671875, 0.509185791015625, 0.5329742431640625, 0.5567626953125, 0.5805511474609375, 0.604339599609375, 0.6281280517578125, 0.65191650390625, 0.6757049560546875, 0.699493408203125, 0.7232818603515625, 0.7470703125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 11.0, 9.0, 30.0, 74.0, 136.0, 189.0, 195.0, 162.0, 111.0, 49.0, 19.0, 11.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.039463996887207, -9.464722633361816, -8.889981269836426, -8.315240859985352, -7.740499496459961, -7.16575813293457, -6.59101676940918, -6.016275882720947, -5.441534519195557, -4.866793155670166, -4.292052268981934, -3.717310905456543, -3.1425697803497314, -2.56782865524292, -1.9930872917175293, -1.4183464050292969, -0.8436050415039062, -0.26886385679244995, 0.30587732791900635, 0.8806185722351074, 1.455359697341919, 2.0301008224487305, 2.604842185974121, 3.1795830726623535, 3.754324436187744, 4.329065799713135, 4.903806686401367, 5.478548049926758, 6.053289413452148, 6.628030300140381, 7.2027716636657715, 7.777512550354004, 8.352254867553711, 8.926996231079102, 9.501737594604492, 10.076478958129883, 10.651219367980957, 11.225960731506348, 11.800702095031738, 12.375442504882812, 12.950183868408203, 13.524925231933594, 14.099666595458984, 14.674407958984375, 15.24914836883545, 15.82388973236084, 16.398632049560547, 16.973371505737305, 17.548114776611328, 18.12285614013672, 18.69759750366211, 19.2723388671875, 19.84708023071289, 20.42182159423828, 20.996562957763672, 21.57130241394043, 22.14604377746582, 22.72078514099121, 23.2955265045166, 23.870267868041992, 24.445009231567383, 25.01974868774414, 25.59449005126953, 26.169231414794922, 26.743972778320312]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 9.0, 6.0, 6.0, 11.0, 13.0, 14.0, 13.0, 20.0, 35.0, 33.0, 43.0, 32.0, 34.0, 35.0, 36.0, 41.0, 41.0, 40.0, 36.0, 44.0, 46.0, 43.0, 31.0, 42.0, 44.0, 31.0, 35.0, 34.0, 26.0, 19.0, 20.0, 13.0, 12.0, 11.0, 10.0, 7.0, 9.0, 8.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.477691650390625, -6.257359504699707, -6.037026882171631, -5.816694736480713, -5.596362113952637, -5.376029968261719, -5.155697822570801, -4.935365200042725, -4.715032577514648, -4.4947004318237305, -4.274367809295654, -4.054035663604736, -3.83370304107666, -3.613370895385742, -3.393038511276245, -3.172706127166748, -2.95237398147583, -2.732041597366333, -2.511709213256836, -2.291377067565918, -2.071044445037842, -1.8507121801376343, -1.6303799152374268, -1.4100475311279297, -1.1897151470184326, -0.9693827629089355, -0.7490504384040833, -0.528718113899231, -0.3083857297897339, -0.08805334568023682, 0.1322789192199707, 0.3526113033294678, 0.5729436874389648, 0.7932760715484619, 1.013608455657959, 1.2339407205581665, 1.4542731046676636, 1.6746054887771606, 1.8949377536773682, 2.1152701377868652, 2.3356025218963623, 2.5559349060058594, 2.7762672901153564, 2.9965996742248535, 3.2169318199157715, 3.4372644424438477, 3.6575965881347656, 3.8779289722442627, 4.09826135635376, 4.318593502044678, 4.538926124572754, 4.759258270263672, 4.979590892791748, 5.199923038482666, 5.420255661010742, 5.64058780670166, 5.860919952392578, 6.081252098083496, 6.301584720611572, 6.52191686630249, 6.742249488830566, 6.962581634521484, 7.182913780212402, 7.4032464027404785, 7.623579025268555]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 8.0, 7.0, 15.0, 22.0, 26.0, 37.0, 52.0, 77.0, 127.0, 162.0, 229.0, 393.0, 773.0, 1396.0, 2416.0, 4594.0, 9178.0, 18267.0, 36715.0, 78389.0, 181691.0, 507498.0, 1434786.0, 1222297.0, 409334.0, 152377.0, 67122.0, 32367.0, 16121.0, 8086.0, 4231.0, 2372.0, 1190.0, 723.0, 420.0, 243.0, 173.0, 112.0, 77.0, 53.0, 42.0, 26.0, 15.0, 11.0, 13.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0], "bins": [-1.3251953125, -1.2872314453125, -1.249267578125, -1.2113037109375, -1.17333984375, -1.1353759765625, -1.097412109375, -1.0594482421875, -1.021484375, -0.9835205078125, -0.945556640625, -0.9075927734375, -0.86962890625, -0.8316650390625, -0.793701171875, -0.7557373046875, -0.7177734375, -0.6798095703125, -0.641845703125, -0.6038818359375, -0.56591796875, -0.5279541015625, -0.489990234375, -0.4520263671875, -0.4140625, -0.3760986328125, -0.338134765625, -0.3001708984375, -0.26220703125, -0.2242431640625, -0.186279296875, -0.1483154296875, -0.1103515625, -0.0723876953125, -0.034423828125, 0.0035400390625, 0.04150390625, 0.0794677734375, 0.117431640625, 0.1553955078125, 0.193359375, 0.2313232421875, 0.269287109375, 0.3072509765625, 0.34521484375, 0.3831787109375, 0.421142578125, 0.4591064453125, 0.4970703125, 0.5350341796875, 0.572998046875, 0.6109619140625, 0.64892578125, 0.6868896484375, 0.724853515625, 0.7628173828125, 0.80078125, 0.8387451171875, 0.876708984375, 0.9146728515625, 0.95263671875, 0.9906005859375, 1.028564453125, 1.0665283203125, 1.1044921875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 10.0, 8.0, 14.0, 6.0, 15.0, 25.0, 17.0, 23.0, 26.0, 30.0, 36.0, 47.0, 43.0, 44.0, 47.0, 53.0, 58.0, 45.0, 44.0, 45.0, 40.0, 42.0, 41.0, 43.0, 31.0, 34.0, 23.0, 22.0, 24.0, 13.0, 13.0, 8.0, 8.0, 2.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90966796875, -0.8745346069335938, -0.8394012451171875, -0.8042678833007812, -0.769134521484375, -0.7340011596679688, -0.6988677978515625, -0.6637344360351562, -0.62860107421875, -0.5934677124023438, -0.5583343505859375, -0.5232009887695312, -0.488067626953125, -0.45293426513671875, -0.4178009033203125, -0.38266754150390625, -0.3475341796875, -0.31240081787109375, -0.2772674560546875, -0.24213409423828125, -0.207000732421875, -0.17186737060546875, -0.1367340087890625, -0.10160064697265625, -0.06646728515625, -0.03133392333984375, 0.0037994384765625, 0.03893280029296875, 0.074066162109375, 0.10919952392578125, 0.1443328857421875, 0.17946624755859375, 0.214599609375, 0.24973297119140625, 0.2848663330078125, 0.31999969482421875, 0.355133056640625, 0.39026641845703125, 0.4253997802734375, 0.46053314208984375, 0.49566650390625, 0.5307998657226562, 0.5659332275390625, 0.6010665893554688, 0.636199951171875, 0.6713333129882812, 0.7064666748046875, 0.7416000366210938, 0.7767333984375, 0.8118667602539062, 0.8470001220703125, 0.8821334838867188, 0.917266845703125, 0.9524002075195312, 0.9875335693359375, 1.0226669311523438, 1.05780029296875, 1.0929336547851562, 1.1280670166015625, 1.1632003784179688, 1.198333740234375, 1.2334671020507812, 1.2686004638671875, 1.3037338256835938, 1.3388671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 8.0, 7.0, 10.0, 16.0, 25.0, 40.0, 63.0, 86.0, 148.0, 251.0, 397.0, 783.0, 1537.0, 3347.0, 7694.0, 19022.0, 50362.0, 145615.0, 538112.0, 2260972.0, 854839.0, 201239.0, 66770.0, 24812.0, 9802.0, 4226.0, 1844.0, 965.0, 474.0, 277.0, 194.0, 135.0, 70.0, 51.0, 30.0, 24.0, 11.0, 7.0, 9.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.044921875, -1.982269287109375, -1.91961669921875, -1.856964111328125, -1.7943115234375, -1.731658935546875, -1.66900634765625, -1.606353759765625, -1.543701171875, -1.481048583984375, -1.41839599609375, -1.355743408203125, -1.2930908203125, -1.230438232421875, -1.16778564453125, -1.105133056640625, -1.04248046875, -0.979827880859375, -0.91717529296875, -0.854522705078125, -0.7918701171875, -0.729217529296875, -0.66656494140625, -0.603912353515625, -0.541259765625, -0.478607177734375, -0.41595458984375, -0.353302001953125, -0.2906494140625, -0.227996826171875, -0.16534423828125, -0.102691650390625, -0.0400390625, 0.022613525390625, 0.08526611328125, 0.147918701171875, 0.2105712890625, 0.273223876953125, 0.33587646484375, 0.398529052734375, 0.461181640625, 0.523834228515625, 0.58648681640625, 0.649139404296875, 0.7117919921875, 0.774444580078125, 0.83709716796875, 0.899749755859375, 0.96240234375, 1.025054931640625, 1.08770751953125, 1.150360107421875, 1.2130126953125, 1.275665283203125, 1.33831787109375, 1.400970458984375, 1.463623046875, 1.526275634765625, 1.58892822265625, 1.651580810546875, 1.7142333984375, 1.776885986328125, 1.83953857421875, 1.902191162109375, 1.96484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 4.0, 2.0, 7.0, 7.0, 8.0, 4.0, 4.0, 14.0, 16.0, 17.0, 30.0, 46.0, 60.0, 69.0, 121.0, 172.0, 223.0, 350.0, 532.0, 716.0, 554.0, 361.0, 227.0, 149.0, 110.0, 66.0, 61.0, 36.0, 31.0, 15.0, 18.0, 16.0, 9.0, 7.0, 6.0, 2.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6640625, -1.59014892578125, -1.5162353515625, -1.44232177734375, -1.368408203125, -1.29449462890625, -1.2205810546875, -1.14666748046875, -1.07275390625, -0.99884033203125, -0.9249267578125, -0.85101318359375, -0.777099609375, -0.70318603515625, -0.6292724609375, -0.55535888671875, -0.4814453125, -0.40753173828125, -0.3336181640625, -0.25970458984375, -0.185791015625, -0.11187744140625, -0.0379638671875, 0.03594970703125, 0.10986328125, 0.18377685546875, 0.2576904296875, 0.33160400390625, 0.405517578125, 0.47943115234375, 0.5533447265625, 0.62725830078125, 0.701171875, 0.77508544921875, 0.8489990234375, 0.92291259765625, 0.996826171875, 1.07073974609375, 1.1446533203125, 1.21856689453125, 1.29248046875, 1.36639404296875, 1.4403076171875, 1.51422119140625, 1.588134765625, 1.66204833984375, 1.7359619140625, 1.80987548828125, 1.8837890625, 1.95770263671875, 2.0316162109375, 2.10552978515625, 2.179443359375, 2.25335693359375, 2.3272705078125, 2.40118408203125, 2.47509765625, 2.54901123046875, 2.6229248046875, 2.69683837890625, 2.770751953125, 2.84466552734375, 2.9185791015625, 2.99249267578125, 3.06640625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 0.0, 8.0, 10.0, 8.0, 20.0, 36.0, 66.0, 83.0, 101.0, 122.0, 121.0, 112.0, 104.0, 74.0, 49.0, 30.0, 23.0, 15.0, 5.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.56159496307373, -12.11709213256836, -11.672590255737305, -11.228087425231934, -10.783585548400879, -10.339082717895508, -9.894580841064453, -9.450078010559082, -9.005575180053711, -8.56107234954834, -8.116570472717285, -7.672067642211914, -7.227565765380859, -6.783062934875488, -6.338560581207275, -5.8940582275390625, -5.449556350708008, -5.005053997039795, -4.560551643371582, -4.116048812866211, -3.671546697616577, -3.2270443439483643, -2.7825417518615723, -2.3380393981933594, -1.8935370445251465, -1.4490346908569336, -1.0045322179794312, -0.5600297451019287, -0.11552739143371582, 0.32897496223449707, 0.7734775543212891, 1.217979907989502, 1.6624813079833984, 2.1069836616516113, 2.551486015319824, 2.995988607406616, 3.440490961074829, 3.884993314743042, 4.329495906829834, 4.773998260498047, 5.21850061416626, 5.663002967834473, 6.1075053215026855, 6.552007675170898, 6.9965105056762695, 7.441012382507324, 7.885515213012695, 8.33001708984375, 8.774519920349121, 9.219022750854492, 9.663524627685547, 10.108027458190918, 10.552529335021973, 10.997032165527344, 11.441534042358398, 11.88603687286377, 12.33053970336914, 12.775042533874512, 13.219544410705566, 13.664047241210938, 14.108549118041992, 14.553051948547363, 14.997554779052734, 15.442056655883789, 15.886558532714844]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 5.0, 10.0, 10.0, 12.0, 7.0, 11.0, 17.0, 15.0, 21.0, 18.0, 16.0, 28.0, 37.0, 27.0, 29.0, 30.0, 25.0, 51.0, 35.0, 44.0, 38.0, 36.0, 40.0, 47.0, 38.0, 35.0, 28.0, 42.0, 24.0, 18.0, 31.0, 24.0, 24.0, 16.0, 20.0, 15.0, 10.0, 13.0, 1.0, 13.0, 6.0, 5.0, 5.0, 8.0, 1.0, 7.0, 2.0, 3.0, 1.0], "bins": [-6.567473411560059, -6.384567737579346, -6.201662540435791, -6.018756866455078, -5.835851192474365, -5.652945518493652, -5.470040321350098, -5.287134647369385, -5.104228973388672, -4.921323299407959, -4.738418102264404, -4.555512428283691, -4.3726067543029785, -4.189701080322266, -4.006795883178711, -3.823890209197998, -3.6409850120544434, -3.4580795764923096, -3.2751739025115967, -3.092268466949463, -2.90936279296875, -2.726457357406616, -2.5435519218444824, -2.3606462478637695, -2.1777408123016357, -1.9948352575302124, -1.811929702758789, -1.6290242671966553, -1.446118712425232, -1.2632131576538086, -1.0803077220916748, -0.8974021673202515, -0.7144961357116699, -0.5315905809402466, -0.348685085773468, -0.16577959060668945, 0.017125964164733887, 0.20003151893615723, 0.382936954498291, 0.5658425092697144, 0.7487480640411377, 0.931653618812561, 1.1145591735839844, 1.2974646091461182, 1.4803701639175415, 1.6632757186889648, 1.8461811542510986, 2.0290865898132324, 2.2119922637939453, 2.394897699356079, 2.577803373336792, 2.760708808898926, 2.9436144828796387, 3.1265199184417725, 3.3094253540039062, 3.492331027984619, 3.675236463546753, 3.8581418991088867, 4.0410475730896, 4.2239532470703125, 4.406858444213867, 4.58976411819458, 4.772669792175293, 4.955574989318848, 5.1384806632995605]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 5.0, 14.0, 13.0, 8.0, 22.0, 31.0, 60.0, 80.0, 130.0, 222.0, 470.0, 875.0, 1848.0, 3626.0, 6921.0, 13474.0, 27183.0, 65734.0, 229021.0, 443381.0, 159389.0, 50507.0, 22275.0, 11367.0, 5871.0, 2939.0, 1502.0, 732.0, 385.0, 179.0, 111.0, 60.0, 45.0, 15.0, 25.0, 10.0, 7.0, 4.0, 3.0, 1.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.177734375, -2.10357666015625, -2.0294189453125, -1.95526123046875, -1.881103515625, -1.80694580078125, -1.7327880859375, -1.65863037109375, -1.58447265625, -1.51031494140625, -1.4361572265625, -1.36199951171875, -1.287841796875, -1.21368408203125, -1.1395263671875, -1.06536865234375, -0.9912109375, -0.91705322265625, -0.8428955078125, -0.76873779296875, -0.694580078125, -0.62042236328125, -0.5462646484375, -0.47210693359375, -0.39794921875, -0.32379150390625, -0.2496337890625, -0.17547607421875, -0.101318359375, -0.02716064453125, 0.0469970703125, 0.12115478515625, 0.1953125, 0.26947021484375, 0.3436279296875, 0.41778564453125, 0.491943359375, 0.56610107421875, 0.6402587890625, 0.71441650390625, 0.78857421875, 0.86273193359375, 0.9368896484375, 1.01104736328125, 1.085205078125, 1.15936279296875, 1.2335205078125, 1.30767822265625, 1.3818359375, 1.45599365234375, 1.5301513671875, 1.60430908203125, 1.678466796875, 1.75262451171875, 1.8267822265625, 1.90093994140625, 1.97509765625, 2.04925537109375, 2.1234130859375, 2.19757080078125, 2.271728515625, 2.34588623046875, 2.4200439453125, 2.49420166015625, 2.568359375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 8.0, 13.0, 11.0, 13.0, 12.0, 21.0, 20.0, 18.0, 25.0, 33.0, 35.0, 33.0, 38.0, 38.0, 24.0, 37.0, 40.0, 38.0, 35.0, 52.0, 42.0, 41.0, 41.0, 33.0, 31.0, 39.0, 28.0, 31.0, 29.0, 19.0, 25.0, 16.0, 23.0, 10.0, 7.0, 7.0, 8.0, 6.0, 4.0, 7.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.87646484375, -0.8469772338867188, -0.8174896240234375, -0.7880020141601562, -0.758514404296875, -0.7290267944335938, -0.6995391845703125, -0.6700515747070312, -0.64056396484375, -0.6110763549804688, -0.5815887451171875, -0.5521011352539062, -0.522613525390625, -0.49312591552734375, -0.4636383056640625, -0.43415069580078125, -0.4046630859375, -0.37517547607421875, -0.3456878662109375, -0.31620025634765625, -0.286712646484375, -0.25722503662109375, -0.2277374267578125, -0.19824981689453125, -0.16876220703125, -0.13927459716796875, -0.1097869873046875, -0.08029937744140625, -0.050811767578125, -0.02132415771484375, 0.0081634521484375, 0.03765106201171875, 0.067138671875, 0.09662628173828125, 0.1261138916015625, 0.15560150146484375, 0.185089111328125, 0.21457672119140625, 0.2440643310546875, 0.27355194091796875, 0.30303955078125, 0.33252716064453125, 0.3620147705078125, 0.39150238037109375, 0.420989990234375, 0.45047760009765625, 0.4799652099609375, 0.5094528198242188, 0.5389404296875, 0.5684280395507812, 0.5979156494140625, 0.6274032592773438, 0.656890869140625, 0.6863784790039062, 0.7158660888671875, 0.7453536987304688, 0.77484130859375, 0.8043289184570312, 0.8338165283203125, 0.8633041381835938, 0.892791748046875, 0.9222793579101562, 0.9517669677734375, 0.9812545776367188, 1.0107421875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 4.0, 11.0, 6.0, 8.0, 18.0, 19.0, 25.0, 28.0, 51.0, 73.0, 110.0, 146.0, 233.0, 399.0, 699.0, 1262.0, 2487.0, 5066.0, 10704.0, 23564.0, 59423.0, 229084.0, 479730.0, 154057.0, 44754.0, 18814.0, 8789.0, 4269.0, 1983.0, 1071.0, 535.0, 369.0, 239.0, 152.0, 108.0, 62.0, 59.0, 35.0, 27.0, 21.0, 12.0, 13.0, 11.0, 8.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.189453125, -2.114898681640625, -2.04034423828125, -1.965789794921875, -1.8912353515625, -1.816680908203125, -1.74212646484375, -1.667572021484375, -1.593017578125, -1.518463134765625, -1.44390869140625, -1.369354248046875, -1.2947998046875, -1.220245361328125, -1.14569091796875, -1.071136474609375, -0.99658203125, -0.922027587890625, -0.84747314453125, -0.772918701171875, -0.6983642578125, -0.623809814453125, -0.54925537109375, -0.474700927734375, -0.400146484375, -0.325592041015625, -0.25103759765625, -0.176483154296875, -0.1019287109375, -0.027374267578125, 0.04718017578125, 0.121734619140625, 0.1962890625, 0.270843505859375, 0.34539794921875, 0.419952392578125, 0.4945068359375, 0.569061279296875, 0.64361572265625, 0.718170166015625, 0.792724609375, 0.867279052734375, 0.94183349609375, 1.016387939453125, 1.0909423828125, 1.165496826171875, 1.24005126953125, 1.314605712890625, 1.38916015625, 1.463714599609375, 1.53826904296875, 1.612823486328125, 1.6873779296875, 1.761932373046875, 1.83648681640625, 1.911041259765625, 1.985595703125, 2.060150146484375, 2.13470458984375, 2.209259033203125, 2.2838134765625, 2.358367919921875, 2.43292236328125, 2.507476806640625, 2.58203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 5.0, 8.0, 10.0, 8.0, 20.0, 25.0, 19.0, 20.0, 42.0, 34.0, 43.0, 40.0, 55.0, 48.0, 55.0, 48.0, 46.0, 54.0, 57.0, 49.0, 56.0, 46.0, 37.0, 27.0, 27.0, 22.0, 24.0, 13.0, 12.0, 5.0, 11.0, 8.0, 3.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.365234375, -3.25640869140625, -3.1475830078125, -3.03875732421875, -2.929931640625, -2.82110595703125, -2.7122802734375, -2.60345458984375, -2.49462890625, -2.38580322265625, -2.2769775390625, -2.16815185546875, -2.059326171875, -1.95050048828125, -1.8416748046875, -1.73284912109375, -1.6240234375, -1.51519775390625, -1.4063720703125, -1.29754638671875, -1.188720703125, -1.07989501953125, -0.9710693359375, -0.86224365234375, -0.75341796875, -0.64459228515625, -0.5357666015625, -0.42694091796875, -0.318115234375, -0.20928955078125, -0.1004638671875, 0.00836181640625, 0.1171875, 0.22601318359375, 0.3348388671875, 0.44366455078125, 0.552490234375, 0.66131591796875, 0.7701416015625, 0.87896728515625, 0.98779296875, 1.09661865234375, 1.2054443359375, 1.31427001953125, 1.423095703125, 1.53192138671875, 1.6407470703125, 1.74957275390625, 1.8583984375, 1.96722412109375, 2.0760498046875, 2.18487548828125, 2.293701171875, 2.40252685546875, 2.5113525390625, 2.62017822265625, 2.72900390625, 2.83782958984375, 2.9466552734375, 3.05548095703125, 3.164306640625, 3.27313232421875, 3.3819580078125, 3.49078369140625, 3.599609375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 11.0, 10.0, 15.0, 18.0, 34.0, 47.0, 81.0, 112.0, 217.0, 342.0, 612.0, 1022.0, 1778.0, 3308.0, 5497.0, 10320.0, 19355.0, 37008.0, 82311.0, 221846.0, 364160.0, 168185.0, 65510.0, 30553.0, 16249.0, 8640.0, 4879.0, 2647.0, 1533.0, 892.0, 536.0, 328.0, 183.0, 117.0, 69.0, 30.0, 35.0, 17.0, 15.0, 7.0, 11.0, 7.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67529296875, -0.6530532836914062, -0.6308135986328125, -0.6085739135742188, -0.586334228515625, -0.5640945434570312, -0.5418548583984375, -0.5196151733398438, -0.49737548828125, -0.47513580322265625, -0.4528961181640625, -0.43065643310546875, -0.408416748046875, -0.38617706298828125, -0.3639373779296875, -0.34169769287109375, -0.3194580078125, -0.29721832275390625, -0.2749786376953125, -0.25273895263671875, -0.230499267578125, -0.20825958251953125, -0.1860198974609375, -0.16378021240234375, -0.14154052734375, -0.11930084228515625, -0.0970611572265625, -0.07482147216796875, -0.052581787109375, -0.03034210205078125, -0.0081024169921875, 0.01413726806640625, 0.036376953125, 0.05861663818359375, 0.0808563232421875, 0.10309600830078125, 0.125335693359375, 0.14757537841796875, 0.1698150634765625, 0.19205474853515625, 0.21429443359375, 0.23653411865234375, 0.2587738037109375, 0.28101348876953125, 0.303253173828125, 0.32549285888671875, 0.3477325439453125, 0.36997222900390625, 0.3922119140625, 0.41445159912109375, 0.4366912841796875, 0.45893096923828125, 0.481170654296875, 0.5034103393554688, 0.5256500244140625, 0.5478897094726562, 0.57012939453125, 0.5923690795898438, 0.6146087646484375, 0.6368484497070312, 0.659088134765625, 0.6813278198242188, 0.7035675048828125, 0.7258071899414062, 0.748046875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 5.0, 4.0, 6.0, 11.0, 11.0, 9.0, 14.0, 13.0, 25.0, 34.0, 65.0, 80.0, 137.0, 148.0, 138.0, 85.0, 55.0, 35.0, 18.0, 20.0, 9.0, 9.0, 10.0, 6.0, 4.0, 8.0, 8.0, 5.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0003046989440917969, -0.00029615871608257294, -0.000287618488073349, -0.00027907826006412506, -0.0002705380320549011, -0.0002619978040456772, -0.00025345757603645325, -0.0002449173480272293, -0.00023637712001800537, -0.00022783689200878143, -0.0002192966639995575, -0.00021075643599033356, -0.00020221620798110962, -0.00019367597997188568, -0.00018513575196266174, -0.0001765955239534378, -0.00016805529594421387, -0.00015951506793498993, -0.000150974839925766, -0.00014243461191654205, -0.00013389438390731812, -0.00012535415589809418, -0.00011681392788887024, -0.0001082736998796463, -9.973347187042236e-05, -9.119324386119843e-05, -8.265301585197449e-05, -7.411278784275055e-05, -6.557255983352661e-05, -5.703233182430267e-05, -4.8492103815078735e-05, -3.99518758058548e-05, -3.141164779663086e-05, -2.287141978740692e-05, -1.4331191778182983e-05, -5.790963768959045e-06, 2.7492642402648926e-06, 1.128949224948883e-05, 1.982972025871277e-05, 2.8369948267936707e-05, 3.6910176277160645e-05, 4.545040428638458e-05, 5.399063229560852e-05, 6.253086030483246e-05, 7.10710883140564e-05, 7.961131632328033e-05, 8.815154433250427e-05, 9.669177234172821e-05, 0.00010523200035095215, 0.00011377222836017609, 0.00012231245636940002, 0.00013085268437862396, 0.0001393929123878479, 0.00014793314039707184, 0.00015647336840629578, 0.00016501359641551971, 0.00017355382442474365, 0.0001820940524339676, 0.00019063428044319153, 0.00019917450845241547, 0.0002077147364616394, 0.00021625496447086334, 0.00022479519248008728, 0.00023333542048931122, 0.00024187564849853516]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 4.0, 7.0, 12.0, 13.0, 21.0, 33.0, 51.0, 76.0, 105.0, 175.0, 204.0, 385.0, 604.0, 1075.0, 2154.0, 4424.0, 9917.0, 22857.0, 53495.0, 133934.0, 318839.0, 295496.0, 118454.0, 47971.0, 20530.0, 9031.0, 4104.0, 1969.0, 1038.0, 560.0, 333.0, 237.0, 147.0, 84.0, 75.0, 46.0, 28.0, 21.0, 23.0, 9.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.81640625, -0.7923507690429688, -0.7682952880859375, -0.7442398071289062, -0.720184326171875, -0.6961288452148438, -0.6720733642578125, -0.6480178833007812, -0.62396240234375, -0.5999069213867188, -0.5758514404296875, -0.5517959594726562, -0.527740478515625, -0.5036849975585938, -0.4796295166015625, -0.45557403564453125, -0.4315185546875, -0.40746307373046875, -0.3834075927734375, -0.35935211181640625, -0.335296630859375, -0.31124114990234375, -0.2871856689453125, -0.26313018798828125, -0.23907470703125, -0.21501922607421875, -0.1909637451171875, -0.16690826416015625, -0.142852783203125, -0.11879730224609375, -0.0947418212890625, -0.07068634033203125, -0.046630859375, -0.02257537841796875, 0.0014801025390625, 0.02553558349609375, 0.049591064453125, 0.07364654541015625, 0.0977020263671875, 0.12175750732421875, 0.14581298828125, 0.16986846923828125, 0.1939239501953125, 0.21797943115234375, 0.242034912109375, 0.26609039306640625, 0.2901458740234375, 0.31420135498046875, 0.3382568359375, 0.36231231689453125, 0.3863677978515625, 0.41042327880859375, 0.434478759765625, 0.45853424072265625, 0.4825897216796875, 0.5066452026367188, 0.53070068359375, 0.5547561645507812, 0.5788116455078125, 0.6028671264648438, 0.626922607421875, 0.6509780883789062, 0.6750335693359375, 0.6990890502929688, 0.72314453125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 3.0, 5.0, 4.0, 10.0, 14.0, 11.0, 25.0, 16.0, 23.0, 50.0, 36.0, 44.0, 78.0, 67.0, 83.0, 89.0, 79.0, 68.0, 60.0, 45.0, 30.0, 24.0, 15.0, 23.0, 18.0, 14.0, 20.0, 8.0, 6.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.0244140625, -0.9966583251953125, -0.968902587890625, -0.9411468505859375, -0.91339111328125, -0.8856353759765625, -0.857879638671875, -0.8301239013671875, -0.8023681640625, -0.7746124267578125, -0.746856689453125, -0.7191009521484375, -0.69134521484375, -0.6635894775390625, -0.635833740234375, -0.6080780029296875, -0.580322265625, -0.5525665283203125, -0.524810791015625, -0.4970550537109375, -0.46929931640625, -0.4415435791015625, -0.413787841796875, -0.3860321044921875, -0.3582763671875, -0.3305206298828125, -0.302764892578125, -0.2750091552734375, -0.24725341796875, -0.2194976806640625, -0.191741943359375, -0.1639862060546875, -0.13623046875, -0.1084747314453125, -0.080718994140625, -0.0529632568359375, -0.02520751953125, 0.0025482177734375, 0.030303955078125, 0.0580596923828125, 0.0858154296875, 0.1135711669921875, 0.141326904296875, 0.1690826416015625, 0.19683837890625, 0.2245941162109375, 0.252349853515625, 0.2801055908203125, 0.307861328125, 0.3356170654296875, 0.363372802734375, 0.3911285400390625, 0.41888427734375, 0.4466400146484375, 0.474395751953125, 0.5021514892578125, 0.5299072265625, 0.5576629638671875, 0.585418701171875, 0.6131744384765625, 0.64093017578125, 0.6686859130859375, 0.696441650390625, 0.7241973876953125, 0.751953125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 10.0, 18.0, 44.0, 94.0, 158.0, 201.0, 174.0, 142.0, 81.0, 38.0, 16.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.015438079833984, -18.417219161987305, -17.819000244140625, -17.220779418945312, -16.622560501098633, -16.024341583251953, -15.426122665405273, -14.827902793884277, -14.229682922363281, -13.631464004516602, -13.033244132995605, -12.435025215148926, -11.83680534362793, -11.23858642578125, -10.64036750793457, -10.042147636413574, -9.443928718566895, -8.845709800720215, -8.247489929199219, -7.649271011352539, -7.051051139831543, -6.452832221984863, -5.854612827301025, -5.2563934326171875, -4.65817403793335, -4.059954643249512, -3.461735248565674, -2.863516092300415, -2.265296697616577, -1.6670773029327393, -1.0688581466674805, -0.4706387519836426, 0.1275806427001953, 0.7257999777793884, 1.3240193128585815, 1.9222385883331299, 2.5204579830169678, 3.1186773777008057, 3.7168965339660645, 4.315115928649902, 4.91333532333374, 5.511554718017578, 6.109774112701416, 6.707993507385254, 7.306212425231934, 7.90443229675293, 8.50265121459961, 9.100870132446289, 9.699090003967285, 10.297308921813965, 10.895528793334961, 11.49374771118164, 12.091967582702637, 12.690186500549316, 13.288406372070312, 13.886625289916992, 14.484844207763672, 15.083063125610352, 15.681282997131348, 16.279502868652344, 16.877721786499023, 17.475940704345703, 18.074159622192383, 18.672378540039062, 19.270599365234375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 4.0, 7.0, 2.0, 10.0, 14.0, 12.0, 13.0, 23.0, 18.0, 20.0, 24.0, 33.0, 30.0, 37.0, 45.0, 37.0, 38.0, 43.0, 44.0, 41.0, 45.0, 45.0, 45.0, 47.0, 49.0, 25.0, 42.0, 36.0, 26.0, 21.0, 21.0, 21.0, 15.0, 14.0, 17.0, 14.0, 8.0, 6.0, 5.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.377749443054199, -7.145025730133057, -6.912302494049072, -6.67957878112793, -6.446855068206787, -6.2141313552856445, -5.98140811920166, -5.748684406280518, -5.515960693359375, -5.283236980438232, -5.050513744354248, -4.8177900314331055, -4.585066318511963, -4.35234260559082, -4.119619369506836, -3.8868956565856934, -3.65417218208313, -3.4214487075805664, -3.188724994659424, -2.9560015201568604, -2.7232778072357178, -2.4905543327331543, -2.2578306198120117, -2.0251071453094482, -1.7923835515975952, -1.5596599578857422, -1.3269363641738892, -1.0942127704620361, -0.8614892363548279, -0.6287657022476196, -0.3960421085357666, -0.16331851482391357, 0.06940507888793945, 0.3021286725997925, 0.5348522663116455, 0.7675758004188538, 1.0002994537353516, 1.233022928237915, 1.465746521949768, 1.698470115661621, 1.9311937093734741, 2.163917303085327, 2.3966407775878906, 2.629364490509033, 2.8620879650115967, 3.09481143951416, 3.3275351524353027, 3.5602588653564453, 3.792982339859009, 4.025705814361572, 4.258429527282715, 4.491153240203857, 4.723876476287842, 4.956600189208984, 5.189323902130127, 5.4220476150512695, 5.654770851135254, 5.8874945640563965, 6.120217800140381, 6.352941513061523, 6.585665225982666, 6.818388938903809, 7.051112174987793, 7.2838358879089355, 7.516559600830078]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 8.0, 17.0, 22.0, 27.0, 47.0, 59.0, 142.0, 192.0, 318.0, 577.0, 1089.0, 1903.0, 3373.0, 6195.0, 11338.0, 21187.0, 39426.0, 76356.0, 155314.0, 348014.0, 806855.0, 1237383.0, 820058.0, 352372.0, 154094.0, 74141.0, 38988.0, 20300.0, 10735.0, 6086.0, 3305.0, 1786.0, 982.0, 593.0, 387.0, 234.0, 133.0, 93.0, 50.0, 25.0, 27.0, 11.0, 11.0, 5.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.81396484375, -0.7843551635742188, -0.7547454833984375, -0.7251358032226562, -0.695526123046875, -0.6659164428710938, -0.6363067626953125, -0.6066970825195312, -0.57708740234375, -0.5474777221679688, -0.5178680419921875, -0.48825836181640625, -0.458648681640625, -0.42903900146484375, -0.3994293212890625, -0.36981964111328125, -0.3402099609375, -0.31060028076171875, -0.2809906005859375, -0.25138092041015625, -0.221771240234375, -0.19216156005859375, -0.1625518798828125, -0.13294219970703125, -0.10333251953125, -0.07372283935546875, -0.0441131591796875, -0.01450347900390625, 0.015106201171875, 0.04471588134765625, 0.0743255615234375, 0.10393524169921875, 0.133544921875, 0.16315460205078125, 0.1927642822265625, 0.22237396240234375, 0.251983642578125, 0.28159332275390625, 0.3112030029296875, 0.34081268310546875, 0.37042236328125, 0.40003204345703125, 0.4296417236328125, 0.45925140380859375, 0.488861083984375, 0.5184707641601562, 0.5480804443359375, 0.5776901245117188, 0.6072998046875, 0.6369094848632812, 0.6665191650390625, 0.6961288452148438, 0.725738525390625, 0.7553482055664062, 0.7849578857421875, 0.8145675659179688, 0.84417724609375, 0.8737869262695312, 0.9033966064453125, 0.9330062866210938, 0.962615966796875, 0.9922256469726562, 1.0218353271484375, 1.0514450073242188, 1.0810546875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 7.0, 5.0, 5.0, 7.0, 16.0, 10.0, 17.0, 16.0, 26.0, 24.0, 18.0, 32.0, 28.0, 40.0, 38.0, 36.0, 38.0, 31.0, 39.0, 40.0, 50.0, 51.0, 37.0, 26.0, 30.0, 34.0, 36.0, 31.0, 29.0, 39.0, 28.0, 24.0, 15.0, 24.0, 17.0, 14.0, 8.0, 5.0, 6.0, 7.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8203125, -0.7918930053710938, -0.7634735107421875, -0.7350540161132812, -0.706634521484375, -0.6782150268554688, -0.6497955322265625, -0.6213760375976562, -0.59295654296875, -0.5645370483398438, -0.5361175537109375, -0.5076980590820312, -0.479278564453125, -0.45085906982421875, -0.4224395751953125, -0.39402008056640625, -0.3656005859375, -0.33718109130859375, -0.3087615966796875, -0.28034210205078125, -0.251922607421875, -0.22350311279296875, -0.1950836181640625, -0.16666412353515625, -0.13824462890625, -0.10982513427734375, -0.0814056396484375, -0.05298614501953125, -0.024566650390625, 0.00385284423828125, 0.0322723388671875, 0.06069183349609375, 0.089111328125, 0.11753082275390625, 0.1459503173828125, 0.17436981201171875, 0.202789306640625, 0.23120880126953125, 0.2596282958984375, 0.28804779052734375, 0.31646728515625, 0.34488677978515625, 0.3733062744140625, 0.40172576904296875, 0.430145263671875, 0.45856475830078125, 0.4869842529296875, 0.5154037475585938, 0.5438232421875, 0.5722427368164062, 0.6006622314453125, 0.6290817260742188, 0.657501220703125, 0.6859207153320312, 0.7143402099609375, 0.7427597045898438, 0.77117919921875, 0.7995986938476562, 0.8280181884765625, 0.8564376831054688, 0.884857177734375, 0.9132766723632812, 0.9416961669921875, 0.9701156616210938, 0.99853515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 6.0, 14.0, 19.0, 29.0, 44.0, 68.0, 99.0, 141.0, 273.0, 474.0, 866.0, 1785.0, 4319.0, 11631.0, 34431.0, 109180.0, 402003.0, 1924147.0, 1313032.0, 271869.0, 79028.0, 25308.0, 8975.0, 3337.0, 1450.0, 717.0, 404.0, 238.0, 136.0, 96.0, 51.0, 37.0, 22.0, 23.0, 8.0, 9.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.275390625, -2.20819091796875, -2.1409912109375, -2.07379150390625, -2.006591796875, -1.93939208984375, -1.8721923828125, -1.80499267578125, -1.73779296875, -1.67059326171875, -1.6033935546875, -1.53619384765625, -1.468994140625, -1.40179443359375, -1.3345947265625, -1.26739501953125, -1.2001953125, -1.13299560546875, -1.0657958984375, -0.99859619140625, -0.931396484375, -0.86419677734375, -0.7969970703125, -0.72979736328125, -0.66259765625, -0.59539794921875, -0.5281982421875, -0.46099853515625, -0.393798828125, -0.32659912109375, -0.2593994140625, -0.19219970703125, -0.125, -0.05780029296875, 0.0093994140625, 0.07659912109375, 0.143798828125, 0.21099853515625, 0.2781982421875, 0.34539794921875, 0.41259765625, 0.47979736328125, 0.5469970703125, 0.61419677734375, 0.681396484375, 0.74859619140625, 0.8157958984375, 0.88299560546875, 0.9501953125, 1.01739501953125, 1.0845947265625, 1.15179443359375, 1.218994140625, 1.28619384765625, 1.3533935546875, 1.42059326171875, 1.48779296875, 1.55499267578125, 1.6221923828125, 1.68939208984375, 1.756591796875, 1.82379150390625, 1.8909912109375, 1.95819091796875, 2.025390625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 7.0, 8.0, 5.0, 12.0, 16.0, 23.0, 27.0, 38.0, 58.0, 73.0, 94.0, 121.0, 163.0, 236.0, 330.0, 472.0, 578.0, 488.0, 350.0, 277.0, 190.0, 141.0, 85.0, 74.0, 50.0, 37.0, 29.0, 25.0, 15.0, 19.0, 9.0, 7.0, 6.0, 8.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.396484375, -2.3272705078125, -2.258056640625, -2.1888427734375, -2.11962890625, -2.0504150390625, -1.981201171875, -1.9119873046875, -1.8427734375, -1.7735595703125, -1.704345703125, -1.6351318359375, -1.56591796875, -1.4967041015625, -1.427490234375, -1.3582763671875, -1.2890625, -1.2198486328125, -1.150634765625, -1.0814208984375, -1.01220703125, -0.9429931640625, -0.873779296875, -0.8045654296875, -0.7353515625, -0.6661376953125, -0.596923828125, -0.5277099609375, -0.45849609375, -0.3892822265625, -0.320068359375, -0.2508544921875, -0.181640625, -0.1124267578125, -0.043212890625, 0.0260009765625, 0.09521484375, 0.1644287109375, 0.233642578125, 0.3028564453125, 0.3720703125, 0.4412841796875, 0.510498046875, 0.5797119140625, 0.64892578125, 0.7181396484375, 0.787353515625, 0.8565673828125, 0.92578125, 0.9949951171875, 1.064208984375, 1.1334228515625, 1.20263671875, 1.2718505859375, 1.341064453125, 1.4102783203125, 1.4794921875, 1.5487060546875, 1.617919921875, 1.6871337890625, 1.75634765625, 1.8255615234375, 1.894775390625, 1.9639892578125, 2.033203125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 3.0, 6.0, 21.0, 49.0, 84.0, 151.0, 148.0, 196.0, 135.0, 89.0, 52.0, 30.0, 20.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.725340843200684, -14.111676216125488, -13.498011589050293, -12.884346961975098, -12.270682334899902, -11.657017707824707, -11.043354034423828, -10.429689407348633, -9.816024780273438, -9.202360153198242, -8.588695526123047, -7.975030899047852, -7.361366271972656, -6.747701644897461, -6.134037494659424, -5.5203728675842285, -4.906707763671875, -4.29304313659668, -3.6793785095214844, -3.065714120864868, -2.452049493789673, -1.8383848667144775, -1.2247204780578613, -0.611055850982666, 0.002608776092529297, 0.6162733435630798, 1.2299379110336304, 1.8436024188995361, 2.4572670459747314, 3.0709316730499268, 3.684596061706543, 4.298260688781738, 4.91192626953125, 5.525590896606445, 6.139255523681641, 6.752920150756836, 7.366584777832031, 7.980249404907227, 8.593914031982422, 9.207578659057617, 9.821243286132812, 10.434907913208008, 11.048572540283203, 11.662237167358398, 12.275901794433594, 12.889566421508789, 13.503231048583984, 14.11689567565918, 14.730559349060059, 15.344223976135254, 15.95788860321045, 16.571552276611328, 17.185216903686523, 17.79888153076172, 18.412546157836914, 19.02621078491211, 19.639875411987305, 20.2535400390625, 20.867204666137695, 21.48086929321289, 22.094533920288086, 22.70819854736328, 23.321863174438477, 23.935527801513672, 24.549192428588867]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 8.0, 6.0, 6.0, 8.0, 16.0, 14.0, 17.0, 14.0, 30.0, 21.0, 24.0, 27.0, 28.0, 24.0, 52.0, 33.0, 32.0, 43.0, 50.0, 44.0, 33.0, 52.0, 40.0, 41.0, 37.0, 31.0, 38.0, 26.0, 27.0, 34.0, 15.0, 14.0, 23.0, 15.0, 10.0, 9.0, 8.0, 12.0, 7.0, 9.0, 7.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.795619010925293, -6.583591938018799, -6.371564865112305, -6.1595377922058105, -5.947510719299316, -5.735483169555664, -5.523456573486328, -5.311429023742676, -5.099401950836182, -4.8873748779296875, -4.675347805023193, -4.463320732116699, -4.251293659210205, -4.039266586303711, -3.8272392749786377, -3.6152119636535645, -3.4031851291656494, -3.1911580562591553, -2.979130983352661, -2.767103672027588, -2.5550765991210938, -2.3430495262145996, -2.1310224533081055, -1.9189952611923218, -1.7069681882858276, -1.4949411153793335, -1.2829139232635498, -1.0708868503570557, -0.8588597178459167, -0.6468325853347778, -0.4348055124282837, -0.2227783203125, -0.01075124740600586, 0.20127587020397186, 0.4133029878139496, 0.6253300905227661, 0.837357223033905, 1.049384355545044, 1.261411428451538, 1.4734386205673218, 1.685465693473816, 1.89749276638031, 2.1095199584960938, 2.321547031402588, 2.533574104309082, 2.745601177215576, 2.9576282501220703, 3.1696555614471436, 3.3816826343536377, 3.593709707260132, 3.805736780166626, 4.017764091491699, 4.229791164398193, 4.4418182373046875, 4.653845310211182, 4.865872383117676, 5.07789945602417, 5.289926528930664, 5.501953601837158, 5.713980674743652, 5.9260077476501465, 6.138034820556641, 6.350062370300293, 6.562089443206787, 6.774116516113281]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 3.0, 6.0, 11.0, 16.0, 27.0, 29.0, 42.0, 71.0, 114.0, 135.0, 216.0, 340.0, 486.0, 838.0, 1329.0, 1974.0, 3307.0, 5371.0, 8642.0, 13943.0, 23469.0, 41603.0, 80991.0, 168850.0, 268535.0, 205579.0, 101920.0, 50090.0, 27728.0, 16347.0, 10077.0, 6159.0, 3825.0, 2368.0, 1483.0, 927.0, 642.0, 351.0, 255.0, 151.0, 97.0, 57.0, 49.0, 28.0, 28.0, 18.0, 14.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.216796875, -1.1743316650390625, -1.131866455078125, -1.0894012451171875, -1.04693603515625, -1.0044708251953125, -0.962005615234375, -0.9195404052734375, -0.8770751953125, -0.8346099853515625, -0.792144775390625, -0.7496795654296875, -0.70721435546875, -0.6647491455078125, -0.622283935546875, -0.5798187255859375, -0.537353515625, -0.4948883056640625, -0.452423095703125, -0.4099578857421875, -0.36749267578125, -0.3250274658203125, -0.282562255859375, -0.2400970458984375, -0.1976318359375, -0.1551666259765625, -0.112701416015625, -0.0702362060546875, -0.02777099609375, 0.0146942138671875, 0.057159423828125, 0.0996246337890625, 0.14208984375, 0.1845550537109375, 0.227020263671875, 0.2694854736328125, 0.31195068359375, 0.3544158935546875, 0.396881103515625, 0.4393463134765625, 0.4818115234375, 0.5242767333984375, 0.566741943359375, 0.6092071533203125, 0.65167236328125, 0.6941375732421875, 0.736602783203125, 0.7790679931640625, 0.821533203125, 0.8639984130859375, 0.906463623046875, 0.9489288330078125, 0.99139404296875, 1.0338592529296875, 1.076324462890625, 1.1187896728515625, 1.1612548828125, 1.2037200927734375, 1.246185302734375, 1.2886505126953125, 1.33111572265625, 1.3735809326171875, 1.416046142578125, 1.4585113525390625, 1.5009765625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 1.0, 9.0, 11.0, 7.0, 9.0, 11.0, 24.0, 16.0, 18.0, 20.0, 25.0, 23.0, 29.0, 35.0, 42.0, 42.0, 34.0, 34.0, 43.0, 48.0, 46.0, 46.0, 44.0, 37.0, 51.0, 41.0, 34.0, 45.0, 27.0, 17.0, 31.0, 16.0, 15.0, 18.0, 6.0, 15.0, 5.0, 6.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9130859375, -0.8842544555664062, -0.8554229736328125, -0.8265914916992188, -0.797760009765625, -0.7689285278320312, -0.7400970458984375, -0.7112655639648438, -0.68243408203125, -0.6536026000976562, -0.6247711181640625, -0.5959396362304688, -0.567108154296875, -0.5382766723632812, -0.5094451904296875, -0.48061370849609375, -0.4517822265625, -0.42295074462890625, -0.3941192626953125, -0.36528778076171875, -0.336456298828125, -0.30762481689453125, -0.2787933349609375, -0.24996185302734375, -0.22113037109375, -0.19229888916015625, -0.1634674072265625, -0.13463592529296875, -0.105804443359375, -0.07697296142578125, -0.0481414794921875, -0.01930999755859375, 0.009521484375, 0.03835296630859375, 0.0671844482421875, 0.09601593017578125, 0.124847412109375, 0.15367889404296875, 0.1825103759765625, 0.21134185791015625, 0.24017333984375, 0.26900482177734375, 0.2978363037109375, 0.32666778564453125, 0.355499267578125, 0.38433074951171875, 0.4131622314453125, 0.44199371337890625, 0.4708251953125, 0.49965667724609375, 0.5284881591796875, 0.5573196411132812, 0.586151123046875, 0.6149826049804688, 0.6438140869140625, 0.6726455688476562, 0.70147705078125, 0.7303085327148438, 0.7591400146484375, 0.7879714965820312, 0.816802978515625, 0.8456344604492188, 0.8744659423828125, 0.9032974243164062, 0.93212890625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 6.0, 5.0, 10.0, 17.0, 8.0, 21.0, 36.0, 59.0, 86.0, 85.0, 149.0, 228.0, 360.0, 649.0, 1216.0, 2511.0, 5291.0, 12333.0, 28655.0, 78674.0, 271589.0, 420448.0, 144910.0, 46653.0, 18793.0, 8155.0, 3698.0, 1721.0, 882.0, 470.0, 267.0, 177.0, 111.0, 92.0, 52.0, 37.0, 34.0, 20.0, 10.0, 6.0, 8.0, 8.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.23046875, -2.15673828125, -2.0830078125, -2.00927734375, -1.935546875, -1.86181640625, -1.7880859375, -1.71435546875, -1.640625, -1.56689453125, -1.4931640625, -1.41943359375, -1.345703125, -1.27197265625, -1.1982421875, -1.12451171875, -1.05078125, -0.97705078125, -0.9033203125, -0.82958984375, -0.755859375, -0.68212890625, -0.6083984375, -0.53466796875, -0.4609375, -0.38720703125, -0.3134765625, -0.23974609375, -0.166015625, -0.09228515625, -0.0185546875, 0.05517578125, 0.12890625, 0.20263671875, 0.2763671875, 0.35009765625, 0.423828125, 0.49755859375, 0.5712890625, 0.64501953125, 0.71875, 0.79248046875, 0.8662109375, 0.93994140625, 1.013671875, 1.08740234375, 1.1611328125, 1.23486328125, 1.30859375, 1.38232421875, 1.4560546875, 1.52978515625, 1.603515625, 1.67724609375, 1.7509765625, 1.82470703125, 1.8984375, 1.97216796875, 2.0458984375, 2.11962890625, 2.193359375, 2.26708984375, 2.3408203125, 2.41455078125, 2.48828125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 11.0, 1.0, 15.0, 14.0, 15.0, 24.0, 19.0, 28.0, 12.0, 38.0, 33.0, 36.0, 45.0, 44.0, 33.0, 48.0, 44.0, 65.0, 40.0, 41.0, 34.0, 32.0, 38.0, 38.0, 25.0, 23.0, 31.0, 19.0, 27.0, 14.0, 21.0, 8.0, 8.0, 16.0, 4.0, 6.0, 4.0, 9.0, 6.0, 2.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.58203125, -2.5020751953125, -2.422119140625, -2.3421630859375, -2.26220703125, -2.1822509765625, -2.102294921875, -2.0223388671875, -1.9423828125, -1.8624267578125, -1.782470703125, -1.7025146484375, -1.62255859375, -1.5426025390625, -1.462646484375, -1.3826904296875, -1.302734375, -1.2227783203125, -1.142822265625, -1.0628662109375, -0.98291015625, -0.9029541015625, -0.822998046875, -0.7430419921875, -0.6630859375, -0.5831298828125, -0.503173828125, -0.4232177734375, -0.34326171875, -0.2633056640625, -0.183349609375, -0.1033935546875, -0.0234375, 0.0565185546875, 0.136474609375, 0.2164306640625, 0.29638671875, 0.3763427734375, 0.456298828125, 0.5362548828125, 0.6162109375, 0.6961669921875, 0.776123046875, 0.8560791015625, 0.93603515625, 1.0159912109375, 1.095947265625, 1.1759033203125, 1.255859375, 1.3358154296875, 1.415771484375, 1.4957275390625, 1.57568359375, 1.6556396484375, 1.735595703125, 1.8155517578125, 1.8955078125, 1.9754638671875, 2.055419921875, 2.1353759765625, 2.21533203125, 2.2952880859375, 2.375244140625, 2.4552001953125, 2.53515625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 4.0, 7.0, 5.0, 7.0, 14.0, 22.0, 38.0, 67.0, 95.0, 155.0, 224.0, 394.0, 644.0, 991.0, 1687.0, 2516.0, 4108.0, 6717.0, 10892.0, 18922.0, 35150.0, 75230.0, 175403.0, 298576.0, 219395.0, 97501.0, 43707.0, 22624.0, 12901.0, 7874.0, 4829.0, 2940.0, 1807.0, 1128.0, 712.0, 452.0, 273.0, 176.0, 122.0, 96.0, 50.0, 29.0, 19.0, 13.0, 12.0, 6.0, 5.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.599609375, -0.580047607421875, -0.56048583984375, -0.540924072265625, -0.5213623046875, -0.501800537109375, -0.48223876953125, -0.462677001953125, -0.443115234375, -0.423553466796875, -0.40399169921875, -0.384429931640625, -0.3648681640625, -0.345306396484375, -0.32574462890625, -0.306182861328125, -0.28662109375, -0.267059326171875, -0.24749755859375, -0.227935791015625, -0.2083740234375, -0.188812255859375, -0.16925048828125, -0.149688720703125, -0.130126953125, -0.110565185546875, -0.09100341796875, -0.071441650390625, -0.0518798828125, -0.032318115234375, -0.01275634765625, 0.006805419921875, 0.0263671875, 0.045928955078125, 0.06549072265625, 0.085052490234375, 0.1046142578125, 0.124176025390625, 0.14373779296875, 0.163299560546875, 0.182861328125, 0.202423095703125, 0.22198486328125, 0.241546630859375, 0.2611083984375, 0.280670166015625, 0.30023193359375, 0.319793701171875, 0.33935546875, 0.358917236328125, 0.37847900390625, 0.398040771484375, 0.4176025390625, 0.437164306640625, 0.45672607421875, 0.476287841796875, 0.495849609375, 0.515411376953125, 0.53497314453125, 0.554534912109375, 0.5740966796875, 0.593658447265625, 0.61322021484375, 0.632781982421875, 0.65234375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 7.0, 6.0, 0.0, 4.0, 2.0, 4.0, 10.0, 10.0, 10.0, 18.0, 29.0, 40.0, 57.0, 94.0, 100.0, 142.0, 117.0, 88.0, 74.0, 54.0, 37.0, 28.0, 11.0, 9.0, 6.0, 11.0, 10.0, 2.0, 4.0, 5.0, 3.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023865699768066406, -0.0002297535538673401, -0.0002208501100540161, -0.00021194666624069214, -0.00020304322242736816, -0.0001941397786140442, -0.00018523633480072021, -0.00017633289098739624, -0.00016742944717407227, -0.0001585260033607483, -0.00014962255954742432, -0.00014071911573410034, -0.00013181567192077637, -0.0001229122281074524, -0.00011400878429412842, -0.00010510534048080444, -9.620189666748047e-05, -8.72984528541565e-05, -7.839500904083252e-05, -6.949156522750854e-05, -6.058812141418457e-05, -5.1684677600860596e-05, -4.278123378753662e-05, -3.3877789974212646e-05, -2.4974346160888672e-05, -1.6070902347564697e-05, -7.167458534240723e-06, 1.735985279083252e-06, 1.0639429092407227e-05, 1.95428729057312e-05, 2.8446316719055176e-05, 3.734976053237915e-05, 4.6253204345703125e-05, 5.51566481590271e-05, 6.406009197235107e-05, 7.296353578567505e-05, 8.186697959899902e-05, 9.0770423412323e-05, 9.967386722564697e-05, 0.00010857731103897095, 0.00011748075485229492, 0.0001263841986656189, 0.00013528764247894287, 0.00014419108629226685, 0.00015309453010559082, 0.0001619979739189148, 0.00017090141773223877, 0.00017980486154556274, 0.00018870830535888672, 0.0001976117491722107, 0.00020651519298553467, 0.00021541863679885864, 0.00022432208061218262, 0.0002332255244255066, 0.00024212896823883057, 0.00025103241205215454, 0.0002599358558654785, 0.0002688392996788025, 0.00027774274349212646, 0.00028664618730545044, 0.0002955496311187744, 0.0003044530749320984, 0.00031335651874542236, 0.00032225996255874634, 0.0003311634063720703]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 5.0, 8.0, 13.0, 22.0, 15.0, 18.0, 53.0, 39.0, 92.0, 158.0, 191.0, 322.0, 536.0, 1081.0, 2124.0, 4761.0, 11705.0, 30209.0, 91049.0, 294288.0, 389445.0, 147668.0, 45196.0, 16796.0, 6666.0, 2853.0, 1352.0, 698.0, 419.0, 278.0, 159.0, 106.0, 61.0, 48.0, 41.0, 23.0, 22.0, 8.0, 7.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.81982421875, -0.7907485961914062, -0.7616729736328125, -0.7325973510742188, -0.703521728515625, -0.6744461059570312, -0.6453704833984375, -0.6162948608398438, -0.58721923828125, -0.5581436157226562, -0.5290679931640625, -0.49999237060546875, -0.470916748046875, -0.44184112548828125, -0.4127655029296875, -0.38368988037109375, -0.3546142578125, -0.32553863525390625, -0.2964630126953125, -0.26738739013671875, -0.238311767578125, -0.20923614501953125, -0.1801605224609375, -0.15108489990234375, -0.12200927734375, -0.09293365478515625, -0.0638580322265625, -0.03478240966796875, -0.005706787109375, 0.02336883544921875, 0.0524444580078125, 0.08152008056640625, 0.110595703125, 0.13967132568359375, 0.1687469482421875, 0.19782257080078125, 0.226898193359375, 0.25597381591796875, 0.2850494384765625, 0.31412506103515625, 0.34320068359375, 0.37227630615234375, 0.4013519287109375, 0.43042755126953125, 0.459503173828125, 0.48857879638671875, 0.5176544189453125, 0.5467300415039062, 0.5758056640625, 0.6048812866210938, 0.6339569091796875, 0.6630325317382812, 0.692108154296875, 0.7211837768554688, 0.7502593994140625, 0.7793350219726562, 0.80841064453125, 0.8374862670898438, 0.8665618896484375, 0.8956375122070312, 0.924713134765625, 0.9537887573242188, 0.9828643798828125, 1.0119400024414062, 1.041015625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 1.0, 5.0, 6.0, 5.0, 1.0, 7.0, 4.0, 16.0, 28.0, 18.0, 40.0, 55.0, 74.0, 119.0, 151.0, 124.0, 103.0, 69.0, 51.0, 32.0, 27.0, 17.0, 19.0, 8.0, 7.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.169921875, -1.1263580322265625, -1.082794189453125, -1.0392303466796875, -0.99566650390625, -0.9521026611328125, -0.908538818359375, -0.8649749755859375, -0.8214111328125, -0.7778472900390625, -0.734283447265625, -0.6907196044921875, -0.64715576171875, -0.6035919189453125, -0.560028076171875, -0.5164642333984375, -0.472900390625, -0.4293365478515625, -0.385772705078125, -0.3422088623046875, -0.29864501953125, -0.2550811767578125, -0.211517333984375, -0.1679534912109375, -0.1243896484375, -0.0808258056640625, -0.037261962890625, 0.0063018798828125, 0.04986572265625, 0.0934295654296875, 0.136993408203125, 0.1805572509765625, 0.22412109375, 0.2676849365234375, 0.311248779296875, 0.3548126220703125, 0.39837646484375, 0.4419403076171875, 0.485504150390625, 0.5290679931640625, 0.5726318359375, 0.6161956787109375, 0.659759521484375, 0.7033233642578125, 0.74688720703125, 0.7904510498046875, 0.834014892578125, 0.8775787353515625, 0.921142578125, 0.9647064208984375, 1.008270263671875, 1.0518341064453125, 1.09539794921875, 1.1389617919921875, 1.182525634765625, 1.2260894775390625, 1.2696533203125, 1.3132171630859375, 1.356781005859375, 1.4003448486328125, 1.44390869140625, 1.4874725341796875, 1.531036376953125, 1.5746002197265625, 1.6181640625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 8.0, 24.0, 46.0, 134.0, 179.0, 208.0, 167.0, 111.0, 78.0, 20.0, 8.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1118745803833, -14.517218589782715, -13.922562599182129, -13.327905654907227, -12.73324966430664, -12.138593673706055, -11.543937683105469, -10.949281692504883, -10.354625701904297, -9.759969711303711, -9.165313720703125, -8.570657730102539, -7.976000785827637, -7.381344795227051, -6.786688804626465, -6.192032337188721, -5.597375869750977, -5.002719879150391, -4.4080634117126465, -3.8134074211120605, -3.2187511920928955, -2.6240949630737305, -2.0294389724731445, -1.4347825050354004, -0.8401265144348145, -0.2454703450202942, 0.3491858243942261, 0.9438419342041016, 1.5384981632232666, 2.1331543922424316, 2.7278103828430176, 3.3224668502807617, 3.917123794555664, 4.51177978515625, 5.106436252593994, 5.70109224319458, 6.295748710632324, 6.89040470123291, 7.485060691833496, 8.079717636108398, 8.674373626708984, 9.26902961730957, 9.863685607910156, 10.458341598510742, 11.052998542785645, 11.64765453338623, 12.242310523986816, 12.836967468261719, 13.431622505187988, 14.026278495788574, 14.62093448638916, 15.215591430664062, 15.810247421264648, 16.404903411865234, 16.99955940246582, 17.594215393066406, 18.188871383666992, 18.783527374267578, 19.378183364868164, 19.97283935546875, 20.567495346069336, 21.162151336669922, 21.75680923461914, 22.351465225219727, 22.946121215820312]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 2.0, 5.0, 7.0, 12.0, 9.0, 10.0, 15.0, 12.0, 18.0, 25.0, 19.0, 22.0, 34.0, 30.0, 35.0, 32.0, 46.0, 38.0, 35.0, 39.0, 41.0, 41.0, 36.0, 51.0, 34.0, 45.0, 29.0, 39.0, 35.0, 29.0, 28.0, 16.0, 24.0, 15.0, 16.0, 14.0, 13.0, 6.0, 11.0, 7.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.811169624328613, -6.602077960968018, -6.392985820770264, -6.183894157409668, -5.974802017211914, -5.765710353851318, -5.556618690490723, -5.347526550292969, -5.138434410095215, -4.929342746734619, -4.720250606536865, -4.5111589431762695, -4.302066802978516, -4.09297513961792, -3.883883237838745, -3.6747913360595703, -3.4656996726989746, -3.2566077709198, -3.047515869140625, -2.8384242057800293, -2.6293320655822754, -2.4202404022216797, -2.211148500442505, -2.00205659866333, -1.7929646968841553, -1.5838727951049805, -1.3747808933258057, -1.1656891107559204, -0.9565972089767456, -0.7475053071975708, -0.5384135246276855, -0.32932162284851074, -0.12022972106933594, 0.08886215090751648, 0.2979540228843689, 0.5070458650588989, 0.7161377668380737, 0.9252296686172485, 1.1343214511871338, 1.3434133529663086, 1.5525052547454834, 1.7615971565246582, 1.970689058303833, 2.179780960083008, 2.3888726234436035, 2.5979647636413574, 2.807056427001953, 3.016148328781128, 3.2252402305603027, 3.4343321323394775, 3.6434240341186523, 3.852515697479248, 4.061607837677002, 4.270699501037598, 4.479791641235352, 4.688883304595947, 4.897974967956543, 5.107066631317139, 5.316158771514893, 5.525250434875488, 5.734342575073242, 5.943434238433838, 6.152525901794434, 6.3616180419921875, 6.570710182189941]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 13.0, 16.0, 21.0, 40.0, 70.0, 105.0, 141.0, 258.0, 425.0, 782.0, 1441.0, 2842.0, 5743.0, 11138.0, 22690.0, 47146.0, 101349.0, 237928.0, 624682.0, 1293226.0, 1073829.0, 448005.0, 174542.0, 76328.0, 35820.0, 17391.0, 8732.0, 4462.0, 2283.0, 1301.0, 592.0, 359.0, 226.0, 125.0, 72.0, 41.0, 34.0, 21.0, 16.0, 17.0, 7.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94677734375, -0.9150314331054688, -0.8832855224609375, -0.8515396118164062, -0.819793701171875, -0.7880477905273438, -0.7563018798828125, -0.7245559692382812, -0.69281005859375, -0.6610641479492188, -0.6293182373046875, -0.5975723266601562, -0.565826416015625, -0.5340805053710938, -0.5023345947265625, -0.47058868408203125, -0.4388427734375, -0.40709686279296875, -0.3753509521484375, -0.34360504150390625, -0.311859130859375, -0.28011322021484375, -0.2483673095703125, -0.21662139892578125, -0.18487548828125, -0.15312957763671875, -0.1213836669921875, -0.08963775634765625, -0.057891845703125, -0.02614593505859375, 0.0055999755859375, 0.03734588623046875, 0.069091796875, 0.10083770751953125, 0.1325836181640625, 0.16432952880859375, 0.196075439453125, 0.22782135009765625, 0.2595672607421875, 0.29131317138671875, 0.32305908203125, 0.35480499267578125, 0.3865509033203125, 0.41829681396484375, 0.450042724609375, 0.48178863525390625, 0.5135345458984375, 0.5452804565429688, 0.5770263671875, 0.6087722778320312, 0.6405181884765625, 0.6722640991210938, 0.704010009765625, 0.7357559204101562, 0.7675018310546875, 0.7992477416992188, 0.83099365234375, 0.8627395629882812, 0.8944854736328125, 0.9262313842773438, 0.957977294921875, 0.9897232055664062, 1.0214691162109375, 1.0532150268554688, 1.0849609375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 9.0, 8.0, 11.0, 14.0, 13.0, 22.0, 13.0, 28.0, 17.0, 15.0, 28.0, 25.0, 32.0, 36.0, 27.0, 33.0, 41.0, 31.0, 35.0, 47.0, 50.0, 47.0, 32.0, 46.0, 29.0, 31.0, 32.0, 33.0, 33.0, 26.0, 27.0, 23.0, 21.0, 16.0, 14.0, 9.0, 6.0, 10.0, 9.0, 2.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.79736328125, -0.7707061767578125, -0.744049072265625, -0.7173919677734375, -0.69073486328125, -0.6640777587890625, -0.637420654296875, -0.6107635498046875, -0.5841064453125, -0.5574493408203125, -0.530792236328125, -0.5041351318359375, -0.47747802734375, -0.4508209228515625, -0.424163818359375, -0.3975067138671875, -0.370849609375, -0.3441925048828125, -0.317535400390625, -0.2908782958984375, -0.26422119140625, -0.2375640869140625, -0.210906982421875, -0.1842498779296875, -0.1575927734375, -0.1309356689453125, -0.104278564453125, -0.0776214599609375, -0.05096435546875, -0.0243072509765625, 0.002349853515625, 0.0290069580078125, 0.0556640625, 0.0823211669921875, 0.108978271484375, 0.1356353759765625, 0.16229248046875, 0.1889495849609375, 0.215606689453125, 0.2422637939453125, 0.2689208984375, 0.2955780029296875, 0.322235107421875, 0.3488922119140625, 0.37554931640625, 0.4022064208984375, 0.428863525390625, 0.4555206298828125, 0.482177734375, 0.5088348388671875, 0.535491943359375, 0.5621490478515625, 0.58880615234375, 0.6154632568359375, 0.642120361328125, 0.6687774658203125, 0.6954345703125, 0.7220916748046875, 0.748748779296875, 0.7754058837890625, 0.80206298828125, 0.8287200927734375, 0.855377197265625, 0.8820343017578125, 0.90869140625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 12.0, 16.0, 43.0, 68.0, 114.0, 195.0, 340.0, 715.0, 1690.0, 4219.0, 13193.0, 46430.0, 186021.0, 1002083.0, 2349227.0, 450260.0, 100308.0, 26180.0, 7957.0, 2805.0, 1156.0, 573.0, 292.0, 171.0, 83.0, 29.0, 35.0, 14.0, 15.0, 11.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.720703125, -2.645721435546875, -2.57073974609375, -2.495758056640625, -2.4207763671875, -2.345794677734375, -2.27081298828125, -2.195831298828125, -2.120849609375, -2.045867919921875, -1.97088623046875, -1.895904541015625, -1.8209228515625, -1.745941162109375, -1.67095947265625, -1.595977783203125, -1.52099609375, -1.446014404296875, -1.37103271484375, -1.296051025390625, -1.2210693359375, -1.146087646484375, -1.07110595703125, -0.996124267578125, -0.921142578125, -0.846160888671875, -0.77117919921875, -0.696197509765625, -0.6212158203125, -0.546234130859375, -0.47125244140625, -0.396270751953125, -0.3212890625, -0.246307373046875, -0.17132568359375, -0.096343994140625, -0.0213623046875, 0.053619384765625, 0.12860107421875, 0.203582763671875, 0.278564453125, 0.353546142578125, 0.42852783203125, 0.503509521484375, 0.5784912109375, 0.653472900390625, 0.72845458984375, 0.803436279296875, 0.87841796875, 0.953399658203125, 1.02838134765625, 1.103363037109375, 1.1783447265625, 1.253326416015625, 1.32830810546875, 1.403289794921875, 1.478271484375, 1.553253173828125, 1.62823486328125, 1.703216552734375, 1.7781982421875, 1.853179931640625, 1.92816162109375, 2.003143310546875, 2.078125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 6.0, 12.0, 10.0, 21.0, 15.0, 13.0, 37.0, 46.0, 60.0, 71.0, 114.0, 130.0, 184.0, 249.0, 386.0, 475.0, 553.0, 420.0, 363.0, 242.0, 178.0, 140.0, 76.0, 58.0, 55.0, 49.0, 27.0, 24.0, 18.0, 6.0, 10.0, 5.0, 9.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.96484375, -1.90008544921875, -1.8353271484375, -1.77056884765625, -1.705810546875, -1.64105224609375, -1.5762939453125, -1.51153564453125, -1.44677734375, -1.38201904296875, -1.3172607421875, -1.25250244140625, -1.187744140625, -1.12298583984375, -1.0582275390625, -0.99346923828125, -0.9287109375, -0.86395263671875, -0.7991943359375, -0.73443603515625, -0.669677734375, -0.60491943359375, -0.5401611328125, -0.47540283203125, -0.41064453125, -0.34588623046875, -0.2811279296875, -0.21636962890625, -0.151611328125, -0.08685302734375, -0.0220947265625, 0.04266357421875, 0.107421875, 0.17218017578125, 0.2369384765625, 0.30169677734375, 0.366455078125, 0.43121337890625, 0.4959716796875, 0.56072998046875, 0.62548828125, 0.69024658203125, 0.7550048828125, 0.81976318359375, 0.884521484375, 0.94927978515625, 1.0140380859375, 1.07879638671875, 1.1435546875, 1.20831298828125, 1.2730712890625, 1.33782958984375, 1.402587890625, 1.46734619140625, 1.5321044921875, 1.59686279296875, 1.66162109375, 1.72637939453125, 1.7911376953125, 1.85589599609375, 1.920654296875, 1.98541259765625, 2.0501708984375, 2.11492919921875, 2.1796875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 3.0, 8.0, 12.0, 9.0, 36.0, 58.0, 100.0, 161.0, 155.0, 153.0, 131.0, 80.0, 43.0, 21.0, 17.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.90761375427246, -22.30080795288086, -21.694002151489258, -21.087196350097656, -20.480392456054688, -19.873586654663086, -19.266780853271484, -18.659975051879883, -18.05316925048828, -17.44636344909668, -16.839557647705078, -16.232751846313477, -15.625946998596191, -15.01914119720459, -14.412336349487305, -13.805530548095703, -13.198724746704102, -12.5919189453125, -11.985113143920898, -11.378308296203613, -10.771502494812012, -10.16469669342041, -9.557891845703125, -8.951086044311523, -8.344280242919922, -7.73747444152832, -7.130669116973877, -6.523863792419434, -5.917057991027832, -5.3102521896362305, -4.703446865081787, -4.096641540527344, -3.4898338317871094, -2.883028268814087, -2.2762227058410645, -1.669417142868042, -1.0626115798950195, -0.45580601692199707, 0.1509995460510254, 0.7578048706054688, 1.3646106719970703, 1.9714162349700928, 2.5782217979431152, 3.1850273609161377, 3.79183292388916, 4.398638725280762, 5.005444049835205, 5.612249374389648, 6.21905517578125, 6.825860977172852, 7.432666301727295, 8.039471626281738, 8.64627742767334, 9.253083229064941, 9.859888076782227, 10.466693878173828, 11.07349967956543, 11.680305480957031, 12.287111282348633, 12.893916130065918, 13.50072193145752, 14.107527732849121, 14.714332580566406, 15.321138381958008, 15.92794418334961]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 5.0, 10.0, 8.0, 8.0, 10.0, 17.0, 15.0, 19.0, 24.0, 19.0, 39.0, 28.0, 34.0, 35.0, 42.0, 37.0, 36.0, 48.0, 60.0, 40.0, 53.0, 37.0, 46.0, 40.0, 40.0, 34.0, 31.0, 32.0, 26.0, 15.0, 26.0, 14.0, 14.0, 11.0, 9.0, 4.0, 10.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.668274402618408, -7.448633670806885, -7.228992462158203, -7.00935173034668, -6.789710521697998, -6.570069789886475, -6.350428581237793, -6.1307878494262695, -5.911147117614746, -5.691506385803223, -5.471865177154541, -5.252224445343018, -5.032583236694336, -4.8129425048828125, -4.593301773071289, -4.373660564422607, -4.154019355773926, -3.9343783855438232, -3.7147374153137207, -3.4950966835021973, -3.2754554748535156, -3.055814743041992, -2.8361737728118896, -2.616532802581787, -2.3968918323516846, -2.177250862121582, -1.9576098918914795, -1.7379690408706665, -1.518328070640564, -1.2986871004104614, -1.0790462493896484, -0.8594052791595459, -0.6397638320922852, -0.420122891664505, -0.20048195123672485, 0.01915895938873291, 0.23879992961883545, 0.458440899848938, 0.678081750869751, 0.8977227210998535, 1.117363691329956, 1.3370046615600586, 1.5566456317901611, 1.7762864828109741, 1.9959274530410767, 2.2155685424804688, 2.435209274291992, 2.6548502445220947, 2.8744912147521973, 3.0941321849823, 3.3137731552124023, 3.533413887023926, 3.7530550956726074, 3.972695827484131, 4.1923370361328125, 4.411977767944336, 4.631618499755859, 4.851259231567383, 5.0709004402160645, 5.290541172027588, 5.5101823806762695, 5.729823112487793, 5.949463844299316, 6.169105052947998, 6.38874626159668]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 1.0, 5.0, 10.0, 6.0, 15.0, 24.0, 33.0, 36.0, 68.0, 109.0, 160.0, 270.0, 394.0, 682.0, 1097.0, 1753.0, 2730.0, 4815.0, 8330.0, 15172.0, 27890.0, 52353.0, 92198.0, 146069.0, 187618.0, 182961.0, 136466.0, 83222.0, 46803.0, 25077.0, 13496.0, 7597.0, 4262.0, 2628.0, 1481.0, 1020.0, 616.0, 391.0, 237.0, 175.0, 90.0, 83.0, 42.0, 20.0, 17.0, 12.0, 9.0, 7.0, 5.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8583984375, -0.828704833984375, -0.79901123046875, -0.769317626953125, -0.7396240234375, -0.709930419921875, -0.68023681640625, -0.650543212890625, -0.620849609375, -0.591156005859375, -0.56146240234375, -0.531768798828125, -0.5020751953125, -0.472381591796875, -0.44268798828125, -0.412994384765625, -0.38330078125, -0.353607177734375, -0.32391357421875, -0.294219970703125, -0.2645263671875, -0.234832763671875, -0.20513916015625, -0.175445556640625, -0.145751953125, -0.116058349609375, -0.08636474609375, -0.056671142578125, -0.0269775390625, 0.002716064453125, 0.03240966796875, 0.062103271484375, 0.091796875, 0.121490478515625, 0.15118408203125, 0.180877685546875, 0.2105712890625, 0.240264892578125, 0.26995849609375, 0.299652099609375, 0.329345703125, 0.359039306640625, 0.38873291015625, 0.418426513671875, 0.4481201171875, 0.477813720703125, 0.50750732421875, 0.537200927734375, 0.56689453125, 0.596588134765625, 0.62628173828125, 0.655975341796875, 0.6856689453125, 0.715362548828125, 0.74505615234375, 0.774749755859375, 0.804443359375, 0.834136962890625, 0.86383056640625, 0.893524169921875, 0.9232177734375, 0.952911376953125, 0.98260498046875, 1.012298583984375, 1.0419921875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 3.0, 9.0, 7.0, 15.0, 10.0, 14.0, 17.0, 19.0, 20.0, 29.0, 26.0, 33.0, 33.0, 35.0, 25.0, 43.0, 57.0, 31.0, 39.0, 40.0, 46.0, 38.0, 41.0, 48.0, 44.0, 34.0, 21.0, 37.0, 39.0, 18.0, 26.0, 17.0, 17.0, 18.0, 12.0, 5.0, 4.0, 7.0, 6.0, 0.0, 3.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.93505859375, -0.9068832397460938, -0.8787078857421875, -0.8505325317382812, -0.822357177734375, -0.7941818237304688, -0.7660064697265625, -0.7378311157226562, -0.70965576171875, -0.6814804077148438, -0.6533050537109375, -0.6251296997070312, -0.596954345703125, -0.5687789916992188, -0.5406036376953125, -0.5124282836914062, -0.4842529296875, -0.45607757568359375, -0.4279022216796875, -0.39972686767578125, -0.371551513671875, -0.34337615966796875, -0.3152008056640625, -0.28702545166015625, -0.25885009765625, -0.23067474365234375, -0.2024993896484375, -0.17432403564453125, -0.146148681640625, -0.11797332763671875, -0.0897979736328125, -0.06162261962890625, -0.033447265625, -0.00527191162109375, 0.0229034423828125, 0.05107879638671875, 0.079254150390625, 0.10742950439453125, 0.1356048583984375, 0.16378021240234375, 0.19195556640625, 0.22013092041015625, 0.2483062744140625, 0.27648162841796875, 0.304656982421875, 0.33283233642578125, 0.3610076904296875, 0.38918304443359375, 0.4173583984375, 0.44553375244140625, 0.4737091064453125, 0.5018844604492188, 0.530059814453125, 0.5582351684570312, 0.5864105224609375, 0.6145858764648438, 0.64276123046875, 0.6709365844726562, 0.6991119384765625, 0.7272872924804688, 0.755462646484375, 0.7836380004882812, 0.8118133544921875, 0.8399887084960938, 0.8681640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 6.0, 11.0, 15.0, 21.0, 28.0, 44.0, 72.0, 99.0, 164.0, 307.0, 673.0, 1425.0, 3718.0, 10013.0, 30316.0, 101806.0, 292814.0, 368258.0, 164610.0, 49003.0, 15638.0, 5487.0, 2170.0, 882.0, 391.0, 223.0, 132.0, 63.0, 55.0, 32.0, 24.0, 15.0, 14.0, 2.0, 6.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.119140625, -2.0621795654296875, -2.005218505859375, -1.9482574462890625, -1.89129638671875, -1.8343353271484375, -1.777374267578125, -1.7204132080078125, -1.6634521484375, -1.6064910888671875, -1.549530029296875, -1.4925689697265625, -1.43560791015625, -1.3786468505859375, -1.321685791015625, -1.2647247314453125, -1.207763671875, -1.1508026123046875, -1.093841552734375, -1.0368804931640625, -0.97991943359375, -0.9229583740234375, -0.865997314453125, -0.8090362548828125, -0.7520751953125, -0.6951141357421875, -0.638153076171875, -0.5811920166015625, -0.52423095703125, -0.4672698974609375, -0.410308837890625, -0.3533477783203125, -0.29638671875, -0.2394256591796875, -0.182464599609375, -0.1255035400390625, -0.06854248046875, -0.0115814208984375, 0.045379638671875, 0.1023406982421875, 0.1593017578125, 0.2162628173828125, 0.273223876953125, 0.3301849365234375, 0.38714599609375, 0.4441070556640625, 0.501068115234375, 0.5580291748046875, 0.614990234375, 0.6719512939453125, 0.728912353515625, 0.7858734130859375, 0.84283447265625, 0.8997955322265625, 0.956756591796875, 1.0137176513671875, 1.0706787109375, 1.1276397705078125, 1.184600830078125, 1.2415618896484375, 1.29852294921875, 1.3554840087890625, 1.412445068359375, 1.4694061279296875, 1.5263671875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 5.0, 1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 6.0, 14.0, 11.0, 11.0, 16.0, 18.0, 20.0, 20.0, 23.0, 30.0, 27.0, 32.0, 34.0, 36.0, 37.0, 33.0, 41.0, 44.0, 45.0, 44.0, 50.0, 47.0, 36.0, 43.0, 31.0, 33.0, 31.0, 21.0, 24.0, 19.0, 18.0, 17.0, 14.0, 10.0, 5.0, 13.0, 7.0, 8.0, 9.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2109375, -2.1336669921875, -2.056396484375, -1.9791259765625, -1.90185546875, -1.8245849609375, -1.747314453125, -1.6700439453125, -1.5927734375, -1.5155029296875, -1.438232421875, -1.3609619140625, -1.28369140625, -1.2064208984375, -1.129150390625, -1.0518798828125, -0.974609375, -0.8973388671875, -0.820068359375, -0.7427978515625, -0.66552734375, -0.5882568359375, -0.510986328125, -0.4337158203125, -0.3564453125, -0.2791748046875, -0.201904296875, -0.1246337890625, -0.04736328125, 0.0299072265625, 0.107177734375, 0.1844482421875, 0.26171875, 0.3389892578125, 0.416259765625, 0.4935302734375, 0.57080078125, 0.6480712890625, 0.725341796875, 0.8026123046875, 0.8798828125, 0.9571533203125, 1.034423828125, 1.1116943359375, 1.18896484375, 1.2662353515625, 1.343505859375, 1.4207763671875, 1.498046875, 1.5753173828125, 1.652587890625, 1.7298583984375, 1.80712890625, 1.8843994140625, 1.961669921875, 2.0389404296875, 2.1162109375, 2.1934814453125, 2.270751953125, 2.3480224609375, 2.42529296875, 2.5025634765625, 2.579833984375, 2.6571044921875, 2.734375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 6.0, 6.0, 7.0, 20.0, 34.0, 43.0, 88.0, 128.0, 291.0, 485.0, 919.0, 1700.0, 3605.0, 7175.0, 15794.0, 34962.0, 78839.0, 164753.0, 258591.0, 236562.0, 132573.0, 61017.0, 27051.0, 12281.0, 5851.0, 2707.0, 1435.0, 749.0, 371.0, 221.0, 130.0, 73.0, 34.0, 23.0, 19.0, 4.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.58740234375, -0.5689544677734375, -0.550506591796875, -0.5320587158203125, -0.51361083984375, -0.4951629638671875, -0.476715087890625, -0.4582672119140625, -0.4398193359375, -0.4213714599609375, -0.402923583984375, -0.3844757080078125, -0.36602783203125, -0.3475799560546875, -0.329132080078125, -0.3106842041015625, -0.292236328125, -0.2737884521484375, -0.255340576171875, -0.2368927001953125, -0.21844482421875, -0.1999969482421875, -0.181549072265625, -0.1631011962890625, -0.1446533203125, -0.1262054443359375, -0.107757568359375, -0.0893096923828125, -0.07086181640625, -0.0524139404296875, -0.033966064453125, -0.0155181884765625, 0.0029296875, 0.0213775634765625, 0.039825439453125, 0.0582733154296875, 0.07672119140625, 0.0951690673828125, 0.113616943359375, 0.1320648193359375, 0.1505126953125, 0.1689605712890625, 0.187408447265625, 0.2058563232421875, 0.22430419921875, 0.2427520751953125, 0.261199951171875, 0.2796478271484375, 0.298095703125, 0.3165435791015625, 0.334991455078125, 0.3534393310546875, 0.37188720703125, 0.3903350830078125, 0.408782958984375, 0.4272308349609375, 0.4456787109375, 0.4641265869140625, 0.482574462890625, 0.5010223388671875, 0.51947021484375, 0.5379180908203125, 0.556365966796875, 0.5748138427734375, 0.59326171875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 8.0, 6.0, 4.0, 6.0, 11.0, 13.0, 19.0, 47.0, 55.0, 61.0, 95.0, 99.0, 99.0, 108.0, 83.0, 67.0, 60.0, 47.0, 33.0, 18.0, 13.0, 13.0, 13.0, 11.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001747608184814453, -0.00016773119568824768, -0.00016070157289505005, -0.00015367195010185242, -0.00014664232730865479, -0.00013961270451545715, -0.00013258308172225952, -0.0001255534589290619, -0.00011852383613586426, -0.00011149421334266663, -0.000104464590549469, -9.743496775627136e-05, -9.040534496307373e-05, -8.33757221698761e-05, -7.634609937667847e-05, -6.931647658348083e-05, -6.22868537902832e-05, -5.525723099708557e-05, -4.822760820388794e-05, -4.119798541069031e-05, -3.4168362617492676e-05, -2.7138739824295044e-05, -2.0109117031097412e-05, -1.307949423789978e-05, -6.0498714447021484e-06, 9.797513484954834e-07, 8.009374141693115e-06, 1.5038996934890747e-05, 2.206861972808838e-05, 2.909824252128601e-05, 3.612786531448364e-05, 4.3157488107681274e-05, 5.0187110900878906e-05, 5.721673369407654e-05, 6.424635648727417e-05, 7.12759792804718e-05, 7.830560207366943e-05, 8.533522486686707e-05, 9.23648476600647e-05, 9.939447045326233e-05, 0.00010642409324645996, 0.00011345371603965759, 0.00012048333883285522, 0.00012751296162605286, 0.0001345425844192505, 0.00014157220721244812, 0.00014860183000564575, 0.00015563145279884338, 0.00016266107559204102, 0.00016969069838523865, 0.00017672032117843628, 0.0001837499439716339, 0.00019077956676483154, 0.00019780918955802917, 0.0002048388123512268, 0.00021186843514442444, 0.00021889805793762207, 0.0002259276807308197, 0.00023295730352401733, 0.00023998692631721497, 0.0002470165491104126, 0.00025404617190361023, 0.00026107579469680786, 0.0002681054174900055, 0.0002751350402832031]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 2.0, 8.0, 9.0, 9.0, 10.0, 36.0, 50.0, 60.0, 110.0, 170.0, 280.0, 453.0, 778.0, 1378.0, 2540.0, 5014.0, 10111.0, 20954.0, 42074.0, 82772.0, 145617.0, 207594.0, 209304.0, 148639.0, 84163.0, 43390.0, 21496.0, 10491.0, 5105.0, 2670.0, 1364.0, 743.0, 438.0, 257.0, 156.0, 100.0, 78.0, 43.0, 32.0, 17.0, 13.0, 7.0, 11.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4345703125, -0.41905975341796875, -0.4035491943359375, -0.38803863525390625, -0.372528076171875, -0.35701751708984375, -0.3415069580078125, -0.32599639892578125, -0.31048583984375, -0.29497528076171875, -0.2794647216796875, -0.26395416259765625, -0.248443603515625, -0.23293304443359375, -0.2174224853515625, -0.20191192626953125, -0.1864013671875, -0.17089080810546875, -0.1553802490234375, -0.13986968994140625, -0.124359130859375, -0.10884857177734375, -0.0933380126953125, -0.07782745361328125, -0.06231689453125, -0.04680633544921875, -0.0312957763671875, -0.01578521728515625, -0.000274658203125, 0.01523590087890625, 0.0307464599609375, 0.04625701904296875, 0.061767578125, 0.07727813720703125, 0.0927886962890625, 0.10829925537109375, 0.123809814453125, 0.13932037353515625, 0.1548309326171875, 0.17034149169921875, 0.18585205078125, 0.20136260986328125, 0.2168731689453125, 0.23238372802734375, 0.247894287109375, 0.26340484619140625, 0.2789154052734375, 0.29442596435546875, 0.3099365234375, 0.32544708251953125, 0.3409576416015625, 0.35646820068359375, 0.371978759765625, 0.38748931884765625, 0.4029998779296875, 0.41851043701171875, 0.43402099609375, 0.44953155517578125, 0.4650421142578125, 0.48055267333984375, 0.496063232421875, 0.5115737915039062, 0.5270843505859375, 0.5425949096679688, 0.55810546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 13.0, 11.0, 16.0, 21.0, 24.0, 19.0, 39.0, 40.0, 46.0, 51.0, 56.0, 59.0, 74.0, 63.0, 41.0, 61.0, 60.0, 47.0, 42.0, 45.0, 33.0, 25.0, 18.0, 16.0, 11.0, 12.0, 9.0, 7.0, 5.0, 7.0, 6.0, 4.0, 8.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.66162109375, -0.6423416137695312, -0.6230621337890625, -0.6037826538085938, -0.584503173828125, -0.5652236938476562, -0.5459442138671875, -0.5266647338867188, -0.50738525390625, -0.48810577392578125, -0.4688262939453125, -0.44954681396484375, -0.430267333984375, -0.41098785400390625, -0.3917083740234375, -0.37242889404296875, -0.3531494140625, -0.33386993408203125, -0.3145904541015625, -0.29531097412109375, -0.276031494140625, -0.25675201416015625, -0.2374725341796875, -0.21819305419921875, -0.19891357421875, -0.17963409423828125, -0.1603546142578125, -0.14107513427734375, -0.121795654296875, -0.10251617431640625, -0.0832366943359375, -0.06395721435546875, -0.044677734375, -0.02539825439453125, -0.0061187744140625, 0.01316070556640625, 0.032440185546875, 0.05171966552734375, 0.0709991455078125, 0.09027862548828125, 0.10955810546875, 0.12883758544921875, 0.1481170654296875, 0.16739654541015625, 0.186676025390625, 0.20595550537109375, 0.2252349853515625, 0.24451446533203125, 0.2637939453125, 0.28307342529296875, 0.3023529052734375, 0.32163238525390625, 0.340911865234375, 0.36019134521484375, 0.3794708251953125, 0.39875030517578125, 0.41802978515625, 0.43730926513671875, 0.4565887451171875, 0.47586822509765625, 0.495147705078125, 0.5144271850585938, 0.5337066650390625, 0.5529861450195312, 0.572265625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 18.0, 31.0, 48.0, 90.0, 127.0, 130.0, 133.0, 156.0, 80.0, 74.0, 41.0, 24.0, 12.0, 6.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.372556686401367, -5.060115337371826, -4.747673988342285, -4.435232639312744, -4.122791290283203, -3.810349702835083, -3.497908115386963, -3.185466766357422, -2.873025417327881, -2.56058406829834, -2.248142719268799, -1.9357011318206787, -1.6232597827911377, -1.3108184337615967, -0.9983769655227661, -0.6859354972839355, -0.37349414825439453, -0.06105273962020874, 0.25138866901397705, 0.5638300776481628, 0.8762714862823486, 1.1887128353118896, 1.5011543035507202, 1.8135957717895508, 2.126037120819092, 2.438478469848633, 2.750919818878174, 3.063361406326294, 3.375802755355835, 3.688244104385376, 4.000685691833496, 4.313127040863037, 4.625567436218262, 4.938008785247803, 5.250450134277344, 5.562891483306885, 5.875332832336426, 6.187774658203125, 6.500216007232666, 6.812657356262207, 7.125098705291748, 7.437540054321289, 7.74998140335083, 8.062422752380371, 8.37486457824707, 8.687305450439453, 8.999747276306152, 9.312189102172852, 9.624629974365234, 9.937071800231934, 10.249512672424316, 10.561954498291016, 10.874395370483398, 11.186837196350098, 11.49927806854248, 11.81171989440918, 12.124160766601562, 12.436602592468262, 12.749043464660645, 13.061485290527344, 13.373926162719727, 13.686367988586426, 13.998808860778809, 14.311250686645508, 14.623692512512207]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 7.0, 16.0, 7.0, 6.0, 18.0, 5.0, 14.0, 14.0, 20.0, 18.0, 26.0, 18.0, 31.0, 34.0, 37.0, 35.0, 28.0, 37.0, 41.0, 43.0, 35.0, 30.0, 50.0, 35.0, 32.0, 31.0, 34.0, 35.0, 32.0, 29.0, 17.0, 22.0, 21.0, 19.0, 11.0, 23.0, 10.0, 12.0, 15.0, 10.0, 3.0, 8.0, 3.0, 10.0, 5.0, 2.0, 3.0, 6.0, 0.0, 1.0, 3.0], "bins": [-6.211719512939453, -6.028163909912109, -5.844608306884766, -5.661052703857422, -5.477497100830078, -5.293941497802734, -5.110385894775391, -4.926830291748047, -4.743274688720703, -4.559719085693359, -4.376163482666016, -4.192607879638672, -4.009052276611328, -3.8254966735839844, -3.6419410705566406, -3.458385467529297, -3.274829864501953, -3.0912742614746094, -2.9077186584472656, -2.724163055419922, -2.540607452392578, -2.3570518493652344, -2.1734962463378906, -1.9899406433105469, -1.8063850402832031, -1.6228294372558594, -1.4392738342285156, -1.2557182312011719, -1.0721626281738281, -0.8886070251464844, -0.7050514221191406, -0.5214958190917969, -0.3379402160644531, -0.15438461303710938, 0.029170989990234375, 0.21272659301757812, 0.3962821960449219, 0.5798377990722656, 0.7633934020996094, 0.9469490051269531, 1.1305046081542969, 1.3140602111816406, 1.4976158142089844, 1.6811714172363281, 1.8647270202636719, 2.0482826232910156, 2.2318382263183594, 2.415393829345703, 2.598949432373047, 2.7825050354003906, 2.9660606384277344, 3.149616241455078, 3.333171844482422, 3.5167274475097656, 3.7002830505371094, 3.883838653564453, 4.067394256591797, 4.250949859619141, 4.434505462646484, 4.618061065673828, 4.801616668701172, 4.985172271728516, 5.168727874755859, 5.352283477783203, 5.535839080810547]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 6.0, 5.0, 4.0, 10.0, 9.0, 10.0, 12.0, 24.0, 28.0, 47.0, 82.0, 126.0, 175.0, 268.0, 420.0, 714.0, 1089.0, 1911.0, 3345.0, 6497.0, 12408.0, 24236.0, 52226.0, 116680.0, 285500.0, 710206.0, 1312083.0, 968084.0, 403301.0, 159558.0, 68494.0, 31806.0, 15732.0, 8155.0, 4475.0, 2638.0, 1423.0, 900.0, 555.0, 342.0, 240.0, 139.0, 104.0, 73.0, 51.0, 36.0, 20.0, 17.0, 13.0, 11.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8583984375, -0.8284759521484375, -0.798553466796875, -0.7686309814453125, -0.73870849609375, -0.7087860107421875, -0.678863525390625, -0.6489410400390625, -0.6190185546875, -0.5890960693359375, -0.559173583984375, -0.5292510986328125, -0.49932861328125, -0.4694061279296875, -0.439483642578125, -0.4095611572265625, -0.379638671875, -0.3497161865234375, -0.319793701171875, -0.2898712158203125, -0.25994873046875, -0.2300262451171875, -0.200103759765625, -0.1701812744140625, -0.1402587890625, -0.1103363037109375, -0.080413818359375, -0.0504913330078125, -0.02056884765625, 0.0093536376953125, 0.039276123046875, 0.0691986083984375, 0.09912109375, 0.1290435791015625, 0.158966064453125, 0.1888885498046875, 0.21881103515625, 0.2487335205078125, 0.278656005859375, 0.3085784912109375, 0.3385009765625, 0.3684234619140625, 0.398345947265625, 0.4282684326171875, 0.45819091796875, 0.4881134033203125, 0.518035888671875, 0.5479583740234375, 0.577880859375, 0.6078033447265625, 0.637725830078125, 0.6676483154296875, 0.69757080078125, 0.7274932861328125, 0.757415771484375, 0.7873382568359375, 0.8172607421875, 0.8471832275390625, 0.877105712890625, 0.9070281982421875, 0.93695068359375, 0.9668731689453125, 0.996795654296875, 1.0267181396484375, 1.056640625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 9.0, 6.0, 6.0, 10.0, 15.0, 15.0, 20.0, 21.0, 34.0, 30.0, 31.0, 38.0, 39.0, 40.0, 59.0, 60.0, 54.0, 58.0, 53.0, 47.0, 34.0, 44.0, 34.0, 33.0, 23.0, 24.0, 27.0, 28.0, 23.0, 13.0, 14.0, 13.0, 18.0, 9.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8642578125, -0.830291748046875, -0.79632568359375, -0.762359619140625, -0.7283935546875, -0.694427490234375, -0.66046142578125, -0.626495361328125, -0.592529296875, -0.558563232421875, -0.52459716796875, -0.490631103515625, -0.4566650390625, -0.422698974609375, -0.38873291015625, -0.354766845703125, -0.32080078125, -0.286834716796875, -0.25286865234375, -0.218902587890625, -0.1849365234375, -0.150970458984375, -0.11700439453125, -0.083038330078125, -0.049072265625, -0.015106201171875, 0.01885986328125, 0.052825927734375, 0.0867919921875, 0.120758056640625, 0.15472412109375, 0.188690185546875, 0.22265625, 0.256622314453125, 0.29058837890625, 0.324554443359375, 0.3585205078125, 0.392486572265625, 0.42645263671875, 0.460418701171875, 0.494384765625, 0.528350830078125, 0.56231689453125, 0.596282958984375, 0.6302490234375, 0.664215087890625, 0.69818115234375, 0.732147216796875, 0.76611328125, 0.800079345703125, 0.83404541015625, 0.868011474609375, 0.9019775390625, 0.935943603515625, 0.96990966796875, 1.003875732421875, 1.037841796875, 1.071807861328125, 1.10577392578125, 1.139739990234375, 1.1737060546875, 1.207672119140625, 1.24163818359375, 1.275604248046875, 1.3095703125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 6.0, 3.0, 11.0, 7.0, 21.0, 31.0, 43.0, 66.0, 81.0, 138.0, 204.0, 372.0, 620.0, 1143.0, 2249.0, 4502.0, 9730.0, 22876.0, 56528.0, 149849.0, 463056.0, 1653085.0, 1287901.0, 344289.0, 118085.0, 44790.0, 18552.0, 8139.0, 3737.0, 1855.0, 930.0, 534.0, 306.0, 193.0, 125.0, 75.0, 52.0, 31.0, 20.0, 10.0, 8.0, 7.0, 5.0, 8.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4287109375, -1.3838958740234375, -1.339080810546875, -1.2942657470703125, -1.24945068359375, -1.2046356201171875, -1.159820556640625, -1.1150054931640625, -1.0701904296875, -1.0253753662109375, -0.980560302734375, -0.9357452392578125, -0.89093017578125, -0.8461151123046875, -0.801300048828125, -0.7564849853515625, -0.711669921875, -0.6668548583984375, -0.622039794921875, -0.5772247314453125, -0.53240966796875, -0.4875946044921875, -0.442779541015625, -0.3979644775390625, -0.3531494140625, -0.3083343505859375, -0.263519287109375, -0.2187042236328125, -0.17388916015625, -0.1290740966796875, -0.084259033203125, -0.0394439697265625, 0.00537109375, 0.0501861572265625, 0.095001220703125, 0.1398162841796875, 0.18463134765625, 0.2294464111328125, 0.274261474609375, 0.3190765380859375, 0.3638916015625, 0.4087066650390625, 0.453521728515625, 0.4983367919921875, 0.54315185546875, 0.5879669189453125, 0.632781982421875, 0.6775970458984375, 0.722412109375, 0.7672271728515625, 0.812042236328125, 0.8568572998046875, 0.90167236328125, 0.9464874267578125, 0.991302490234375, 1.0361175537109375, 1.0809326171875, 1.1257476806640625, 1.170562744140625, 1.2153778076171875, 1.26019287109375, 1.3050079345703125, 1.349822998046875, 1.3946380615234375, 1.439453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 3.0, 19.0, 18.0, 18.0, 17.0, 27.0, 41.0, 46.0, 52.0, 60.0, 81.0, 135.0, 139.0, 212.0, 323.0, 434.0, 512.0, 470.0, 386.0, 284.0, 194.0, 144.0, 105.0, 72.0, 58.0, 55.0, 43.0, 34.0, 22.0, 16.0, 9.0, 9.0, 15.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.0, -1.947021484375, -1.89404296875, -1.841064453125, -1.7880859375, -1.735107421875, -1.68212890625, -1.629150390625, -1.576171875, -1.523193359375, -1.47021484375, -1.417236328125, -1.3642578125, -1.311279296875, -1.25830078125, -1.205322265625, -1.15234375, -1.099365234375, -1.04638671875, -0.993408203125, -0.9404296875, -0.887451171875, -0.83447265625, -0.781494140625, -0.728515625, -0.675537109375, -0.62255859375, -0.569580078125, -0.5166015625, -0.463623046875, -0.41064453125, -0.357666015625, -0.3046875, -0.251708984375, -0.19873046875, -0.145751953125, -0.0927734375, -0.039794921875, 0.01318359375, 0.066162109375, 0.119140625, 0.172119140625, 0.22509765625, 0.278076171875, 0.3310546875, 0.384033203125, 0.43701171875, 0.489990234375, 0.54296875, 0.595947265625, 0.64892578125, 0.701904296875, 0.7548828125, 0.807861328125, 0.86083984375, 0.913818359375, 0.966796875, 1.019775390625, 1.07275390625, 1.125732421875, 1.1787109375, 1.231689453125, 1.28466796875, 1.337646484375, 1.390625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 9.0, 11.0, 28.0, 81.0, 184.0, 269.0, 220.0, 132.0, 56.0, 8.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.04484558105469, -34.26356506347656, -33.48228454589844, -32.70100402832031, -31.91972541809082, -31.138444900512695, -30.35716438293457, -29.575885772705078, -28.794605255126953, -28.013324737548828, -27.232044219970703, -26.45076560974121, -25.669485092163086, -24.88820457458496, -24.106924057006836, -23.325645446777344, -22.54436492919922, -21.763084411621094, -20.98180389404297, -20.200525283813477, -19.41924476623535, -18.637964248657227, -17.8566837310791, -17.07540512084961, -16.29412269592285, -15.512842178344727, -14.731562614440918, -13.950282096862793, -13.169002532958984, -12.38772201538086, -11.606441497802734, -10.825161933898926, -10.043882369995117, -9.262601852416992, -8.481322288513184, -7.700041770935059, -6.91876220703125, -6.137481689453125, -5.356201648712158, -4.574921607971191, -3.7936415672302246, -3.012361526489258, -2.231081485748291, -1.4498012065887451, -0.6685211658477783, 0.11275887489318848, 0.8940391540527344, 1.6753191947937012, 2.456599235534668, 3.2378792762756348, 4.019159317016602, 4.800439834594727, 5.581719398498535, 6.36299991607666, 7.144279956817627, 7.925559997558594, 8.706840515136719, 9.488121032714844, 10.269400596618652, 11.050681114196777, 11.831960678100586, 12.613241195678711, 13.394521713256836, 14.175801277160645, 14.957080841064453]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 1.0, 6.0, 6.0, 5.0, 11.0, 13.0, 18.0, 13.0, 15.0, 9.0, 27.0, 34.0, 30.0, 37.0, 29.0, 41.0, 33.0, 47.0, 45.0, 33.0, 47.0, 33.0, 46.0, 44.0, 29.0, 44.0, 26.0, 33.0, 30.0, 26.0, 24.0, 27.0, 19.0, 20.0, 20.0, 16.0, 12.0, 9.0, 10.0, 8.0, 7.0, 2.0, 0.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.789765357971191, -5.6128973960876465, -5.436029434204102, -5.259161472320557, -5.082293510437012, -4.905425548553467, -4.728557586669922, -4.551690101623535, -4.374821662902832, -4.197953701019287, -4.021085739135742, -3.8442177772521973, -3.6673498153686523, -3.4904818534851074, -3.3136141300201416, -3.1367461681365967, -2.959878444671631, -2.783010482788086, -2.606142520904541, -2.429274559020996, -2.252406597137451, -2.0755386352539062, -1.8986709117889404, -1.7218029499053955, -1.5449349880218506, -1.3680670261383057, -1.1911990642547607, -1.0143312215805054, -0.8374632596969604, -0.6605952978134155, -0.48372745513916016, -0.30685949325561523, -0.1299910545349121, 0.046876877546310425, 0.22374480962753296, 0.4006127119064331, 0.577480673789978, 0.754348635673523, 0.9312164783477783, 1.1080844402313232, 1.2849524021148682, 1.461820363998413, 1.638688325881958, 1.8155561685562134, 1.9924241304397583, 2.1692919731140137, 2.3461599349975586, 2.5230278968811035, 2.6998958587646484, 2.8767638206481934, 3.0536317825317383, 3.230499744415283, 3.407367706298828, 3.584235668182373, 3.761103391647339, 3.937971353530884, 4.114839553833008, 4.291707515716553, 4.468575477600098, 4.645443439483643, 4.8223114013671875, 4.999179363250732, 5.176047325134277, 5.352914810180664, 5.529782772064209]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 8.0, 8.0, 11.0, 7.0, 14.0, 29.0, 50.0, 57.0, 116.0, 168.0, 323.0, 554.0, 1023.0, 1750.0, 3254.0, 5687.0, 10437.0, 20713.0, 47184.0, 118870.0, 265051.0, 302102.0, 155639.0, 61546.0, 25745.0, 12631.0, 6881.0, 3825.0, 2096.0, 1130.0, 692.0, 351.0, 196.0, 125.0, 95.0, 55.0, 40.0, 30.0, 19.0, 13.0, 12.0, 3.0, 6.0, 4.0, 0.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4775390625, -1.42852783203125, -1.3795166015625, -1.33050537109375, -1.281494140625, -1.23248291015625, -1.1834716796875, -1.13446044921875, -1.08544921875, -1.03643798828125, -0.9874267578125, -0.93841552734375, -0.889404296875, -0.84039306640625, -0.7913818359375, -0.74237060546875, -0.693359375, -0.64434814453125, -0.5953369140625, -0.54632568359375, -0.497314453125, -0.44830322265625, -0.3992919921875, -0.35028076171875, -0.30126953125, -0.25225830078125, -0.2032470703125, -0.15423583984375, -0.105224609375, -0.05621337890625, -0.0072021484375, 0.04180908203125, 0.0908203125, 0.13983154296875, 0.1888427734375, 0.23785400390625, 0.286865234375, 0.33587646484375, 0.3848876953125, 0.43389892578125, 0.48291015625, 0.53192138671875, 0.5809326171875, 0.62994384765625, 0.678955078125, 0.72796630859375, 0.7769775390625, 0.82598876953125, 0.875, 0.92401123046875, 0.9730224609375, 1.02203369140625, 1.071044921875, 1.12005615234375, 1.1690673828125, 1.21807861328125, 1.26708984375, 1.31610107421875, 1.3651123046875, 1.41412353515625, 1.463134765625, 1.51214599609375, 1.5611572265625, 1.61016845703125, 1.6591796875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 5.0, 9.0, 11.0, 7.0, 11.0, 11.0, 18.0, 15.0, 20.0, 23.0, 29.0, 35.0, 31.0, 35.0, 47.0, 45.0, 46.0, 54.0, 54.0, 45.0, 35.0, 37.0, 35.0, 50.0, 42.0, 43.0, 34.0, 32.0, 17.0, 25.0, 22.0, 9.0, 17.0, 12.0, 4.0, 9.0, 6.0, 5.0, 4.0, 5.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94482421875, -0.9131698608398438, -0.8815155029296875, -0.8498611450195312, -0.818206787109375, -0.7865524291992188, -0.7548980712890625, -0.7232437133789062, -0.69158935546875, -0.6599349975585938, -0.6282806396484375, -0.5966262817382812, -0.564971923828125, -0.5333175659179688, -0.5016632080078125, -0.47000885009765625, -0.4383544921875, -0.40670013427734375, -0.3750457763671875, -0.34339141845703125, -0.311737060546875, -0.28008270263671875, -0.2484283447265625, -0.21677398681640625, -0.18511962890625, -0.15346527099609375, -0.1218109130859375, -0.09015655517578125, -0.058502197265625, -0.02684783935546875, 0.0048065185546875, 0.03646087646484375, 0.068115234375, 0.09976959228515625, 0.1314239501953125, 0.16307830810546875, 0.194732666015625, 0.22638702392578125, 0.2580413818359375, 0.28969573974609375, 0.32135009765625, 0.35300445556640625, 0.3846588134765625, 0.41631317138671875, 0.447967529296875, 0.47962188720703125, 0.5112762451171875, 0.5429306030273438, 0.5745849609375, 0.6062393188476562, 0.6378936767578125, 0.6695480346679688, 0.701202392578125, 0.7328567504882812, 0.7645111083984375, 0.7961654663085938, 0.82781982421875, 0.8594741821289062, 0.8911285400390625, 0.9227828979492188, 0.954437255859375, 0.9860916137695312, 1.0177459716796875, 1.0494003295898438, 1.0810546875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 7.0, 10.0, 17.0, 24.0, 33.0, 50.0, 84.0, 175.0, 291.0, 613.0, 1213.0, 2576.0, 5433.0, 11772.0, 27536.0, 82051.0, 268580.0, 397917.0, 165274.0, 49954.0, 18797.0, 8282.0, 4018.0, 1909.0, 893.0, 509.0, 236.0, 122.0, 58.0, 46.0, 29.0, 24.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.99609375, -1.936126708984375, -1.87615966796875, -1.816192626953125, -1.7562255859375, -1.696258544921875, -1.63629150390625, -1.576324462890625, -1.516357421875, -1.456390380859375, -1.39642333984375, -1.336456298828125, -1.2764892578125, -1.216522216796875, -1.15655517578125, -1.096588134765625, -1.03662109375, -0.976654052734375, -0.91668701171875, -0.856719970703125, -0.7967529296875, -0.736785888671875, -0.67681884765625, -0.616851806640625, -0.556884765625, -0.496917724609375, -0.43695068359375, -0.376983642578125, -0.3170166015625, -0.257049560546875, -0.19708251953125, -0.137115478515625, -0.0771484375, -0.017181396484375, 0.04278564453125, 0.102752685546875, 0.1627197265625, 0.222686767578125, 0.28265380859375, 0.342620849609375, 0.402587890625, 0.462554931640625, 0.52252197265625, 0.582489013671875, 0.6424560546875, 0.702423095703125, 0.76239013671875, 0.822357177734375, 0.88232421875, 0.942291259765625, 1.00225830078125, 1.062225341796875, 1.1221923828125, 1.182159423828125, 1.24212646484375, 1.302093505859375, 1.362060546875, 1.422027587890625, 1.48199462890625, 1.541961669921875, 1.6019287109375, 1.661895751953125, 1.72186279296875, 1.781829833984375, 1.841796875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 7.0, 8.0, 11.0, 7.0, 8.0, 12.0, 20.0, 19.0, 13.0, 16.0, 23.0, 32.0, 35.0, 32.0, 33.0, 39.0, 39.0, 41.0, 50.0, 46.0, 34.0, 54.0, 45.0, 47.0, 27.0, 31.0, 41.0, 44.0, 33.0, 25.0, 24.0, 15.0, 12.0, 13.0, 11.0, 12.0, 10.0, 7.0, 9.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.880859375, -2.79473876953125, -2.7086181640625, -2.62249755859375, -2.536376953125, -2.45025634765625, -2.3641357421875, -2.27801513671875, -2.19189453125, -2.10577392578125, -2.0196533203125, -1.93353271484375, -1.847412109375, -1.76129150390625, -1.6751708984375, -1.58905029296875, -1.5029296875, -1.41680908203125, -1.3306884765625, -1.24456787109375, -1.158447265625, -1.07232666015625, -0.9862060546875, -0.90008544921875, -0.81396484375, -0.72784423828125, -0.6417236328125, -0.55560302734375, -0.469482421875, -0.38336181640625, -0.2972412109375, -0.21112060546875, -0.125, -0.03887939453125, 0.0472412109375, 0.13336181640625, 0.219482421875, 0.30560302734375, 0.3917236328125, 0.47784423828125, 0.56396484375, 0.65008544921875, 0.7362060546875, 0.82232666015625, 0.908447265625, 0.99456787109375, 1.0806884765625, 1.16680908203125, 1.2529296875, 1.33905029296875, 1.4251708984375, 1.51129150390625, 1.597412109375, 1.68353271484375, 1.7696533203125, 1.85577392578125, 1.94189453125, 2.02801513671875, 2.1141357421875, 2.20025634765625, 2.286376953125, 2.37249755859375, 2.4586181640625, 2.54473876953125, 2.630859375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 9.0, 18.0, 22.0, 32.0, 58.0, 77.0, 134.0, 255.0, 412.0, 683.0, 1136.0, 1734.0, 2792.0, 4475.0, 7450.0, 12558.0, 21397.0, 39022.0, 73012.0, 133776.0, 212862.0, 217948.0, 142170.0, 78277.0, 41947.0, 22975.0, 13173.0, 7747.0, 4633.0, 2979.0, 1908.0, 1082.0, 721.0, 435.0, 249.0, 156.0, 100.0, 68.0, 26.0, 16.0, 16.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.48583984375, -0.4730720520019531, -0.46030426025390625, -0.4475364685058594, -0.4347686767578125, -0.4220008850097656, -0.40923309326171875, -0.3964653015136719, -0.383697509765625, -0.3709297180175781, -0.35816192626953125, -0.3453941345214844, -0.3326263427734375, -0.3198585510253906, -0.30709075927734375, -0.2943229675292969, -0.28155517578125, -0.2687873840332031, -0.25601959228515625, -0.24325180053710938, -0.2304840087890625, -0.21771621704101562, -0.20494842529296875, -0.19218063354492188, -0.179412841796875, -0.16664505004882812, -0.15387725830078125, -0.14110946655273438, -0.1283416748046875, -0.11557388305664062, -0.10280609130859375, -0.09003829956054688, -0.0772705078125, -0.06450271606445312, -0.05173492431640625, -0.038967132568359375, -0.0261993408203125, -0.013431549072265625, -0.00066375732421875, 0.012104034423828125, 0.024871826171875, 0.037639617919921875, 0.05040740966796875, 0.06317520141601562, 0.0759429931640625, 0.08871078491210938, 0.10147857666015625, 0.11424636840820312, 0.12701416015625, 0.13978195190429688, 0.15254974365234375, 0.16531753540039062, 0.1780853271484375, 0.19085311889648438, 0.20362091064453125, 0.21638870239257812, 0.229156494140625, 0.24192428588867188, 0.25469207763671875, 0.2674598693847656, 0.2802276611328125, 0.2929954528808594, 0.30576324462890625, 0.3185310363769531, 0.331298828125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 6.0, 5.0, 6.0, 6.0, 18.0, 24.0, 25.0, 45.0, 57.0, 90.0, 126.0, 133.0, 121.0, 103.0, 79.0, 40.0, 32.0, 23.0, 20.0, 9.0, 7.0, 4.0, 5.0, 7.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002391338348388672, -0.00023109093308448792, -0.00022304803133010864, -0.00021500512957572937, -0.0002069622278213501, -0.00019891932606697083, -0.00019087642431259155, -0.00018283352255821228, -0.000174790620803833, -0.00016674771904945374, -0.00015870481729507446, -0.0001506619155406952, -0.00014261901378631592, -0.00013457611203193665, -0.00012653321027755737, -0.0001184903085231781, -0.00011044740676879883, -0.00010240450501441956, -9.436160326004028e-05, -8.631870150566101e-05, -7.827579975128174e-05, -7.023289799690247e-05, -6.21899962425232e-05, -5.414709448814392e-05, -4.610419273376465e-05, -3.8061290979385376e-05, -3.0018389225006104e-05, -2.197548747062683e-05, -1.3932585716247559e-05, -5.889683961868286e-06, 2.1532177925109863e-06, 1.0196119546890259e-05, 1.823902130126953e-05, 2.6281923055648804e-05, 3.4324824810028076e-05, 4.236772656440735e-05, 5.041062831878662e-05, 5.8453530073165894e-05, 6.649643182754517e-05, 7.453933358192444e-05, 8.258223533630371e-05, 9.062513709068298e-05, 9.866803884506226e-05, 0.00010671094059944153, 0.0001147538423538208, 0.00012279674410820007, 0.00013083964586257935, 0.00013888254761695862, 0.0001469254493713379, 0.00015496835112571716, 0.00016301125288009644, 0.0001710541546344757, 0.00017909705638885498, 0.00018713995814323425, 0.00019518285989761353, 0.0002032257616519928, 0.00021126866340637207, 0.00021931156516075134, 0.00022735446691513062, 0.0002353973686695099, 0.00024344027042388916, 0.00025148317217826843, 0.0002595260739326477, 0.000267568975687027, 0.00027561187744140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 2.0, 11.0, 7.0, 17.0, 19.0, 27.0, 50.0, 55.0, 89.0, 135.0, 237.0, 406.0, 668.0, 1122.0, 1925.0, 3028.0, 5185.0, 8470.0, 13993.0, 23158.0, 38375.0, 63120.0, 99417.0, 144948.0, 173105.0, 159447.0, 117256.0, 76217.0, 46457.0, 28283.0, 17249.0, 10203.0, 6318.0, 3753.0, 2204.0, 1377.0, 820.0, 517.0, 343.0, 192.0, 112.0, 73.0, 46.0, 42.0, 24.0, 20.0, 7.0, 6.0, 9.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.3447265625, -0.3341827392578125, -0.323638916015625, -0.3130950927734375, -0.30255126953125, -0.2920074462890625, -0.281463623046875, -0.2709197998046875, -0.2603759765625, -0.2498321533203125, -0.239288330078125, -0.2287445068359375, -0.21820068359375, -0.2076568603515625, -0.197113037109375, -0.1865692138671875, -0.176025390625, -0.1654815673828125, -0.154937744140625, -0.1443939208984375, -0.13385009765625, -0.1233062744140625, -0.112762451171875, -0.1022186279296875, -0.0916748046875, -0.0811309814453125, -0.070587158203125, -0.0600433349609375, -0.04949951171875, -0.0389556884765625, -0.028411865234375, -0.0178680419921875, -0.00732421875, 0.0032196044921875, 0.013763427734375, 0.0243072509765625, 0.03485107421875, 0.0453948974609375, 0.055938720703125, 0.0664825439453125, 0.0770263671875, 0.0875701904296875, 0.098114013671875, 0.1086578369140625, 0.11920166015625, 0.1297454833984375, 0.140289306640625, 0.1508331298828125, 0.161376953125, 0.1719207763671875, 0.182464599609375, 0.1930084228515625, 0.20355224609375, 0.2140960693359375, 0.224639892578125, 0.2351837158203125, 0.2457275390625, 0.2562713623046875, 0.266815185546875, 0.2773590087890625, 0.28790283203125, 0.2984466552734375, 0.308990478515625, 0.3195343017578125, 0.330078125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 5.0, 4.0, 3.0, 4.0, 12.0, 6.0, 12.0, 9.0, 14.0, 22.0, 17.0, 16.0, 23.0, 32.0, 36.0, 35.0, 49.0, 39.0, 44.0, 56.0, 58.0, 62.0, 61.0, 41.0, 50.0, 36.0, 32.0, 33.0, 30.0, 28.0, 32.0, 19.0, 14.0, 12.0, 9.0, 8.0, 7.0, 5.0, 7.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.477783203125, -0.4620857238769531, -0.44638824462890625, -0.4306907653808594, -0.4149932861328125, -0.3992958068847656, -0.38359832763671875, -0.3679008483886719, -0.352203369140625, -0.3365058898925781, -0.32080841064453125, -0.3051109313964844, -0.2894134521484375, -0.2737159729003906, -0.25801849365234375, -0.24232101440429688, -0.22662353515625, -0.21092605590820312, -0.19522857666015625, -0.17953109741210938, -0.1638336181640625, -0.14813613891601562, -0.13243865966796875, -0.11674118041992188, -0.101043701171875, -0.08534622192382812, -0.06964874267578125, -0.053951263427734375, -0.0382537841796875, -0.022556304931640625, -0.00685882568359375, 0.008838653564453125, 0.0245361328125, 0.040233612060546875, 0.05593109130859375, 0.07162857055664062, 0.0873260498046875, 0.10302352905273438, 0.11872100830078125, 0.13441848754882812, 0.150115966796875, 0.16581344604492188, 0.18151092529296875, 0.19720840454101562, 0.2129058837890625, 0.22860336303710938, 0.24430084228515625, 0.2599983215332031, 0.27569580078125, 0.2913932800292969, 0.30709075927734375, 0.3227882385253906, 0.3384857177734375, 0.3541831970214844, 0.36988067626953125, 0.3855781555175781, 0.401275634765625, 0.4169731140136719, 0.43267059326171875, 0.4483680725097656, 0.4640655517578125, 0.4797630310058594, 0.49546051025390625, 0.5111579895019531, 0.52685546875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 13.0, 18.0, 63.0, 102.0, 194.0, 198.0, 179.0, 104.0, 66.0, 26.0, 14.0, 5.0, 3.0, 1.0, 1.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.745363235473633, -15.276466369628906, -14.80756950378418, -14.33867359161377, -13.869776725769043, -13.400879859924316, -12.931983947753906, -12.46308708190918, -11.994190216064453, -11.525293350219727, -11.056396484375, -10.58750057220459, -10.118603706359863, -9.649706840515137, -9.180810928344727, -8.7119140625, -8.243017196655273, -7.774120330810547, -7.3052239418029785, -6.83632755279541, -6.367430686950684, -5.898533821105957, -5.429637432098389, -4.96074104309082, -4.491844177246094, -4.022947311401367, -3.554050922393799, -3.0851542949676514, -2.616257667541504, -2.1473610401153564, -1.678464412689209, -1.2095677852630615, -0.7406711578369141, -0.2717745304107666, 0.19712209701538086, 0.6660187244415283, 1.1349153518676758, 1.6038119792938232, 2.0727086067199707, 2.541605234146118, 3.0105018615722656, 3.479398488998413, 3.9482951164245605, 4.417191505432129, 4.8860883712768555, 5.354985237121582, 5.82388162612915, 6.292778015136719, 6.761674880981445, 7.230571746826172, 7.69946813583374, 8.168364524841309, 8.637261390686035, 9.106158256530762, 9.575054168701172, 10.043951034545898, 10.512847900390625, 10.981744766235352, 11.450641632080078, 11.919537544250488, 12.388434410095215, 12.857331275939941, 13.326227188110352, 13.795124053955078, 14.264020919799805]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 5.0, 10.0, 5.0, 7.0, 10.0, 9.0, 16.0, 18.0, 16.0, 19.0, 13.0, 24.0, 20.0, 30.0, 34.0, 34.0, 24.0, 46.0, 40.0, 43.0, 46.0, 39.0, 44.0, 49.0, 35.0, 43.0, 38.0, 39.0, 35.0, 21.0, 28.0, 24.0, 14.0, 31.0, 19.0, 12.0, 14.0, 11.0, 10.0, 7.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-7.305245399475098, -7.0897135734558105, -6.874182224273682, -6.6586503982543945, -6.443118572235107, -6.22758674621582, -6.012055397033691, -5.796523571014404, -5.580991744995117, -5.36545991897583, -5.149928569793701, -4.934396743774414, -4.718864917755127, -4.50333309173584, -4.287801742553711, -4.072269916534424, -3.856738567352295, -3.641206979751587, -3.4256751537323, -3.210143566131592, -2.9946117401123047, -2.7790801525115967, -2.5635485649108887, -2.3480167388916016, -2.1324851512908936, -1.916953444480896, -1.7014217376708984, -1.4858901500701904, -1.2703584432601929, -1.0548267364501953, -0.8392951488494873, -0.6237634420394897, -0.4082317352294922, -0.19270005822181702, 0.022831618785858154, 0.23836326599121094, 0.4538949728012085, 0.669426679611206, 0.8849582672119141, 1.1004899740219116, 1.3160216808319092, 1.5315533876419067, 1.7470850944519043, 1.9626166820526123, 2.1781482696533203, 2.3936800956726074, 2.6092116832733154, 2.8247432708740234, 3.0402750968933105, 3.2558066844940186, 3.4713385105133057, 3.6868700981140137, 3.902401924133301, 4.11793327331543, 4.333465099334717, 4.548996925354004, 4.764528274536133, 4.98006010055542, 5.195591449737549, 5.411123275756836, 5.626655101776123, 5.84218692779541, 6.057718276977539, 6.273250102996826, 6.488781929016113]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 10.0, 10.0, 18.0, 27.0, 45.0, 55.0, 67.0, 132.0, 202.0, 349.0, 643.0, 1243.0, 2597.0, 6393.0, 17050.0, 51092.0, 172535.0, 625411.0, 1568591.0, 1213439.0, 377684.0, 103796.0, 32456.0, 11595.0, 4649.0, 1976.0, 969.0, 487.0, 318.0, 152.0, 104.0, 62.0, 40.0, 25.0, 17.0, 14.0, 7.0, 6.0, 6.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2265625, -1.1839752197265625, -1.141387939453125, -1.0988006591796875, -1.05621337890625, -1.0136260986328125, -0.971038818359375, -0.9284515380859375, -0.8858642578125, -0.8432769775390625, -0.800689697265625, -0.7581024169921875, -0.71551513671875, -0.6729278564453125, -0.630340576171875, -0.5877532958984375, -0.545166015625, -0.5025787353515625, -0.459991455078125, -0.4174041748046875, -0.37481689453125, -0.3322296142578125, -0.289642333984375, -0.2470550537109375, -0.2044677734375, -0.1618804931640625, -0.119293212890625, -0.0767059326171875, -0.03411865234375, 0.0084686279296875, 0.051055908203125, 0.0936431884765625, 0.13623046875, 0.1788177490234375, 0.221405029296875, 0.2639923095703125, 0.30657958984375, 0.3491668701171875, 0.391754150390625, 0.4343414306640625, 0.4769287109375, 0.5195159912109375, 0.562103271484375, 0.6046905517578125, 0.64727783203125, 0.6898651123046875, 0.732452392578125, 0.7750396728515625, 0.817626953125, 0.8602142333984375, 0.902801513671875, 0.9453887939453125, 0.98797607421875, 1.0305633544921875, 1.073150634765625, 1.1157379150390625, 1.1583251953125, 1.2009124755859375, 1.243499755859375, 1.2860870361328125, 1.32867431640625, 1.3712615966796875, 1.413848876953125, 1.4564361572265625, 1.4990234375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 8.0, 6.0, 15.0, 10.0, 13.0, 16.0, 19.0, 18.0, 23.0, 20.0, 19.0, 35.0, 31.0, 34.0, 43.0, 46.0, 45.0, 40.0, 44.0, 34.0, 39.0, 51.0, 26.0, 26.0, 29.0, 30.0, 33.0, 33.0, 26.0, 22.0, 28.0, 19.0, 10.0, 21.0, 13.0, 8.0, 12.0, 9.0, 7.0, 3.0, 5.0, 5.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.93798828125, -0.9091110229492188, -0.8802337646484375, -0.8513565063476562, -0.822479248046875, -0.7936019897460938, -0.7647247314453125, -0.7358474731445312, -0.70697021484375, -0.6780929565429688, -0.6492156982421875, -0.6203384399414062, -0.591461181640625, -0.5625839233398438, -0.5337066650390625, -0.5048294067382812, -0.4759521484375, -0.44707489013671875, -0.4181976318359375, -0.38932037353515625, -0.360443115234375, -0.33156585693359375, -0.3026885986328125, -0.27381134033203125, -0.24493408203125, -0.21605682373046875, -0.1871795654296875, -0.15830230712890625, -0.129425048828125, -0.10054779052734375, -0.0716705322265625, -0.04279327392578125, -0.013916015625, 0.01496124267578125, 0.0438385009765625, 0.07271575927734375, 0.101593017578125, 0.13047027587890625, 0.1593475341796875, 0.18822479248046875, 0.21710205078125, 0.24597930908203125, 0.2748565673828125, 0.30373382568359375, 0.332611083984375, 0.36148834228515625, 0.3903656005859375, 0.41924285888671875, 0.4481201171875, 0.47699737548828125, 0.5058746337890625, 0.5347518920898438, 0.563629150390625, 0.5925064086914062, 0.6213836669921875, 0.6502609252929688, 0.67913818359375, 0.7080154418945312, 0.7368927001953125, 0.7657699584960938, 0.794647216796875, 0.8235244750976562, 0.8524017333984375, 0.8812789916992188, 0.91015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 7.0, 5.0, 7.0, 8.0, 9.0, 17.0, 34.0, 50.0, 67.0, 94.0, 146.0, 260.0, 410.0, 754.0, 1477.0, 2856.0, 6168.0, 14784.0, 38593.0, 109979.0, 363018.0, 1371365.0, 1622715.0, 452155.0, 132474.0, 45585.0, 17158.0, 7156.0, 3227.0, 1608.0, 830.0, 472.0, 282.0, 162.0, 105.0, 76.0, 40.0, 43.0, 35.0, 14.0, 16.0, 2.0, 4.0, 4.0, 11.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3095703125, -1.262939453125, -1.21630859375, -1.169677734375, -1.123046875, -1.076416015625, -1.02978515625, -0.983154296875, -0.9365234375, -0.889892578125, -0.84326171875, -0.796630859375, -0.75, -0.703369140625, -0.65673828125, -0.610107421875, -0.5634765625, -0.516845703125, -0.47021484375, -0.423583984375, -0.376953125, -0.330322265625, -0.28369140625, -0.237060546875, -0.1904296875, -0.143798828125, -0.09716796875, -0.050537109375, -0.00390625, 0.042724609375, 0.08935546875, 0.135986328125, 0.1826171875, 0.229248046875, 0.27587890625, 0.322509765625, 0.369140625, 0.415771484375, 0.46240234375, 0.509033203125, 0.5556640625, 0.602294921875, 0.64892578125, 0.695556640625, 0.7421875, 0.788818359375, 0.83544921875, 0.882080078125, 0.9287109375, 0.975341796875, 1.02197265625, 1.068603515625, 1.115234375, 1.161865234375, 1.20849609375, 1.255126953125, 1.3017578125, 1.348388671875, 1.39501953125, 1.441650390625, 1.48828125, 1.534912109375, 1.58154296875, 1.628173828125, 1.6748046875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 3.0, 3.0, 4.0, 6.0, 9.0, 4.0, 6.0, 11.0, 17.0, 27.0, 23.0, 33.0, 57.0, 80.0, 110.0, 159.0, 191.0, 263.0, 352.0, 467.0, 459.0, 472.0, 361.0, 241.0, 197.0, 143.0, 101.0, 70.0, 52.0, 31.0, 35.0, 19.0, 17.0, 11.0, 9.0, 10.0, 6.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.462890625, -1.407501220703125, -1.35211181640625, -1.296722412109375, -1.2413330078125, -1.185943603515625, -1.13055419921875, -1.075164794921875, -1.019775390625, -0.964385986328125, -0.90899658203125, -0.853607177734375, -0.7982177734375, -0.742828369140625, -0.68743896484375, -0.632049560546875, -0.57666015625, -0.521270751953125, -0.46588134765625, -0.410491943359375, -0.3551025390625, -0.299713134765625, -0.24432373046875, -0.188934326171875, -0.133544921875, -0.078155517578125, -0.02276611328125, 0.032623291015625, 0.0880126953125, 0.143402099609375, 0.19879150390625, 0.254180908203125, 0.3095703125, 0.364959716796875, 0.42034912109375, 0.475738525390625, 0.5311279296875, 0.586517333984375, 0.64190673828125, 0.697296142578125, 0.752685546875, 0.808074951171875, 0.86346435546875, 0.918853759765625, 0.9742431640625, 1.029632568359375, 1.08502197265625, 1.140411376953125, 1.19580078125, 1.251190185546875, 1.30657958984375, 1.361968994140625, 1.4173583984375, 1.472747802734375, 1.52813720703125, 1.583526611328125, 1.638916015625, 1.694305419921875, 1.74969482421875, 1.805084228515625, 1.8604736328125, 1.915863037109375, 1.97125244140625, 2.026641845703125, 2.08203125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 6.0, 10.0, 23.0, 57.0, 106.0, 119.0, 175.0, 160.0, 147.0, 88.0, 47.0, 37.0, 9.0, 11.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.425603866577148, -11.926655769348145, -11.427706718444824, -10.92875862121582, -10.429810523986816, -9.930862426757812, -9.431913375854492, -8.932965278625488, -8.434017181396484, -7.935068607330322, -7.436120510101318, -6.937171936035156, -6.438223838806152, -5.93927526473999, -5.440326690673828, -4.941378593444824, -4.442430019378662, -3.943481683731079, -3.444533348083496, -2.945584774017334, -2.44663667678833, -1.947688102722168, -1.448739767074585, -0.949791431427002, -0.45084309577941895, 0.04810526967048645, 0.5470536351203918, 1.0460020303726196, 1.5449503660202026, 2.043898820877075, 2.542847156524658, 3.041795492172241, 3.540743827819824, 4.039692401885986, 4.53864049911499, 5.037589073181152, 5.536537170410156, 6.035485744476318, 6.5344343185424805, 7.033382415771484, 7.532330513000488, 8.031278610229492, 8.530227661132812, 9.029175758361816, 9.52812385559082, 10.02707290649414, 10.526021003723145, 11.024969100952148, 11.523918151855469, 12.022866249084473, 12.521815299987793, 13.020763397216797, 13.5197114944458, 14.018659591674805, 14.517608642578125, 15.016556739807129, 15.515504837036133, 16.014453887939453, 16.51340103149414, 17.01235008239746, 17.51129913330078, 18.01024627685547, 18.50919532775879, 19.00814437866211, 19.507091522216797]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 8.0, 8.0, 7.0, 13.0, 11.0, 16.0, 15.0, 21.0, 18.0, 33.0, 32.0, 31.0, 40.0, 42.0, 40.0, 48.0, 48.0, 32.0, 56.0, 37.0, 43.0, 43.0, 46.0, 32.0, 34.0, 37.0, 23.0, 19.0, 20.0, 26.0, 24.0, 16.0, 11.0, 8.0, 17.0, 14.0, 8.0, 4.0, 6.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-5.503911018371582, -5.331973552703857, -5.160036087036133, -4.988098621368408, -4.816161155700684, -4.644224166870117, -4.472286224365234, -4.300349235534668, -4.128411769866943, -3.9564743041992188, -3.784536838531494, -3.6125993728637695, -3.440662145614624, -3.2687246799468994, -3.096787214279175, -2.9248499870300293, -2.7529122829437256, -2.580974817276001, -2.4090373516082764, -2.237100124359131, -2.0651626586914062, -1.8932251930236816, -1.721287727355957, -1.549350380897522, -1.3774129152297974, -1.2054754495620728, -1.0335381031036377, -0.8616006374359131, -0.6896632313728333, -0.5177258253097534, -0.3457883596420288, -0.17385101318359375, -0.0019135475158691406, 0.1700238734483719, 0.3419612944126129, 0.5138987302780151, 0.685836136341095, 0.8577735424041748, 1.0297110080718994, 1.2016483545303345, 1.373585820198059, 1.5455232858657837, 1.7174606323242188, 1.8893980979919434, 2.061335563659668, 2.2332730293273926, 2.405210494995117, 2.5771477222442627, 2.7490851879119873, 2.921022653579712, 3.0929601192474365, 3.264897346496582, 3.4368348121643066, 3.6087722778320312, 3.780709743499756, 3.9526472091674805, 4.124584674835205, 4.29652214050293, 4.468459606170654, 4.640397071838379, 4.8123345375061035, 4.984272003173828, 5.1562089920043945, 5.328146457672119, 5.500083923339844]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 10.0, 9.0, 17.0, 31.0, 22.0, 47.0, 76.0, 85.0, 153.0, 211.0, 319.0, 511.0, 813.0, 1220.0, 1996.0, 2923.0, 4733.0, 7514.0, 12514.0, 22638.0, 47459.0, 103386.0, 198192.0, 254091.0, 191822.0, 98473.0, 45305.0, 22047.0, 11908.0, 7164.0, 4567.0, 2948.0, 1888.0, 1245.0, 767.0, 491.0, 305.0, 212.0, 126.0, 95.0, 53.0, 48.0, 42.0, 25.0, 13.0, 9.0, 11.0, 2.0, 7.0, 5.0, 0.0, 5.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.38671875, -1.3426513671875, -1.298583984375, -1.2545166015625, -1.21044921875, -1.1663818359375, -1.122314453125, -1.0782470703125, -1.0341796875, -0.9901123046875, -0.946044921875, -0.9019775390625, -0.85791015625, -0.8138427734375, -0.769775390625, -0.7257080078125, -0.681640625, -0.6375732421875, -0.593505859375, -0.5494384765625, -0.50537109375, -0.4613037109375, -0.417236328125, -0.3731689453125, -0.3291015625, -0.2850341796875, -0.240966796875, -0.1968994140625, -0.15283203125, -0.1087646484375, -0.064697265625, -0.0206298828125, 0.0234375, 0.0675048828125, 0.111572265625, 0.1556396484375, 0.19970703125, 0.2437744140625, 0.287841796875, 0.3319091796875, 0.3759765625, 0.4200439453125, 0.464111328125, 0.5081787109375, 0.55224609375, 0.5963134765625, 0.640380859375, 0.6844482421875, 0.728515625, 0.7725830078125, 0.816650390625, 0.8607177734375, 0.90478515625, 0.9488525390625, 0.992919921875, 1.0369873046875, 1.0810546875, 1.1251220703125, 1.169189453125, 1.2132568359375, 1.25732421875, 1.3013916015625, 1.345458984375, 1.3895263671875, 1.43359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 3.0, 5.0, 9.0, 12.0, 4.0, 19.0, 11.0, 15.0, 22.0, 24.0, 24.0, 29.0, 24.0, 27.0, 34.0, 27.0, 32.0, 38.0, 37.0, 47.0, 50.0, 34.0, 41.0, 34.0, 36.0, 30.0, 37.0, 35.0, 30.0, 23.0, 16.0, 19.0, 26.0, 19.0, 19.0, 14.0, 17.0, 16.0, 13.0, 16.0, 7.0, 3.0, 9.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.02734375, -0.9982528686523438, -0.9691619873046875, -0.9400711059570312, -0.910980224609375, -0.8818893432617188, -0.8527984619140625, -0.8237075805664062, -0.79461669921875, -0.7655258178710938, -0.7364349365234375, -0.7073440551757812, -0.678253173828125, -0.6491622924804688, -0.6200714111328125, -0.5909805297851562, -0.5618896484375, -0.5327987670898438, -0.5037078857421875, -0.47461700439453125, -0.445526123046875, -0.41643524169921875, -0.3873443603515625, -0.35825347900390625, -0.32916259765625, -0.30007171630859375, -0.2709808349609375, -0.24188995361328125, -0.212799072265625, -0.18370819091796875, -0.1546173095703125, -0.12552642822265625, -0.096435546875, -0.06734466552734375, -0.0382537841796875, -0.00916290283203125, 0.019927978515625, 0.04901885986328125, 0.0781097412109375, 0.10720062255859375, 0.13629150390625, 0.16538238525390625, 0.1944732666015625, 0.22356414794921875, 0.252655029296875, 0.28174591064453125, 0.3108367919921875, 0.33992767333984375, 0.3690185546875, 0.39810943603515625, 0.4272003173828125, 0.45629119873046875, 0.485382080078125, 0.5144729614257812, 0.5435638427734375, 0.5726547241210938, 0.60174560546875, 0.6308364868164062, 0.6599273681640625, 0.6890182495117188, 0.718109130859375, 0.7472000122070312, 0.7762908935546875, 0.8053817749023438, 0.83447265625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 6.0, 9.0, 7.0, 12.0, 17.0, 19.0, 29.0, 60.0, 77.0, 104.0, 168.0, 299.0, 590.0, 1130.0, 2438.0, 5129.0, 10601.0, 24836.0, 70499.0, 222266.0, 388856.0, 210708.0, 66829.0, 23756.0, 10316.0, 4943.0, 2349.0, 1106.0, 564.0, 307.0, 199.0, 102.0, 55.0, 43.0, 33.0, 19.0, 25.0, 10.0, 15.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.9619140625, -1.8975372314453125, -1.833160400390625, -1.7687835693359375, -1.70440673828125, -1.6400299072265625, -1.575653076171875, -1.5112762451171875, -1.4468994140625, -1.3825225830078125, -1.318145751953125, -1.2537689208984375, -1.18939208984375, -1.1250152587890625, -1.060638427734375, -0.9962615966796875, -0.931884765625, -0.8675079345703125, -0.803131103515625, -0.7387542724609375, -0.67437744140625, -0.6100006103515625, -0.545623779296875, -0.4812469482421875, -0.4168701171875, -0.3524932861328125, -0.288116455078125, -0.2237396240234375, -0.15936279296875, -0.0949859619140625, -0.030609130859375, 0.0337677001953125, 0.09814453125, 0.1625213623046875, 0.226898193359375, 0.2912750244140625, 0.35565185546875, 0.4200286865234375, 0.484405517578125, 0.5487823486328125, 0.6131591796875, 0.6775360107421875, 0.741912841796875, 0.8062896728515625, 0.87066650390625, 0.9350433349609375, 0.999420166015625, 1.0637969970703125, 1.128173828125, 1.1925506591796875, 1.256927490234375, 1.3213043212890625, 1.38568115234375, 1.4500579833984375, 1.514434814453125, 1.5788116455078125, 1.6431884765625, 1.7075653076171875, 1.771942138671875, 1.8363189697265625, 1.90069580078125, 1.9650726318359375, 2.029449462890625, 2.0938262939453125, 2.158203125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 1.0, 4.0, 10.0, 7.0, 7.0, 7.0, 11.0, 16.0, 17.0, 17.0, 28.0, 29.0, 16.0, 30.0, 39.0, 40.0, 26.0, 32.0, 34.0, 43.0, 46.0, 50.0, 42.0, 35.0, 35.0, 39.0, 36.0, 35.0, 34.0, 30.0, 35.0, 18.0, 22.0, 27.0, 14.0, 19.0, 7.0, 10.0, 15.0, 11.0, 7.0, 4.0, 5.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.48828125, -2.40167236328125, -2.3150634765625, -2.22845458984375, -2.141845703125, -2.05523681640625, -1.9686279296875, -1.88201904296875, -1.79541015625, -1.70880126953125, -1.6221923828125, -1.53558349609375, -1.448974609375, -1.36236572265625, -1.2757568359375, -1.18914794921875, -1.1025390625, -1.01593017578125, -0.9293212890625, -0.84271240234375, -0.756103515625, -0.66949462890625, -0.5828857421875, -0.49627685546875, -0.40966796875, -0.32305908203125, -0.2364501953125, -0.14984130859375, -0.063232421875, 0.02337646484375, 0.1099853515625, 0.19659423828125, 0.283203125, 0.36981201171875, 0.4564208984375, 0.54302978515625, 0.629638671875, 0.71624755859375, 0.8028564453125, 0.88946533203125, 0.97607421875, 1.06268310546875, 1.1492919921875, 1.23590087890625, 1.322509765625, 1.40911865234375, 1.4957275390625, 1.58233642578125, 1.6689453125, 1.75555419921875, 1.8421630859375, 1.92877197265625, 2.015380859375, 2.10198974609375, 2.1885986328125, 2.27520751953125, 2.36181640625, 2.44842529296875, 2.5350341796875, 2.62164306640625, 2.708251953125, 2.79486083984375, 2.8814697265625, 2.96807861328125, 3.0546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 8.0, 16.0, 18.0, 26.0, 35.0, 50.0, 92.0, 124.0, 201.0, 295.0, 452.0, 735.0, 1273.0, 1832.0, 2829.0, 4544.0, 7403.0, 11998.0, 20343.0, 38313.0, 75945.0, 149723.0, 234165.0, 220593.0, 131268.0, 65513.0, 33400.0, 18182.0, 10946.0, 6702.0, 4126.0, 2574.0, 1680.0, 1120.0, 764.0, 418.0, 310.0, 178.0, 114.0, 86.0, 55.0, 41.0, 24.0, 15.0, 12.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.49560546875, -0.4800682067871094, -0.46453094482421875, -0.4489936828613281, -0.4334564208984375, -0.4179191589355469, -0.40238189697265625, -0.3868446350097656, -0.371307373046875, -0.3557701110839844, -0.34023284912109375, -0.3246955871582031, -0.3091583251953125, -0.2936210632324219, -0.27808380126953125, -0.2625465393066406, -0.24700927734375, -0.23147201538085938, -0.21593475341796875, -0.20039749145507812, -0.1848602294921875, -0.16932296752929688, -0.15378570556640625, -0.13824844360351562, -0.122711181640625, -0.10717391967773438, -0.09163665771484375, -0.07609939575195312, -0.0605621337890625, -0.045024871826171875, -0.02948760986328125, -0.013950347900390625, 0.0015869140625, 0.017124176025390625, 0.03266143798828125, 0.048198699951171875, 0.0637359619140625, 0.07927322387695312, 0.09481048583984375, 0.11034774780273438, 0.125885009765625, 0.14142227172851562, 0.15695953369140625, 0.17249679565429688, 0.1880340576171875, 0.20357131958007812, 0.21910858154296875, 0.23464584350585938, 0.25018310546875, 0.2657203674316406, 0.28125762939453125, 0.2967948913574219, 0.3123321533203125, 0.3278694152832031, 0.34340667724609375, 0.3589439392089844, 0.374481201171875, 0.3900184631347656, 0.40555572509765625, 0.4210929870605469, 0.4366302490234375, 0.4521675109863281, 0.46770477294921875, 0.4832420349121094, 0.498779296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 5.0, 4.0, 9.0, 6.0, 7.0, 2.0, 13.0, 16.0, 17.0, 32.0, 33.0, 50.0, 77.0, 110.0, 129.0, 122.0, 81.0, 81.0, 61.0, 36.0, 21.0, 15.0, 21.0, 6.0, 4.0, 10.0, 7.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0003037452697753906, -0.0002947896718978882, -0.00028583407402038574, -0.0002768784761428833, -0.00026792287826538086, -0.0002589672803878784, -0.000250011682510376, -0.00024105608463287354, -0.0002321004867553711, -0.00022314488887786865, -0.0002141892910003662, -0.00020523369312286377, -0.00019627809524536133, -0.0001873224973678589, -0.00017836689949035645, -0.000169411301612854, -0.00016045570373535156, -0.00015150010585784912, -0.00014254450798034668, -0.00013358891010284424, -0.0001246333122253418, -0.00011567771434783936, -0.00010672211647033691, -9.776651859283447e-05, -8.881092071533203e-05, -7.985532283782959e-05, -7.089972496032715e-05, -6.194412708282471e-05, -5.2988529205322266e-05, -4.4032931327819824e-05, -3.507733345031738e-05, -2.612173557281494e-05, -1.71661376953125e-05, -8.210539817810059e-06, 7.450580596923828e-07, 9.700655937194824e-06, 1.8656253814697266e-05, 2.7611851692199707e-05, 3.656744956970215e-05, 4.552304744720459e-05, 5.447864532470703e-05, 6.343424320220947e-05, 7.238984107971191e-05, 8.134543895721436e-05, 9.03010368347168e-05, 9.925663471221924e-05, 0.00010821223258972168, 0.00011716783046722412, 0.00012612342834472656, 0.000135079026222229, 0.00014403462409973145, 0.0001529902219772339, 0.00016194581985473633, 0.00017090141773223877, 0.0001798570156097412, 0.00018881261348724365, 0.0001977682113647461, 0.00020672380924224854, 0.00021567940711975098, 0.00022463500499725342, 0.00023359060287475586, 0.0002425462007522583, 0.00025150179862976074, 0.0002604573965072632, 0.0002694129943847656]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 8.0, 3.0, 7.0, 18.0, 17.0, 29.0, 31.0, 59.0, 82.0, 131.0, 181.0, 311.0, 576.0, 1002.0, 1809.0, 3339.0, 6269.0, 11447.0, 21977.0, 44115.0, 85490.0, 156469.0, 224030.0, 210405.0, 133968.0, 70886.0, 35999.0, 18649.0, 9663.0, 5137.0, 2812.0, 1483.0, 866.0, 487.0, 310.0, 184.0, 115.0, 65.0, 49.0, 25.0, 25.0, 4.0, 7.0, 11.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.509765625, -0.4942512512207031, -0.47873687744140625, -0.4632225036621094, -0.4477081298828125, -0.4321937561035156, -0.41667938232421875, -0.4011650085449219, -0.385650634765625, -0.3701362609863281, -0.35462188720703125, -0.3391075134277344, -0.3235931396484375, -0.3080787658691406, -0.29256439208984375, -0.2770500183105469, -0.26153564453125, -0.24602127075195312, -0.23050689697265625, -0.21499252319335938, -0.1994781494140625, -0.18396377563476562, -0.16844940185546875, -0.15293502807617188, -0.137420654296875, -0.12190628051757812, -0.10639190673828125, -0.09087753295898438, -0.0753631591796875, -0.059848785400390625, -0.04433441162109375, -0.028820037841796875, -0.0133056640625, 0.002208709716796875, 0.01772308349609375, 0.033237457275390625, 0.0487518310546875, 0.06426620483398438, 0.07978057861328125, 0.09529495239257812, 0.110809326171875, 0.12632369995117188, 0.14183807373046875, 0.15735244750976562, 0.1728668212890625, 0.18838119506835938, 0.20389556884765625, 0.21940994262695312, 0.23492431640625, 0.2504386901855469, 0.26595306396484375, 0.2814674377441406, 0.2969818115234375, 0.3124961853027344, 0.32801055908203125, 0.3435249328613281, 0.359039306640625, 0.3745536804199219, 0.39006805419921875, 0.4055824279785156, 0.4210968017578125, 0.4366111755371094, 0.45212554931640625, 0.4676399230957031, 0.483154296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 14.0, 7.0, 10.0, 23.0, 23.0, 33.0, 28.0, 47.0, 61.0, 83.0, 71.0, 89.0, 83.0, 87.0, 76.0, 65.0, 54.0, 46.0, 27.0, 19.0, 16.0, 10.0, 8.0, 9.0, 4.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9248046875, -0.8960800170898438, -0.8673553466796875, -0.8386306762695312, -0.809906005859375, -0.7811813354492188, -0.7524566650390625, -0.7237319946289062, -0.69500732421875, -0.6662826538085938, -0.6375579833984375, -0.6088333129882812, -0.580108642578125, -0.5513839721679688, -0.5226593017578125, -0.49393463134765625, -0.4652099609375, -0.43648529052734375, -0.4077606201171875, -0.37903594970703125, -0.350311279296875, -0.32158660888671875, -0.2928619384765625, -0.26413726806640625, -0.23541259765625, -0.20668792724609375, -0.1779632568359375, -0.14923858642578125, -0.120513916015625, -0.09178924560546875, -0.0630645751953125, -0.03433990478515625, -0.005615234375, 0.02310943603515625, 0.0518341064453125, 0.08055877685546875, 0.109283447265625, 0.13800811767578125, 0.1667327880859375, 0.19545745849609375, 0.22418212890625, 0.25290679931640625, 0.2816314697265625, 0.31035614013671875, 0.339080810546875, 0.36780548095703125, 0.3965301513671875, 0.42525482177734375, 0.4539794921875, 0.48270416259765625, 0.5114288330078125, 0.5401535034179688, 0.568878173828125, 0.5976028442382812, 0.6263275146484375, 0.6550521850585938, 0.68377685546875, 0.7125015258789062, 0.7412261962890625, 0.7699508666992188, 0.798675537109375, 0.8274002075195312, 0.8561248779296875, 0.8848495483398438, 0.91357421875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 8.0, 0.0, 6.0, 8.0, 11.0, 24.0, 63.0, 97.0, 138.0, 130.0, 134.0, 131.0, 98.0, 63.0, 33.0, 28.0, 10.0, 5.0, 3.0, 5.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.472113609313965, -7.096959114074707, -6.721805095672607, -6.34665060043335, -5.97149658203125, -5.596342086791992, -5.221187591552734, -4.846033096313477, -4.470879077911377, -4.095724582672119, -3.7205705642700195, -3.3454160690307617, -2.970261812210083, -2.5951075553894043, -2.2199530601501465, -1.8447988033294678, -1.469644546508789, -1.0944902896881104, -0.7193359136581421, -0.34418153762817383, 0.030972719192504883, 0.4061269760131836, 0.7812814712524414, 1.1564357280731201, 1.5315899848937988, 1.9067442417144775, 2.2818984985351562, 2.657052993774414, 3.0322072505950928, 3.4073615074157715, 3.7825160026550293, 4.157670021057129, 4.53282356262207, 4.907978057861328, 5.283132076263428, 5.6582865715026855, 6.033440589904785, 6.408595085144043, 6.783749580383301, 7.158904075622559, 7.534058094024658, 7.909212589263916, 8.284366607666016, 8.659521102905273, 9.034675598144531, 9.409830093383789, 9.784984588623047, 10.160138130187988, 10.535292625427246, 10.910447120666504, 11.285601615905762, 11.660755157470703, 12.035909652709961, 12.411064147949219, 12.786218643188477, 13.161373138427734, 13.536527633666992, 13.91168212890625, 14.286836624145508, 14.661991119384766, 15.037144660949707, 15.412299156188965, 15.787453651428223, 16.162607192993164, 16.537761688232422]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0, 7.0, 12.0, 14.0, 19.0, 21.0, 17.0, 25.0, 36.0, 29.0, 35.0, 32.0, 44.0, 47.0, 40.0, 37.0, 35.0, 35.0, 36.0, 37.0, 33.0, 45.0, 35.0, 34.0, 28.0, 28.0, 29.0, 36.0, 20.0, 20.0, 20.0, 20.0, 19.0, 12.0, 9.0, 6.0, 5.0, 3.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.96188497543335, -5.762948513031006, -5.564012050628662, -5.36507511138916, -5.166138648986816, -4.967202186584473, -4.768265724182129, -4.569329261779785, -4.370392799377441, -4.171456336975098, -3.972519636154175, -3.773583173751831, -3.574646472930908, -3.3757100105285645, -3.1767735481262207, -2.977837085723877, -2.778900146484375, -2.5799636840820312, -2.3810269832611084, -2.1820905208587646, -1.9831539392471313, -1.784217357635498, -1.5852808952331543, -1.386344313621521, -1.1874077320098877, -0.9884711503982544, -0.7895346283912659, -0.5905981063842773, -0.39166152477264404, -0.19272494316101074, 0.006211519241333008, 0.2051481008529663, 0.4040846824645996, 0.6030212640762329, 0.8019577860832214, 1.00089430809021, 1.1998308897018433, 1.3987674713134766, 1.5977039337158203, 1.7966405153274536, 1.995577096939087, 2.1945135593414307, 2.3934502601623535, 2.5923867225646973, 2.791323184967041, 2.990259885787964, 3.1891963481903076, 3.3881330490112305, 3.587069511413574, 3.786005973815918, 3.984942674636841, 4.1838788986206055, 4.382815837860107, 4.581752300262451, 4.780688762664795, 4.979625225067139, 5.178562164306641, 5.377498626708984, 5.576435089111328, 5.775371551513672, 5.974308490753174, 6.173244953155518, 6.372181415557861, 6.571117877960205, 6.770054340362549]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 8.0, 5.0, 20.0, 35.0, 35.0, 39.0, 92.0, 131.0, 249.0, 350.0, 628.0, 1177.0, 2451.0, 5110.0, 11532.0, 28063.0, 75274.0, 212223.0, 571432.0, 1156444.0, 1176827.0, 595225.0, 223245.0, 79742.0, 30166.0, 12583.0, 5325.0, 2684.0, 1356.0, 764.0, 414.0, 248.0, 149.0, 81.0, 40.0, 39.0, 31.0, 26.0, 16.0, 7.0, 9.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.072265625, -1.0377197265625, -1.003173828125, -0.9686279296875, -0.93408203125, -0.8995361328125, -0.864990234375, -0.8304443359375, -0.7958984375, -0.7613525390625, -0.726806640625, -0.6922607421875, -0.65771484375, -0.6231689453125, -0.588623046875, -0.5540771484375, -0.51953125, -0.4849853515625, -0.450439453125, -0.4158935546875, -0.38134765625, -0.3468017578125, -0.312255859375, -0.2777099609375, -0.2431640625, -0.2086181640625, -0.174072265625, -0.1395263671875, -0.10498046875, -0.0704345703125, -0.035888671875, -0.0013427734375, 0.033203125, 0.0677490234375, 0.102294921875, 0.1368408203125, 0.17138671875, 0.2059326171875, 0.240478515625, 0.2750244140625, 0.3095703125, 0.3441162109375, 0.378662109375, 0.4132080078125, 0.44775390625, 0.4822998046875, 0.516845703125, 0.5513916015625, 0.5859375, 0.6204833984375, 0.655029296875, 0.6895751953125, 0.72412109375, 0.7586669921875, 0.793212890625, 0.8277587890625, 0.8623046875, 0.8968505859375, 0.931396484375, 0.9659423828125, 1.00048828125, 1.0350341796875, 1.069580078125, 1.1041259765625, 1.138671875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 4.0, 8.0, 12.0, 15.0, 18.0, 26.0, 18.0, 30.0, 23.0, 27.0, 30.0, 41.0, 40.0, 41.0, 50.0, 53.0, 60.0, 43.0, 51.0, 40.0, 37.0, 36.0, 36.0, 34.0, 29.0, 35.0, 29.0, 19.0, 22.0, 20.0, 16.0, 12.0, 8.0, 7.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.11328125, -1.078338623046875, -1.04339599609375, -1.008453369140625, -0.9735107421875, -0.938568115234375, -0.90362548828125, -0.868682861328125, -0.833740234375, -0.798797607421875, -0.76385498046875, -0.728912353515625, -0.6939697265625, -0.659027099609375, -0.62408447265625, -0.589141845703125, -0.55419921875, -0.519256591796875, -0.48431396484375, -0.449371337890625, -0.4144287109375, -0.379486083984375, -0.34454345703125, -0.309600830078125, -0.274658203125, -0.239715576171875, -0.20477294921875, -0.169830322265625, -0.1348876953125, -0.099945068359375, -0.06500244140625, -0.030059814453125, 0.0048828125, 0.039825439453125, 0.07476806640625, 0.109710693359375, 0.1446533203125, 0.179595947265625, 0.21453857421875, 0.249481201171875, 0.284423828125, 0.319366455078125, 0.35430908203125, 0.389251708984375, 0.4241943359375, 0.459136962890625, 0.49407958984375, 0.529022216796875, 0.56396484375, 0.598907470703125, 0.63385009765625, 0.668792724609375, 0.7037353515625, 0.738677978515625, 0.77362060546875, 0.808563232421875, 0.843505859375, 0.878448486328125, 0.91339111328125, 0.948333740234375, 0.9832763671875, 1.018218994140625, 1.05316162109375, 1.088104248046875, 1.123046875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 9.0, 8.0, 9.0, 21.0, 24.0, 44.0, 57.0, 115.0, 224.0, 348.0, 716.0, 1360.0, 2749.0, 6337.0, 15922.0, 42667.0, 128727.0, 442431.0, 1507776.0, 1442568.0, 413026.0, 121589.0, 40788.0, 15034.0, 6237.0, 2709.0, 1289.0, 680.0, 334.0, 190.0, 125.0, 72.0, 41.0, 26.0, 11.0, 6.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.189453125, -1.1436614990234375, -1.097869873046875, -1.0520782470703125, -1.00628662109375, -0.9604949951171875, -0.914703369140625, -0.8689117431640625, -0.8231201171875, -0.7773284912109375, -0.731536865234375, -0.6857452392578125, -0.63995361328125, -0.5941619873046875, -0.548370361328125, -0.5025787353515625, -0.456787109375, -0.4109954833984375, -0.365203857421875, -0.3194122314453125, -0.27362060546875, -0.2278289794921875, -0.182037353515625, -0.1362457275390625, -0.0904541015625, -0.0446624755859375, 0.001129150390625, 0.0469207763671875, 0.09271240234375, 0.1385040283203125, 0.184295654296875, 0.2300872802734375, 0.27587890625, 0.3216705322265625, 0.367462158203125, 0.4132537841796875, 0.45904541015625, 0.5048370361328125, 0.550628662109375, 0.5964202880859375, 0.6422119140625, 0.6880035400390625, 0.733795166015625, 0.7795867919921875, 0.82537841796875, 0.8711700439453125, 0.916961669921875, 0.9627532958984375, 1.008544921875, 1.0543365478515625, 1.100128173828125, 1.1459197998046875, 1.19171142578125, 1.2375030517578125, 1.283294677734375, 1.3290863037109375, 1.3748779296875, 1.4206695556640625, 1.466461181640625, 1.5122528076171875, 1.55804443359375, 1.6038360595703125, 1.649627685546875, 1.6954193115234375, 1.7412109375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 7.0, 5.0, 7.0, 11.0, 18.0, 23.0, 45.0, 48.0, 58.0, 97.0, 107.0, 143.0, 213.0, 294.0, 341.0, 438.0, 489.0, 414.0, 330.0, 267.0, 209.0, 146.0, 95.0, 74.0, 46.0, 31.0, 30.0, 21.0, 12.0, 15.0, 7.0, 8.0, 7.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.03515625, -1.9777374267578125, -1.920318603515625, -1.8628997802734375, -1.80548095703125, -1.7480621337890625, -1.690643310546875, -1.6332244873046875, -1.5758056640625, -1.5183868408203125, -1.460968017578125, -1.4035491943359375, -1.34613037109375, -1.2887115478515625, -1.231292724609375, -1.1738739013671875, -1.116455078125, -1.0590362548828125, -1.001617431640625, -0.9441986083984375, -0.88677978515625, -0.8293609619140625, -0.771942138671875, -0.7145233154296875, -0.6571044921875, -0.5996856689453125, -0.542266845703125, -0.4848480224609375, -0.42742919921875, -0.3700103759765625, -0.312591552734375, -0.2551727294921875, -0.19775390625, -0.1403350830078125, -0.082916259765625, -0.0254974365234375, 0.03192138671875, 0.0893402099609375, 0.146759033203125, 0.2041778564453125, 0.2615966796875, 0.3190155029296875, 0.376434326171875, 0.4338531494140625, 0.49127197265625, 0.5486907958984375, 0.606109619140625, 0.6635284423828125, 0.720947265625, 0.7783660888671875, 0.835784912109375, 0.8932037353515625, 0.95062255859375, 1.0080413818359375, 1.065460205078125, 1.1228790283203125, 1.1802978515625, 1.2377166748046875, 1.295135498046875, 1.3525543212890625, 1.40997314453125, 1.4673919677734375, 1.524810791015625, 1.5822296142578125, 1.6396484375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 4.0, 6.0, 11.0, 23.0, 28.0, 37.0, 76.0, 101.0, 117.0, 138.0, 119.0, 99.0, 77.0, 66.0, 33.0, 33.0, 9.0, 9.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.373401641845703, -10.991823196411133, -10.610245704650879, -10.228667259216309, -9.847089767456055, -9.465511322021484, -9.083932876586914, -8.70235538482666, -8.32077693939209, -7.939198970794678, -7.557621002197266, -7.176042556762695, -6.794464588165283, -6.412886619567871, -6.031308650970459, -5.649730682373047, -5.268152713775635, -4.886574745178223, -4.5049967765808105, -4.123418807983398, -3.741840362548828, -3.360262393951416, -2.978684425354004, -2.5971062183380127, -2.2155282497406006, -1.833950161933899, -1.4523720741271973, -1.0707941055297852, -0.6892160177230835, -0.30763792991638184, 0.07394003868103027, 0.4555182456970215, 0.8370962142944336, 1.2186743021011353, 1.600252389907837, 1.981830358505249, 2.3634085655212402, 2.7449865341186523, 3.1265645027160645, 3.5081427097320557, 3.8897206783294678, 4.271298885345459, 4.652876853942871, 5.034454822540283, 5.416032791137695, 5.797611236572266, 6.1791887283325195, 6.56076717376709, 6.942345142364502, 7.323923110961914, 7.705501079559326, 8.087079048156738, 8.468657493591309, 8.850234985351562, 9.231813430786133, 9.613391876220703, 9.994969367980957, 10.376547813415527, 10.758125305175781, 11.139703750610352, 11.521281242370605, 11.902859687805176, 12.28443717956543, 12.666015625, 13.04759407043457]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 4.0, 5.0, 5.0, 10.0, 7.0, 14.0, 13.0, 17.0, 21.0, 21.0, 19.0, 24.0, 31.0, 21.0, 37.0, 33.0, 49.0, 43.0, 41.0, 40.0, 42.0, 48.0, 44.0, 39.0, 42.0, 35.0, 35.0, 29.0, 33.0, 26.0, 29.0, 24.0, 17.0, 21.0, 17.0, 12.0, 7.0, 15.0, 7.0, 12.0, 3.0, 5.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.008131980895996, -5.81958532333374, -5.631039142608643, -5.442492485046387, -5.253945827484131, -5.065399169921875, -4.876852989196777, -4.6883063316345215, -4.499759674072266, -4.31121301651001, -4.122666835784912, -3.9341201782226562, -3.7455735206604004, -3.5570271015167236, -3.368480682373047, -3.179934024810791, -2.9913878440856934, -2.8028414249420166, -2.6142947673797607, -2.425748348236084, -2.237201690673828, -2.0486552715301514, -1.8601088523864746, -1.6715623140335083, -1.483015775680542, -1.2944692373275757, -1.1059226989746094, -0.9173762798309326, -0.7288297414779663, -0.540283203125, -0.35173678398132324, -0.16319024562835693, 0.025356292724609375, 0.2139028012752533, 0.4024493098258972, 0.5909957885742188, 0.7795423269271851, 0.9680888652801514, 1.1566352844238281, 1.3451818227767944, 1.5337283611297607, 1.722274899482727, 1.9108214378356934, 2.09936785697937, 2.287914276123047, 2.4764609336853027, 2.6650073528289795, 2.8535537719726562, 3.042100429534912, 3.230646848678589, 3.4191935062408447, 3.6077399253845215, 3.7962865829467773, 3.984833002090454, 4.173379421234131, 4.361926078796387, 4.550472259521484, 4.73901891708374, 4.927565097808838, 5.116111755371094, 5.30465841293335, 5.4932050704956055, 5.681751251220703, 5.870297908782959, 6.058844566345215]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 9.0, 6.0, 7.0, 9.0, 20.0, 27.0, 40.0, 61.0, 106.0, 165.0, 260.0, 439.0, 711.0, 1193.0, 2156.0, 3967.0, 8239.0, 22942.0, 85989.0, 283312.0, 391654.0, 175115.0, 45808.0, 13817.0, 5530.0, 2921.0, 1711.0, 958.0, 531.0, 334.0, 211.0, 99.0, 72.0, 51.0, 37.0, 22.0, 13.0, 10.0, 7.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.095703125, -2.03076171875, -1.9658203125, -1.90087890625, -1.8359375, -1.77099609375, -1.7060546875, -1.64111328125, -1.576171875, -1.51123046875, -1.4462890625, -1.38134765625, -1.31640625, -1.25146484375, -1.1865234375, -1.12158203125, -1.056640625, -0.99169921875, -0.9267578125, -0.86181640625, -0.796875, -0.73193359375, -0.6669921875, -0.60205078125, -0.537109375, -0.47216796875, -0.4072265625, -0.34228515625, -0.27734375, -0.21240234375, -0.1474609375, -0.08251953125, -0.017578125, 0.04736328125, 0.1123046875, 0.17724609375, 0.2421875, 0.30712890625, 0.3720703125, 0.43701171875, 0.501953125, 0.56689453125, 0.6318359375, 0.69677734375, 0.76171875, 0.82666015625, 0.8916015625, 0.95654296875, 1.021484375, 1.08642578125, 1.1513671875, 1.21630859375, 1.28125, 1.34619140625, 1.4111328125, 1.47607421875, 1.541015625, 1.60595703125, 1.6708984375, 1.73583984375, 1.80078125, 1.86572265625, 1.9306640625, 1.99560546875, 2.060546875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 11.0, 8.0, 12.0, 20.0, 28.0, 16.0, 25.0, 39.0, 31.0, 28.0, 22.0, 39.0, 46.0, 45.0, 46.0, 45.0, 36.0, 46.0, 53.0, 37.0, 49.0, 48.0, 39.0, 28.0, 37.0, 22.0, 29.0, 14.0, 11.0, 18.0, 18.0, 11.0, 11.0, 6.0, 4.0, 5.0, 1.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3837890625, -1.3457183837890625, -1.307647705078125, -1.2695770263671875, -1.23150634765625, -1.1934356689453125, -1.155364990234375, -1.1172943115234375, -1.0792236328125, -1.0411529541015625, -1.003082275390625, -0.9650115966796875, -0.92694091796875, -0.8888702392578125, -0.850799560546875, -0.8127288818359375, -0.774658203125, -0.7365875244140625, -0.698516845703125, -0.6604461669921875, -0.62237548828125, -0.5843048095703125, -0.546234130859375, -0.5081634521484375, -0.4700927734375, -0.4320220947265625, -0.393951416015625, -0.3558807373046875, -0.31781005859375, -0.2797393798828125, -0.241668701171875, -0.2035980224609375, -0.16552734375, -0.1274566650390625, -0.089385986328125, -0.0513153076171875, -0.01324462890625, 0.0248260498046875, 0.062896728515625, 0.1009674072265625, 0.1390380859375, 0.1771087646484375, 0.215179443359375, 0.2532501220703125, 0.29132080078125, 0.3293914794921875, 0.367462158203125, 0.4055328369140625, 0.443603515625, 0.4816741943359375, 0.519744873046875, 0.5578155517578125, 0.59588623046875, 0.6339569091796875, 0.672027587890625, 0.7100982666015625, 0.7481689453125, 0.7862396240234375, 0.824310302734375, 0.8623809814453125, 0.90045166015625, 0.9385223388671875, 0.976593017578125, 1.0146636962890625, 1.052734375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 9.0, 7.0, 11.0, 23.0, 25.0, 30.0, 62.0, 79.0, 119.0, 184.0, 294.0, 478.0, 882.0, 1503.0, 2662.0, 5105.0, 10251.0, 23269.0, 62479.0, 168349.0, 313326.0, 266713.0, 116479.0, 42404.0, 16900.0, 7738.0, 4025.0, 2096.0, 1228.0, 700.0, 383.0, 262.0, 161.0, 91.0, 67.0, 56.0, 35.0, 17.0, 18.0, 10.0, 7.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.5439453125, -1.49688720703125, -1.4498291015625, -1.40277099609375, -1.355712890625, -1.30865478515625, -1.2615966796875, -1.21453857421875, -1.16748046875, -1.12042236328125, -1.0733642578125, -1.02630615234375, -0.979248046875, -0.93218994140625, -0.8851318359375, -0.83807373046875, -0.791015625, -0.74395751953125, -0.6968994140625, -0.64984130859375, -0.602783203125, -0.55572509765625, -0.5086669921875, -0.46160888671875, -0.41455078125, -0.36749267578125, -0.3204345703125, -0.27337646484375, -0.226318359375, -0.17926025390625, -0.1322021484375, -0.08514404296875, -0.0380859375, 0.00897216796875, 0.0560302734375, 0.10308837890625, 0.150146484375, 0.19720458984375, 0.2442626953125, 0.29132080078125, 0.33837890625, 0.38543701171875, 0.4324951171875, 0.47955322265625, 0.526611328125, 0.57366943359375, 0.6207275390625, 0.66778564453125, 0.71484375, 0.76190185546875, 0.8089599609375, 0.85601806640625, 0.903076171875, 0.95013427734375, 0.9971923828125, 1.04425048828125, 1.09130859375, 1.13836669921875, 1.1854248046875, 1.23248291015625, 1.279541015625, 1.32659912109375, 1.3736572265625, 1.42071533203125, 1.4677734375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 12.0, 11.0, 15.0, 30.0, 16.0, 30.0, 28.0, 28.0, 34.0, 35.0, 38.0, 45.0, 44.0, 48.0, 40.0, 50.0, 60.0, 48.0, 43.0, 32.0, 35.0, 35.0, 38.0, 26.0, 34.0, 26.0, 26.0, 22.0, 6.0, 15.0, 5.0, 9.0, 11.0, 3.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.40234375, -3.295196533203125, -3.18804931640625, -3.080902099609375, -2.9737548828125, -2.866607666015625, -2.75946044921875, -2.652313232421875, -2.545166015625, -2.438018798828125, -2.33087158203125, -2.223724365234375, -2.1165771484375, -2.009429931640625, -1.90228271484375, -1.795135498046875, -1.68798828125, -1.580841064453125, -1.47369384765625, -1.366546630859375, -1.2593994140625, -1.152252197265625, -1.04510498046875, -0.937957763671875, -0.830810546875, -0.723663330078125, -0.61651611328125, -0.509368896484375, -0.4022216796875, -0.295074462890625, -0.18792724609375, -0.080780029296875, 0.0263671875, 0.133514404296875, 0.24066162109375, 0.347808837890625, 0.4549560546875, 0.562103271484375, 0.66925048828125, 0.776397705078125, 0.883544921875, 0.990692138671875, 1.09783935546875, 1.204986572265625, 1.3121337890625, 1.419281005859375, 1.52642822265625, 1.633575439453125, 1.74072265625, 1.847869873046875, 1.95501708984375, 2.062164306640625, 2.1693115234375, 2.276458740234375, 2.38360595703125, 2.490753173828125, 2.597900390625, 2.705047607421875, 2.81219482421875, 2.919342041015625, 3.0264892578125, 3.133636474609375, 3.24078369140625, 3.347930908203125, 3.455078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 11.0, 19.0, 25.0, 43.0, 56.0, 77.0, 133.0, 213.0, 332.0, 518.0, 819.0, 1375.0, 2287.0, 4105.0, 6962.0, 12487.0, 24398.0, 48128.0, 93124.0, 165796.0, 223532.0, 199936.0, 125233.0, 66262.0, 33817.0, 17119.0, 9204.0, 5024.0, 2912.0, 1796.0, 1028.0, 642.0, 386.0, 260.0, 197.0, 98.0, 61.0, 48.0, 30.0, 19.0, 13.0, 10.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.312255859375, -0.3009986877441406, -0.28974151611328125, -0.2784843444824219, -0.2672271728515625, -0.2559700012207031, -0.24471282958984375, -0.23345565795898438, -0.222198486328125, -0.21094131469726562, -0.19968414306640625, -0.18842697143554688, -0.1771697998046875, -0.16591262817382812, -0.15465545654296875, -0.14339828491210938, -0.13214111328125, -0.12088394165039062, -0.10962677001953125, -0.09836959838867188, -0.0871124267578125, -0.07585525512695312, -0.06459808349609375, -0.053340911865234375, -0.042083740234375, -0.030826568603515625, -0.01956939697265625, -0.008312225341796875, 0.0029449462890625, 0.014202117919921875, 0.02545928955078125, 0.036716461181640625, 0.0479736328125, 0.059230804443359375, 0.07048797607421875, 0.08174514770507812, 0.0930023193359375, 0.10425949096679688, 0.11551666259765625, 0.12677383422851562, 0.138031005859375, 0.14928817749023438, 0.16054534912109375, 0.17180252075195312, 0.1830596923828125, 0.19431686401367188, 0.20557403564453125, 0.21683120727539062, 0.22808837890625, 0.23934555053710938, 0.25060272216796875, 0.2618598937988281, 0.2731170654296875, 0.2843742370605469, 0.29563140869140625, 0.3068885803222656, 0.318145751953125, 0.3294029235839844, 0.34066009521484375, 0.3519172668457031, 0.3631744384765625, 0.3744316101074219, 0.38568878173828125, 0.3969459533691406, 0.408203125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 7.0, 2.0, 2.0, 1.0, 6.0, 14.0, 7.0, 19.0, 17.0, 33.0, 43.0, 59.0, 76.0, 94.0, 106.0, 120.0, 107.0, 65.0, 61.0, 55.0, 36.0, 18.0, 21.0, 11.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017452239990234375, -0.00016763806343078613, -0.00016075372695922852, -0.0001538693904876709, -0.00014698505401611328, -0.00014010071754455566, -0.00013321638107299805, -0.00012633204460144043, -0.00011944770812988281, -0.0001125633716583252, -0.00010567903518676758, -9.879469871520996e-05, -9.191036224365234e-05, -8.502602577209473e-05, -7.814168930053711e-05, -7.125735282897949e-05, -6.437301635742188e-05, -5.748867988586426e-05, -5.060434341430664e-05, -4.3720006942749023e-05, -3.6835670471191406e-05, -2.995133399963379e-05, -2.3066997528076172e-05, -1.6182661056518555e-05, -9.298324584960938e-06, -2.4139881134033203e-06, 4.470348358154297e-06, 1.1354684829711914e-05, 1.823902130126953e-05, 2.512335777282715e-05, 3.2007694244384766e-05, 3.889203071594238e-05, 4.57763671875e-05, 5.266070365905762e-05, 5.9545040130615234e-05, 6.642937660217285e-05, 7.331371307373047e-05, 8.019804954528809e-05, 8.70823860168457e-05, 9.396672248840332e-05, 0.00010085105895996094, 0.00010773539543151855, 0.00011461973190307617, 0.00012150406837463379, 0.0001283884048461914, 0.00013527274131774902, 0.00014215707778930664, 0.00014904141426086426, 0.00015592575073242188, 0.0001628100872039795, 0.0001696944236755371, 0.00017657876014709473, 0.00018346309661865234, 0.00019034743309020996, 0.00019723176956176758, 0.0002041161060333252, 0.0002110004425048828, 0.00021788477897644043, 0.00022476911544799805, 0.00023165345191955566, 0.00023853778839111328, 0.0002454221248626709, 0.0002523064613342285, 0.00025919079780578613, 0.00026607513427734375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 8.0, 9.0, 22.0, 18.0, 37.0, 39.0, 64.0, 119.0, 130.0, 261.0, 385.0, 667.0, 1131.0, 2003.0, 3386.0, 5883.0, 10375.0, 18527.0, 32837.0, 57603.0, 97245.0, 146823.0, 183590.0, 172930.0, 127436.0, 79759.0, 46450.0, 26212.0, 14690.0, 8345.0, 4804.0, 2711.0, 1644.0, 885.0, 555.0, 385.0, 220.0, 111.0, 89.0, 52.0, 36.0, 24.0, 18.0, 18.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.30908203125, -0.29965972900390625, -0.2902374267578125, -0.28081512451171875, -0.271392822265625, -0.26197052001953125, -0.2525482177734375, -0.24312591552734375, -0.23370361328125, -0.22428131103515625, -0.2148590087890625, -0.20543670654296875, -0.196014404296875, -0.18659210205078125, -0.1771697998046875, -0.16774749755859375, -0.1583251953125, -0.14890289306640625, -0.1394805908203125, -0.13005828857421875, -0.120635986328125, -0.11121368408203125, -0.1017913818359375, -0.09236907958984375, -0.08294677734375, -0.07352447509765625, -0.0641021728515625, -0.05467987060546875, -0.045257568359375, -0.03583526611328125, -0.0264129638671875, -0.01699066162109375, -0.007568359375, 0.00185394287109375, 0.0112762451171875, 0.02069854736328125, 0.030120849609375, 0.03954315185546875, 0.0489654541015625, 0.05838775634765625, 0.06781005859375, 0.07723236083984375, 0.0866546630859375, 0.09607696533203125, 0.105499267578125, 0.11492156982421875, 0.1243438720703125, 0.13376617431640625, 0.1431884765625, 0.15261077880859375, 0.1620330810546875, 0.17145538330078125, 0.180877685546875, 0.19029998779296875, 0.1997222900390625, 0.20914459228515625, 0.21856689453125, 0.22798919677734375, 0.2374114990234375, 0.24683380126953125, 0.256256103515625, 0.26567840576171875, 0.2751007080078125, 0.28452301025390625, 0.2939453125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 12.0, 6.0, 10.0, 9.0, 19.0, 22.0, 15.0, 21.0, 14.0, 24.0, 39.0, 42.0, 41.0, 42.0, 52.0, 39.0, 54.0, 39.0, 61.0, 49.0, 56.0, 53.0, 49.0, 39.0, 29.0, 24.0, 15.0, 21.0, 23.0, 24.0, 19.0, 4.0, 3.0, 8.0, 3.0, 5.0, 7.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.461669921875, -0.4466514587402344, -0.43163299560546875, -0.4166145324707031, -0.4015960693359375, -0.3865776062011719, -0.37155914306640625, -0.3565406799316406, -0.341522216796875, -0.3265037536621094, -0.31148529052734375, -0.2964668273925781, -0.2814483642578125, -0.2664299011230469, -0.25141143798828125, -0.23639297485351562, -0.22137451171875, -0.20635604858398438, -0.19133758544921875, -0.17631912231445312, -0.1613006591796875, -0.14628219604492188, -0.13126373291015625, -0.11624526977539062, -0.101226806640625, -0.08620834350585938, -0.07118988037109375, -0.056171417236328125, -0.0411529541015625, -0.026134490966796875, -0.01111602783203125, 0.003902435302734375, 0.0189208984375, 0.033939361572265625, 0.04895782470703125, 0.06397628784179688, 0.0789947509765625, 0.09401321411132812, 0.10903167724609375, 0.12405014038085938, 0.139068603515625, 0.15408706665039062, 0.16910552978515625, 0.18412399291992188, 0.1991424560546875, 0.21416091918945312, 0.22917938232421875, 0.24419784545898438, 0.25921630859375, 0.2742347717285156, 0.28925323486328125, 0.3042716979980469, 0.3192901611328125, 0.3343086242675781, 0.34932708740234375, 0.3643455505371094, 0.379364013671875, 0.3943824768066406, 0.40940093994140625, 0.4244194030761719, 0.4394378662109375, 0.4544563293457031, 0.46947479248046875, 0.4844932556152344, 0.49951171875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 14.0, 21.0, 55.0, 114.0, 188.0, 188.0, 178.0, 111.0, 69.0, 22.0, 6.0, 6.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.035860061645508, -14.526975631713867, -14.01809024810791, -13.50920581817627, -13.000321388244629, -12.491436004638672, -11.982551574707031, -11.47366714477539, -10.96478271484375, -10.45589828491211, -9.947012901306152, -9.438128471374512, -8.929244041442871, -8.420358657836914, -7.911474227905273, -7.402589797973633, -6.893704414367676, -6.384819507598877, -5.875935077667236, -5.3670501708984375, -4.858165740966797, -4.349280834197998, -3.840395927429199, -3.3315112590789795, -2.8226265907287598, -2.31374192237854, -1.8048571348190308, -1.2959723472595215, -0.7870876789093018, -0.27820301055908203, 0.2306818962097168, 0.7395665645599365, 1.2484512329101562, 1.757335901260376, 2.2662205696105957, 2.7751054763793945, 3.2839901447296143, 3.792874813079834, 4.301759719848633, 4.810644149780273, 5.319529056549072, 5.828413963317871, 6.337298393249512, 6.8461833000183105, 7.355068206787109, 7.86395263671875, 8.37283706665039, 8.881722450256348, 9.390606880187988, 9.899491310119629, 10.408376693725586, 10.917261123657227, 11.426145553588867, 11.935029983520508, 12.443915367126465, 12.952799797058105, 13.461685180664062, 13.970569610595703, 14.47945499420166, 14.9883394241333, 15.497223854064941, 16.0061092376709, 16.51499366760254, 17.02387809753418, 17.53276252746582]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 8.0, 7.0, 3.0, 8.0, 11.0, 12.0, 12.0, 18.0, 18.0, 22.0, 15.0, 30.0, 30.0, 33.0, 32.0, 41.0, 48.0, 31.0, 50.0, 38.0, 50.0, 40.0, 42.0, 40.0, 38.0, 41.0, 39.0, 22.0, 30.0, 33.0, 36.0, 18.0, 13.0, 10.0, 14.0, 14.0, 5.0, 13.0, 10.0, 5.0, 6.0, 3.0, 9.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.763487339019775, -6.536324977874756, -6.309162139892578, -6.081999778747559, -5.854836940765381, -5.627674579620361, -5.400511741638184, -5.173349380493164, -4.9461870193481445, -4.719024658203125, -4.491861820220947, -4.264699459075928, -4.03753662109375, -3.8103742599487305, -3.583211660385132, -3.356049060821533, -3.1288862228393555, -2.901723623275757, -2.674561023712158, -2.4473986625671387, -2.220235824584961, -1.9930733442306519, -1.7659108638763428, -1.5387482643127441, -1.3115856647491455, -1.0844230651855469, -0.857260525226593, -0.6300979852676392, -0.4029353857040405, -0.1757727861404419, 0.05138969421386719, 0.2785522937774658, 0.5057153701782227, 0.7328779697418213, 0.9600405097007751, 1.187203049659729, 1.4143656492233276, 1.6415282487869263, 1.8686907291412354, 2.095853328704834, 2.3230159282684326, 2.5501785278320312, 2.77734112739563, 3.0045037269592285, 3.231666088104248, 3.458828926086426, 3.6859912872314453, 3.913153886795044, 4.140316486358643, 4.367478847503662, 4.59464168548584, 4.821804046630859, 5.048966884613037, 5.276129245758057, 5.503292083740234, 5.730454444885254, 5.957616806030273, 6.184779167175293, 6.411942005157471, 6.63910436630249, 6.866267204284668, 7.0934295654296875, 7.320591926574707, 7.547754764556885, 7.7749176025390625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 8.0, 12.0, 9.0, 14.0, 15.0, 30.0, 32.0, 49.0, 84.0, 117.0, 194.0, 356.0, 585.0, 984.0, 1704.0, 3143.0, 5599.0, 11024.0, 22542.0, 48547.0, 109999.0, 249411.0, 522416.0, 900822.0, 1011801.0, 682729.0, 343131.0, 151800.0, 66508.0, 29903.0, 14386.0, 7340.0, 3996.0, 1988.0, 1227.0, 666.0, 363.0, 266.0, 167.0, 116.0, 62.0, 40.0, 26.0, 26.0, 13.0, 7.0, 5.0, 8.0, 3.0, 5.0, 3.0, 3.0, 0.0, 3.0], "bins": [-0.9267578125, -0.899658203125, -0.87255859375, -0.845458984375, -0.818359375, -0.791259765625, -0.76416015625, -0.737060546875, -0.7099609375, -0.682861328125, -0.65576171875, -0.628662109375, -0.6015625, -0.574462890625, -0.54736328125, -0.520263671875, -0.4931640625, -0.466064453125, -0.43896484375, -0.411865234375, -0.384765625, -0.357666015625, -0.33056640625, -0.303466796875, -0.2763671875, -0.249267578125, -0.22216796875, -0.195068359375, -0.16796875, -0.140869140625, -0.11376953125, -0.086669921875, -0.0595703125, -0.032470703125, -0.00537109375, 0.021728515625, 0.048828125, 0.075927734375, 0.10302734375, 0.130126953125, 0.1572265625, 0.184326171875, 0.21142578125, 0.238525390625, 0.265625, 0.292724609375, 0.31982421875, 0.346923828125, 0.3740234375, 0.401123046875, 0.42822265625, 0.455322265625, 0.482421875, 0.509521484375, 0.53662109375, 0.563720703125, 0.5908203125, 0.617919921875, 0.64501953125, 0.672119140625, 0.69921875, 0.726318359375, 0.75341796875, 0.780517578125, 0.8076171875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 13.0, 12.0, 23.0, 20.0, 12.0, 28.0, 20.0, 27.0, 30.0, 30.0, 21.0, 26.0, 32.0, 31.0, 39.0, 37.0, 48.0, 42.0, 45.0, 47.0, 44.0, 33.0, 34.0, 32.0, 37.0, 28.0, 25.0, 23.0, 27.0, 17.0, 16.0, 21.0, 11.0, 13.0, 6.0, 9.0, 6.0, 5.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-1.025390625, -0.9957275390625, -0.966064453125, -0.9364013671875, -0.90673828125, -0.8770751953125, -0.847412109375, -0.8177490234375, -0.7880859375, -0.7584228515625, -0.728759765625, -0.6990966796875, -0.66943359375, -0.6397705078125, -0.610107421875, -0.5804443359375, -0.55078125, -0.5211181640625, -0.491455078125, -0.4617919921875, -0.43212890625, -0.4024658203125, -0.372802734375, -0.3431396484375, -0.3134765625, -0.2838134765625, -0.254150390625, -0.2244873046875, -0.19482421875, -0.1651611328125, -0.135498046875, -0.1058349609375, -0.076171875, -0.0465087890625, -0.016845703125, 0.0128173828125, 0.04248046875, 0.0721435546875, 0.101806640625, 0.1314697265625, 0.1611328125, 0.1907958984375, 0.220458984375, 0.2501220703125, 0.27978515625, 0.3094482421875, 0.339111328125, 0.3687744140625, 0.3984375, 0.4281005859375, 0.457763671875, 0.4874267578125, 0.51708984375, 0.5467529296875, 0.576416015625, 0.6060791015625, 0.6357421875, 0.6654052734375, 0.695068359375, 0.7247314453125, 0.75439453125, 0.7840576171875, 0.813720703125, 0.8433837890625, 0.873046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 7.0, 7.0, 9.0, 19.0, 33.0, 33.0, 52.0, 71.0, 114.0, 177.0, 274.0, 442.0, 692.0, 1200.0, 2002.0, 3557.0, 6514.0, 12795.0, 25717.0, 55584.0, 129956.0, 331661.0, 908875.0, 1484852.0, 749451.0, 274902.0, 109977.0, 47861.0, 22593.0, 11153.0, 5851.0, 3166.0, 1815.0, 1151.0, 634.0, 364.0, 269.0, 147.0, 90.0, 58.0, 49.0, 35.0, 21.0, 14.0, 7.0, 5.0, 7.0, 2.0, 5.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0], "bins": [-1.0234375, -0.991851806640625, -0.96026611328125, -0.928680419921875, -0.8970947265625, -0.865509033203125, -0.83392333984375, -0.802337646484375, -0.770751953125, -0.739166259765625, -0.70758056640625, -0.675994873046875, -0.6444091796875, -0.612823486328125, -0.58123779296875, -0.549652099609375, -0.51806640625, -0.486480712890625, -0.45489501953125, -0.423309326171875, -0.3917236328125, -0.360137939453125, -0.32855224609375, -0.296966552734375, -0.265380859375, -0.233795166015625, -0.20220947265625, -0.170623779296875, -0.1390380859375, -0.107452392578125, -0.07586669921875, -0.044281005859375, -0.0126953125, 0.018890380859375, 0.05047607421875, 0.082061767578125, 0.1136474609375, 0.145233154296875, 0.17681884765625, 0.208404541015625, 0.239990234375, 0.271575927734375, 0.30316162109375, 0.334747314453125, 0.3663330078125, 0.397918701171875, 0.42950439453125, 0.461090087890625, 0.49267578125, 0.524261474609375, 0.55584716796875, 0.587432861328125, 0.6190185546875, 0.650604248046875, 0.68218994140625, 0.713775634765625, 0.745361328125, 0.776947021484375, 0.80853271484375, 0.840118408203125, 0.8717041015625, 0.903289794921875, 0.93487548828125, 0.966461181640625, 0.998046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 9.0, 7.0, 11.0, 13.0, 19.0, 21.0, 19.0, 38.0, 43.0, 63.0, 65.0, 87.0, 104.0, 135.0, 130.0, 215.0, 278.0, 332.0, 348.0, 388.0, 354.0, 306.0, 224.0, 172.0, 135.0, 108.0, 91.0, 79.0, 55.0, 62.0, 33.0, 24.0, 15.0, 15.0, 16.0, 12.0, 5.0, 5.0, 9.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0], "bins": [-1.4443359375, -1.4021759033203125, -1.360015869140625, -1.3178558349609375, -1.27569580078125, -1.2335357666015625, -1.191375732421875, -1.1492156982421875, -1.1070556640625, -1.0648956298828125, -1.022735595703125, -0.9805755615234375, -0.93841552734375, -0.8962554931640625, -0.854095458984375, -0.8119354248046875, -0.769775390625, -0.7276153564453125, -0.685455322265625, -0.6432952880859375, -0.60113525390625, -0.5589752197265625, -0.516815185546875, -0.4746551513671875, -0.4324951171875, -0.3903350830078125, -0.348175048828125, -0.3060150146484375, -0.26385498046875, -0.2216949462890625, -0.179534912109375, -0.1373748779296875, -0.09521484375, -0.0530548095703125, -0.010894775390625, 0.0312652587890625, 0.07342529296875, 0.1155853271484375, 0.157745361328125, 0.1999053955078125, 0.2420654296875, 0.2842254638671875, 0.326385498046875, 0.3685455322265625, 0.41070556640625, 0.4528656005859375, 0.495025634765625, 0.5371856689453125, 0.579345703125, 0.6215057373046875, 0.663665771484375, 0.7058258056640625, 0.74798583984375, 0.7901458740234375, 0.832305908203125, 0.8744659423828125, 0.9166259765625, 0.9587860107421875, 1.000946044921875, 1.0431060791015625, 1.08526611328125, 1.1274261474609375, 1.169586181640625, 1.2117462158203125, 1.25390625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 10.0, 5.0, 16.0, 23.0, 65.0, 109.0, 170.0, 216.0, 180.0, 96.0, 57.0, 29.0, 11.0, 8.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.010448455810547, -26.372703552246094, -25.734960556030273, -25.09721565246582, -24.45947265625, -23.821727752685547, -23.183982849121094, -22.54623794555664, -21.90849494934082, -21.270750045776367, -20.633007049560547, -19.995262145996094, -19.35751724243164, -18.71977424621582, -18.082029342651367, -17.444286346435547, -16.806541442871094, -16.16879653930664, -15.53105354309082, -14.893308639526367, -14.25556468963623, -13.617820739746094, -12.98007583618164, -12.342331886291504, -11.704587936401367, -11.06684398651123, -10.429100036621094, -9.79135513305664, -9.153611183166504, -8.515867233276367, -7.878122806549072, -7.240378379821777, -6.602635383605957, -5.96489143371582, -5.327147006988525, -4.6894025802612305, -4.051658630371094, -3.413914442062378, -2.776170253753662, -2.138425827026367, -1.5006818771362305, -0.8629376888275146, -0.22519350051879883, 0.412550687789917, 1.0502948760986328, 1.6880390644073486, 2.3257832527160645, 2.9635276794433594, 3.601271629333496, 4.239015579223633, 4.876760005950928, 5.514504432678223, 6.152248382568359, 6.789992332458496, 7.427736759185791, 8.065481185913086, 8.703225135803223, 9.34096908569336, 9.978713989257812, 10.61645793914795, 11.254201889038086, 11.891945838928223, 12.52968978881836, 13.167434692382812, 13.80517864227295]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 10.0, 13.0, 10.0, 20.0, 16.0, 19.0, 27.0, 21.0, 36.0, 22.0, 31.0, 35.0, 40.0, 30.0, 48.0, 49.0, 49.0, 65.0, 54.0, 45.0, 52.0, 50.0, 31.0, 28.0, 32.0, 23.0, 27.0, 14.0, 19.0, 13.0, 13.0, 8.0, 9.0, 9.0, 11.0, 7.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.013010025024414, -5.830756187438965, -5.648501873016357, -5.466248035430908, -5.283993721008301, -5.101739883422852, -4.919486045837402, -4.737231731414795, -4.5549774169921875, -4.372723579406738, -4.190469264984131, -4.008215427398682, -3.825961112976074, -3.643707275390625, -3.4614531993865967, -3.2791991233825684, -3.096945285797119, -2.914691209793091, -2.7324371337890625, -2.5501832962036133, -2.367928981781006, -2.1856751441955566, -2.0034210681915283, -1.8211669921875, -1.6389129161834717, -1.4566588401794434, -1.274404764175415, -1.0921508073806763, -0.909896731376648, -0.7276426553726196, -0.5453886985778809, -0.36313462257385254, -0.18088102340698242, 0.0013730227947235107, 0.18362706899642944, 0.365881085395813, 0.5481351613998413, 0.7303892374038696, 0.9126431941986084, 1.0948972702026367, 1.277151346206665, 1.4594054222106934, 1.6416594982147217, 1.8239134550094604, 2.006167411804199, 2.1884217262268066, 2.370675563812256, 2.552929639816284, 2.7351837158203125, 2.917437791824341, 3.099691867828369, 3.2819457054138184, 3.464200019836426, 3.646453857421875, 3.8287079334259033, 4.010962009429932, 4.193216323852539, 4.375470161437988, 4.557724475860596, 4.739978313446045, 4.922232627868652, 5.104486465454102, 5.286740303039551, 5.468994617462158, 5.651248455047607]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 9.0, 12.0, 27.0, 48.0, 47.0, 84.0, 122.0, 224.0, 348.0, 623.0, 1046.0, 1925.0, 3462.0, 6479.0, 12191.0, 23531.0, 43799.0, 77984.0, 127081.0, 178642.0, 192540.0, 152982.0, 99813.0, 58171.0, 31138.0, 16731.0, 8823.0, 4734.0, 2515.0, 1446.0, 731.0, 485.0, 297.0, 166.0, 95.0, 62.0, 38.0, 28.0, 29.0, 12.0, 8.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.873046875, -0.8467788696289062, -0.8205108642578125, -0.7942428588867188, -0.767974853515625, -0.7417068481445312, -0.7154388427734375, -0.6891708374023438, -0.66290283203125, -0.6366348266601562, -0.6103668212890625, -0.5840988159179688, -0.557830810546875, -0.5315628051757812, -0.5052947998046875, -0.47902679443359375, -0.4527587890625, -0.42649078369140625, -0.4002227783203125, -0.37395477294921875, -0.347686767578125, -0.32141876220703125, -0.2951507568359375, -0.26888275146484375, -0.24261474609375, -0.21634674072265625, -0.1900787353515625, -0.16381072998046875, -0.137542724609375, -0.11127471923828125, -0.0850067138671875, -0.05873870849609375, -0.032470703125, -0.00620269775390625, 0.0200653076171875, 0.04633331298828125, 0.072601318359375, 0.09886932373046875, 0.1251373291015625, 0.15140533447265625, 0.17767333984375, 0.20394134521484375, 0.2302093505859375, 0.25647735595703125, 0.282745361328125, 0.30901336669921875, 0.3352813720703125, 0.36154937744140625, 0.3878173828125, 0.41408538818359375, 0.4403533935546875, 0.46662139892578125, 0.492889404296875, 0.5191574096679688, 0.5454254150390625, 0.5716934204101562, 0.59796142578125, 0.6242294311523438, 0.6504974365234375, 0.6767654418945312, 0.703033447265625, 0.7293014526367188, 0.7555694580078125, 0.7818374633789062, 0.80810546875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 5.0, 4.0, 10.0, 13.0, 11.0, 15.0, 27.0, 25.0, 23.0, 27.0, 37.0, 25.0, 49.0, 28.0, 43.0, 34.0, 43.0, 51.0, 45.0, 38.0, 40.0, 39.0, 40.0, 37.0, 49.0, 46.0, 36.0, 21.0, 21.0, 18.0, 16.0, 16.0, 11.0, 20.0, 14.0, 10.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1123046875, -1.074859619140625, -1.03741455078125, -0.999969482421875, -0.9625244140625, -0.925079345703125, -0.88763427734375, -0.850189208984375, -0.812744140625, -0.775299072265625, -0.73785400390625, -0.700408935546875, -0.6629638671875, -0.625518798828125, -0.58807373046875, -0.550628662109375, -0.51318359375, -0.475738525390625, -0.43829345703125, -0.400848388671875, -0.3634033203125, -0.325958251953125, -0.28851318359375, -0.251068115234375, -0.213623046875, -0.176177978515625, -0.13873291015625, -0.101287841796875, -0.0638427734375, -0.026397705078125, 0.01104736328125, 0.048492431640625, 0.0859375, 0.123382568359375, 0.16082763671875, 0.198272705078125, 0.2357177734375, 0.273162841796875, 0.31060791015625, 0.348052978515625, 0.385498046875, 0.422943115234375, 0.46038818359375, 0.497833251953125, 0.5352783203125, 0.572723388671875, 0.61016845703125, 0.647613525390625, 0.68505859375, 0.722503662109375, 0.75994873046875, 0.797393798828125, 0.8348388671875, 0.872283935546875, 0.90972900390625, 0.947174072265625, 0.984619140625, 1.022064208984375, 1.05950927734375, 1.096954345703125, 1.1343994140625, 1.171844482421875, 1.20928955078125, 1.246734619140625, 1.2841796875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 7.0, 9.0, 7.0, 11.0, 26.0, 25.0, 50.0, 72.0, 120.0, 228.0, 413.0, 885.0, 1803.0, 3833.0, 8728.0, 19717.0, 46163.0, 100615.0, 192961.0, 289958.0, 195852.0, 102830.0, 47068.0, 20509.0, 8954.0, 4003.0, 1812.0, 885.0, 424.0, 220.0, 144.0, 71.0, 50.0, 30.0, 34.0, 11.0, 11.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.111328125, -1.0771484375, -1.04296875, -1.0087890625, -0.974609375, -0.9404296875, -0.90625, -0.8720703125, -0.837890625, -0.8037109375, -0.76953125, -0.7353515625, -0.701171875, -0.6669921875, -0.6328125, -0.5986328125, -0.564453125, -0.5302734375, -0.49609375, -0.4619140625, -0.427734375, -0.3935546875, -0.359375, -0.3251953125, -0.291015625, -0.2568359375, -0.22265625, -0.1884765625, -0.154296875, -0.1201171875, -0.0859375, -0.0517578125, -0.017578125, 0.0166015625, 0.05078125, 0.0849609375, 0.119140625, 0.1533203125, 0.1875, 0.2216796875, 0.255859375, 0.2900390625, 0.32421875, 0.3583984375, 0.392578125, 0.4267578125, 0.4609375, 0.4951171875, 0.529296875, 0.5634765625, 0.59765625, 0.6318359375, 0.666015625, 0.7001953125, 0.734375, 0.7685546875, 0.802734375, 0.8369140625, 0.87109375, 0.9052734375, 0.939453125, 0.9736328125, 1.0078125, 1.0419921875, 1.076171875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 7.0, 5.0, 2.0, 6.0, 12.0, 13.0, 13.0, 13.0, 17.0, 11.0, 24.0, 13.0, 21.0, 17.0, 30.0, 41.0, 30.0, 30.0, 36.0, 47.0, 37.0, 24.0, 37.0, 41.0, 37.0, 44.0, 41.0, 35.0, 29.0, 35.0, 22.0, 30.0, 28.0, 24.0, 20.0, 17.0, 14.0, 18.0, 14.0, 12.0, 12.0, 11.0, 7.0, 2.0, 9.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.6328125, -2.54962158203125, -2.4664306640625, -2.38323974609375, -2.300048828125, -2.21685791015625, -2.1336669921875, -2.05047607421875, -1.96728515625, -1.88409423828125, -1.8009033203125, -1.71771240234375, -1.634521484375, -1.55133056640625, -1.4681396484375, -1.38494873046875, -1.3017578125, -1.21856689453125, -1.1353759765625, -1.05218505859375, -0.968994140625, -0.88580322265625, -0.8026123046875, -0.71942138671875, -0.63623046875, -0.55303955078125, -0.4698486328125, -0.38665771484375, -0.303466796875, -0.22027587890625, -0.1370849609375, -0.05389404296875, 0.029296875, 0.11248779296875, 0.1956787109375, 0.27886962890625, 0.362060546875, 0.44525146484375, 0.5284423828125, 0.61163330078125, 0.69482421875, 0.77801513671875, 0.8612060546875, 0.94439697265625, 1.027587890625, 1.11077880859375, 1.1939697265625, 1.27716064453125, 1.3603515625, 1.44354248046875, 1.5267333984375, 1.60992431640625, 1.693115234375, 1.77630615234375, 1.8594970703125, 1.94268798828125, 2.02587890625, 2.10906982421875, 2.1922607421875, 2.27545166015625, 2.358642578125, 2.44183349609375, 2.5250244140625, 2.60821533203125, 2.69140625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 11.0, 14.0, 18.0, 38.0, 43.0, 77.0, 127.0, 194.0, 346.0, 560.0, 906.0, 1639.0, 2830.0, 5028.0, 8869.0, 15886.0, 29142.0, 51830.0, 90465.0, 146145.0, 227834.0, 181963.0, 120851.0, 71832.0, 40770.0, 22485.0, 12457.0, 6845.0, 3926.0, 2234.0, 1266.0, 791.0, 413.0, 253.0, 178.0, 110.0, 65.0, 38.0, 28.0, 10.0, 14.0, 5.0, 5.0, 3.0, 6.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.2301025390625, -0.22348785400390625, -0.2168731689453125, -0.21025848388671875, -0.203643798828125, -0.19702911376953125, -0.1904144287109375, -0.18379974365234375, -0.17718505859375, -0.17057037353515625, -0.1639556884765625, -0.15734100341796875, -0.150726318359375, -0.14411163330078125, -0.1374969482421875, -0.13088226318359375, -0.124267578125, -0.11765289306640625, -0.1110382080078125, -0.10442352294921875, -0.097808837890625, -0.09119415283203125, -0.0845794677734375, -0.07796478271484375, -0.07135009765625, -0.06473541259765625, -0.0581207275390625, -0.05150604248046875, -0.044891357421875, -0.03827667236328125, -0.0316619873046875, -0.02504730224609375, -0.0184326171875, -0.01181793212890625, -0.0052032470703125, 0.00141143798828125, 0.008026123046875, 0.01464080810546875, 0.0212554931640625, 0.02787017822265625, 0.03448486328125, 0.04109954833984375, 0.0477142333984375, 0.05432891845703125, 0.060943603515625, 0.06755828857421875, 0.0741729736328125, 0.08078765869140625, 0.08740234375, 0.09401702880859375, 0.1006317138671875, 0.10724639892578125, 0.113861083984375, 0.12047576904296875, 0.1270904541015625, 0.13370513916015625, 0.14031982421875, 0.14693450927734375, 0.1535491943359375, 0.16016387939453125, 0.166778564453125, 0.17339324951171875, 0.1800079345703125, 0.18662261962890625, 0.1932373046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 13.0, 11.0, 11.0, 16.0, 25.0, 27.0, 31.0, 34.0, 55.0, 67.0, 74.0, 83.0, 69.0, 85.0, 72.0, 73.0, 47.0, 45.0, 35.0, 22.0, 17.0, 19.0, 13.0, 6.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00012373924255371094, -0.00011962652206420898, -0.00011551380157470703, -0.00011140108108520508, -0.00010728836059570312, -0.00010317564010620117, -9.906291961669922e-05, -9.495019912719727e-05, -9.083747863769531e-05, -8.672475814819336e-05, -8.26120376586914e-05, -7.849931716918945e-05, -7.43865966796875e-05, -7.027387619018555e-05, -6.61611557006836e-05, -6.204843521118164e-05, -5.793571472167969e-05, -5.3822994232177734e-05, -4.971027374267578e-05, -4.559755325317383e-05, -4.1484832763671875e-05, -3.737211227416992e-05, -3.325939178466797e-05, -2.9146671295166016e-05, -2.5033950805664062e-05, -2.092123031616211e-05, -1.6808509826660156e-05, -1.2695789337158203e-05, -8.58306884765625e-06, -4.470348358154297e-06, -3.5762786865234375e-07, 3.7550926208496094e-06, 7.867813110351562e-06, 1.1980533599853516e-05, 1.609325408935547e-05, 2.0205974578857422e-05, 2.4318695068359375e-05, 2.8431415557861328e-05, 3.254413604736328e-05, 3.6656856536865234e-05, 4.076957702636719e-05, 4.488229751586914e-05, 4.8995018005371094e-05, 5.310773849487305e-05, 5.7220458984375e-05, 6.133317947387695e-05, 6.54458999633789e-05, 6.955862045288086e-05, 7.367134094238281e-05, 7.778406143188477e-05, 8.189678192138672e-05, 8.600950241088867e-05, 9.012222290039062e-05, 9.423494338989258e-05, 9.834766387939453e-05, 0.00010246038436889648, 0.00010657310485839844, 0.00011068582534790039, 0.00011479854583740234, 0.0001189112663269043, 0.00012302398681640625, 0.0001271367073059082, 0.00013124942779541016, 0.0001353621482849121, 0.00013947486877441406]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 6.0, 8.0, 13.0, 21.0, 20.0, 34.0, 51.0, 81.0, 109.0, 165.0, 284.0, 486.0, 711.0, 1123.0, 1901.0, 3046.0, 4989.0, 8163.0, 13287.0, 22195.0, 35900.0, 57072.0, 88608.0, 126796.0, 185033.0, 159026.0, 119521.0, 81977.0, 52858.0, 32874.0, 20501.0, 12199.0, 7545.0, 4543.0, 2800.0, 1761.0, 1064.0, 646.0, 420.0, 236.0, 162.0, 106.0, 63.0, 39.0, 41.0, 33.0, 11.0, 14.0, 5.0, 4.0, 8.0, 3.0, 0.0, 1.0], "bins": [-0.20361328125, -0.19778060913085938, -0.19194793701171875, -0.18611526489257812, -0.1802825927734375, -0.17444992065429688, -0.16861724853515625, -0.16278457641601562, -0.156951904296875, -0.15111923217773438, -0.14528656005859375, -0.13945388793945312, -0.1336212158203125, -0.12778854370117188, -0.12195587158203125, -0.11612319946289062, -0.11029052734375, -0.10445785522460938, -0.09862518310546875, -0.09279251098632812, -0.0869598388671875, -0.08112716674804688, -0.07529449462890625, -0.06946182250976562, -0.063629150390625, -0.057796478271484375, -0.05196380615234375, -0.046131134033203125, -0.0402984619140625, -0.034465789794921875, -0.02863311767578125, -0.022800445556640625, -0.0169677734375, -0.011135101318359375, -0.00530242919921875, 0.000530242919921875, 0.0063629150390625, 0.012195587158203125, 0.01802825927734375, 0.023860931396484375, 0.029693603515625, 0.035526275634765625, 0.04135894775390625, 0.047191619873046875, 0.0530242919921875, 0.058856964111328125, 0.06468963623046875, 0.07052230834960938, 0.07635498046875, 0.08218765258789062, 0.08802032470703125, 0.09385299682617188, 0.0996856689453125, 0.10551834106445312, 0.11135101318359375, 0.11718368530273438, 0.123016357421875, 0.12884902954101562, 0.13468170166015625, 0.14051437377929688, 0.1463470458984375, 0.15217971801757812, 0.15801239013671875, 0.16384506225585938, 0.169677734375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 1.0, 3.0, 6.0, 8.0, 4.0, 14.0, 11.0, 18.0, 15.0, 20.0, 16.0, 32.0, 33.0, 29.0, 35.0, 36.0, 35.0, 49.0, 38.0, 57.0, 57.0, 61.0, 50.0, 49.0, 37.0, 44.0, 37.0, 35.0, 26.0, 27.0, 23.0, 21.0, 12.0, 15.0, 13.0, 12.0, 7.0, 4.0, 2.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.375732421875, -0.3647422790527344, -0.35375213623046875, -0.3427619934082031, -0.3317718505859375, -0.3207817077636719, -0.30979156494140625, -0.2988014221191406, -0.287811279296875, -0.2768211364746094, -0.26583099365234375, -0.2548408508300781, -0.2438507080078125, -0.23286056518554688, -0.22187042236328125, -0.21088027954101562, -0.19989013671875, -0.18889999389648438, -0.17790985107421875, -0.16691970825195312, -0.1559295654296875, -0.14493942260742188, -0.13394927978515625, -0.12295913696289062, -0.111968994140625, -0.10097885131835938, -0.08998870849609375, -0.07899856567382812, -0.0680084228515625, -0.057018280029296875, -0.04602813720703125, -0.035037994384765625, -0.0240478515625, -0.013057708740234375, -0.00206756591796875, 0.008922576904296875, 0.0199127197265625, 0.030902862548828125, 0.04189300537109375, 0.052883148193359375, 0.063873291015625, 0.07486343383789062, 0.08585357666015625, 0.09684371948242188, 0.1078338623046875, 0.11882400512695312, 0.12981414794921875, 0.14080429077148438, 0.15179443359375, 0.16278457641601562, 0.17377471923828125, 0.18476486206054688, 0.1957550048828125, 0.20674514770507812, 0.21773529052734375, 0.22872543334960938, 0.239715576171875, 0.2507057189941406, 0.26169586181640625, 0.2726860046386719, 0.2836761474609375, 0.2946662902832031, 0.30565643310546875, 0.3166465759277344, 0.32763671875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 3.0, 7.0, 5.0, 14.0, 17.0, 42.0, 74.0, 103.0, 143.0, 163.0, 142.0, 120.0, 77.0, 41.0, 18.0, 13.0, 3.0, 8.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.754478454589844, -5.406192779541016, -5.0579071044921875, -4.709620952606201, -4.361335277557373, -4.013049602508545, -3.6647636890411377, -3.3164777755737305, -2.9681921005249023, -2.619906425476074, -2.271620512008667, -1.9233347177505493, -1.5750489234924316, -1.226763129234314, -0.8784773349761963, -0.5301914215087891, -0.18190574645996094, 0.16638004779815674, 0.5146658420562744, 0.8629516363143921, 1.2112374305725098, 1.5595232248306274, 1.9078090190887451, 2.2560949325561523, 2.6043806076049805, 2.9526662826538086, 3.300952196121216, 3.649238109588623, 3.997523784637451, 4.345809459686279, 4.694095611572266, 5.042381286621094, 5.390666961669922, 5.73895263671875, 6.087238311767578, 6.4355244636535645, 6.783810138702393, 7.132095813751221, 7.480381965637207, 7.828667640686035, 8.176953315734863, 8.525238990783691, 8.87352466583252, 9.221810340881348, 9.570096969604492, 9.91838264465332, 10.266668319702148, 10.614953994750977, 10.963239669799805, 11.311525344848633, 11.659811019897461, 12.008096694946289, 12.356382369995117, 12.704668998718262, 13.05295467376709, 13.401240348815918, 13.749526023864746, 14.097811698913574, 14.446097373962402, 14.79438304901123, 15.142669677734375, 15.490955352783203, 15.839241027832031, 16.18752670288086, 16.535812377929688]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 6.0, 8.0, 14.0, 13.0, 10.0, 15.0, 14.0, 23.0, 27.0, 21.0, 24.0, 33.0, 34.0, 35.0, 28.0, 32.0, 47.0, 39.0, 40.0, 43.0, 36.0, 42.0, 43.0, 37.0, 30.0, 37.0, 30.0, 22.0, 30.0, 27.0, 24.0, 15.0, 18.0, 16.0, 20.0, 14.0, 12.0, 8.0, 5.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.588969707489014, -6.373042106628418, -6.157114028930664, -5.941186428070068, -5.725258827209473, -5.509331226348877, -5.293403625488281, -5.077475547790527, -4.861547946929932, -4.645620346069336, -4.429692268371582, -4.213764667510986, -3.9978370666503906, -3.781909465789795, -3.56598162651062, -3.3500537872314453, -3.1341261863708496, -2.918198585510254, -2.702270746231079, -2.4863429069519043, -2.2704153060913086, -2.054487705230713, -1.838559865951538, -1.6226321458816528, -1.4067044258117676, -1.1907767057418823, -0.9748489856719971, -0.7589212656021118, -0.5429935455322266, -0.3270658254623413, -0.11113810539245605, 0.1047896146774292, 0.32071685791015625, 0.5366445779800415, 0.7525722980499268, 0.968500018119812, 1.1844277381896973, 1.4003554582595825, 1.6162831783294678, 1.832210898399353, 2.0481386184692383, 2.264066219329834, 2.479994058609009, 2.6959218978881836, 2.9118494987487793, 3.127777099609375, 3.34370493888855, 3.5596327781677246, 3.7755603790283203, 3.991487979888916, 4.207415580749512, 4.423343658447266, 4.639271259307861, 4.855198860168457, 5.071126937866211, 5.287054538726807, 5.502982139587402, 5.718909740447998, 5.934837341308594, 6.150765419006348, 6.366693019866943, 6.582620620727539, 6.798548698425293, 7.014476299285889, 7.230403900146484]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 16.0, 18.0, 34.0, 47.0, 67.0, 109.0, 178.0, 289.0, 445.0, 744.0, 1322.0, 2179.0, 4127.0, 8095.0, 16598.0, 34510.0, 71683.0, 142115.0, 260737.0, 430274.0, 604284.0, 701988.0, 668524.0, 524982.0, 340645.0, 190495.0, 95556.0, 47080.0, 22666.0, 11398.0, 5809.0, 3071.0, 1663.0, 992.0, 563.0, 364.0, 228.0, 136.0, 83.0, 46.0, 46.0, 20.0, 15.0, 11.0, 11.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.69580078125, -0.674530029296875, -0.65325927734375, -0.631988525390625, -0.6107177734375, -0.589447021484375, -0.56817626953125, -0.546905517578125, -0.525634765625, -0.504364013671875, -0.48309326171875, -0.461822509765625, -0.4405517578125, -0.419281005859375, -0.39801025390625, -0.376739501953125, -0.35546875, -0.334197998046875, -0.31292724609375, -0.291656494140625, -0.2703857421875, -0.249114990234375, -0.22784423828125, -0.206573486328125, -0.185302734375, -0.164031982421875, -0.14276123046875, -0.121490478515625, -0.1002197265625, -0.078948974609375, -0.05767822265625, -0.036407470703125, -0.01513671875, 0.006134033203125, 0.02740478515625, 0.048675537109375, 0.0699462890625, 0.091217041015625, 0.11248779296875, 0.133758544921875, 0.155029296875, 0.176300048828125, 0.19757080078125, 0.218841552734375, 0.2401123046875, 0.261383056640625, 0.28265380859375, 0.303924560546875, 0.3251953125, 0.346466064453125, 0.36773681640625, 0.389007568359375, 0.4102783203125, 0.431549072265625, 0.45281982421875, 0.474090576171875, 0.495361328125, 0.516632080078125, 0.53790283203125, 0.559173583984375, 0.5804443359375, 0.601715087890625, 0.62298583984375, 0.644256591796875, 0.66552734375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 7.0, 7.0, 9.0, 11.0, 18.0, 13.0, 17.0, 30.0, 25.0, 31.0, 39.0, 38.0, 41.0, 34.0, 58.0, 42.0, 42.0, 41.0, 59.0, 50.0, 46.0, 35.0, 36.0, 40.0, 34.0, 33.0, 35.0, 18.0, 24.0, 15.0, 22.0, 10.0, 7.0, 5.0, 7.0, 9.0, 3.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1513671875, -1.1163787841796875, -1.081390380859375, -1.0464019775390625, -1.01141357421875, -0.9764251708984375, -0.941436767578125, -0.9064483642578125, -0.8714599609375, -0.8364715576171875, -0.801483154296875, -0.7664947509765625, -0.73150634765625, -0.6965179443359375, -0.661529541015625, -0.6265411376953125, -0.591552734375, -0.5565643310546875, -0.521575927734375, -0.4865875244140625, -0.45159912109375, -0.4166107177734375, -0.381622314453125, -0.3466339111328125, -0.3116455078125, -0.2766571044921875, -0.241668701171875, -0.2066802978515625, -0.17169189453125, -0.1367034912109375, -0.101715087890625, -0.0667266845703125, -0.03173828125, 0.0032501220703125, 0.038238525390625, 0.0732269287109375, 0.10821533203125, 0.1432037353515625, 0.178192138671875, 0.2131805419921875, 0.2481689453125, 0.2831573486328125, 0.318145751953125, 0.3531341552734375, 0.38812255859375, 0.4231109619140625, 0.458099365234375, 0.4930877685546875, 0.528076171875, 0.5630645751953125, 0.598052978515625, 0.6330413818359375, 0.66802978515625, 0.7030181884765625, 0.738006591796875, 0.7729949951171875, 0.8079833984375, 0.8429718017578125, 0.877960205078125, 0.9129486083984375, 0.94793701171875, 0.9829254150390625, 1.017913818359375, 1.0529022216796875, 1.087890625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 10.0, 14.0, 14.0, 27.0, 21.0, 43.0, 57.0, 95.0, 141.0, 249.0, 419.0, 859.0, 2072.0, 6640.0, 32016.0, 292563.0, 2726580.0, 1028401.0, 84356.0, 13225.0, 3483.0, 1358.0, 672.0, 343.0, 199.0, 134.0, 81.0, 61.0, 50.0, 24.0, 19.0, 13.0, 10.0, 8.0, 3.0, 6.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.228515625, -2.150970458984375, -2.07342529296875, -1.995880126953125, -1.9183349609375, -1.840789794921875, -1.76324462890625, -1.685699462890625, -1.608154296875, -1.530609130859375, -1.45306396484375, -1.375518798828125, -1.2979736328125, -1.220428466796875, -1.14288330078125, -1.065338134765625, -0.98779296875, -0.910247802734375, -0.83270263671875, -0.755157470703125, -0.6776123046875, -0.600067138671875, -0.52252197265625, -0.444976806640625, -0.367431640625, -0.289886474609375, -0.21234130859375, -0.134796142578125, -0.0572509765625, 0.020294189453125, 0.09783935546875, 0.175384521484375, 0.2529296875, 0.330474853515625, 0.40802001953125, 0.485565185546875, 0.5631103515625, 0.640655517578125, 0.71820068359375, 0.795745849609375, 0.873291015625, 0.950836181640625, 1.02838134765625, 1.105926513671875, 1.1834716796875, 1.261016845703125, 1.33856201171875, 1.416107177734375, 1.49365234375, 1.571197509765625, 1.64874267578125, 1.726287841796875, 1.8038330078125, 1.881378173828125, 1.95892333984375, 2.036468505859375, 2.114013671875, 2.191558837890625, 2.26910400390625, 2.346649169921875, 2.4241943359375, 2.501739501953125, 2.57928466796875, 2.656829833984375, 2.734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 1.0, 5.0, 4.0, 8.0, 6.0, 8.0, 14.0, 10.0, 20.0, 30.0, 36.0, 56.0, 55.0, 82.0, 76.0, 126.0, 168.0, 224.0, 264.0, 295.0, 337.0, 350.0, 310.0, 323.0, 259.0, 229.0, 171.0, 145.0, 110.0, 105.0, 62.0, 47.0, 35.0, 26.0, 24.0, 14.0, 8.0, 8.0, 5.0, 3.0, 8.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.015625, -1.9609527587890625, -1.906280517578125, -1.8516082763671875, -1.79693603515625, -1.7422637939453125, -1.687591552734375, -1.6329193115234375, -1.5782470703125, -1.5235748291015625, -1.468902587890625, -1.4142303466796875, -1.35955810546875, -1.3048858642578125, -1.250213623046875, -1.1955413818359375, -1.140869140625, -1.0861968994140625, -1.031524658203125, -0.9768524169921875, -0.92218017578125, -0.8675079345703125, -0.812835693359375, -0.7581634521484375, -0.7034912109375, -0.6488189697265625, -0.594146728515625, -0.5394744873046875, -0.48480224609375, -0.4301300048828125, -0.375457763671875, -0.3207855224609375, -0.26611328125, -0.2114410400390625, -0.156768798828125, -0.1020965576171875, -0.04742431640625, 0.0072479248046875, 0.061920166015625, 0.1165924072265625, 0.1712646484375, 0.2259368896484375, 0.280609130859375, 0.3352813720703125, 0.38995361328125, 0.4446258544921875, 0.499298095703125, 0.5539703369140625, 0.608642578125, 0.6633148193359375, 0.717987060546875, 0.7726593017578125, 0.82733154296875, 0.8820037841796875, 0.936676025390625, 0.9913482666015625, 1.0460205078125, 1.1006927490234375, 1.155364990234375, 1.2100372314453125, 1.26470947265625, 1.3193817138671875, 1.374053955078125, 1.4287261962890625, 1.4833984375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 5.0, 11.0, 8.0, 8.0, 16.0, 26.0, 29.0, 37.0, 66.0, 63.0, 89.0, 105.0, 110.0, 104.0, 91.0, 70.0, 43.0, 30.0, 17.0, 16.0, 7.0, 11.0, 7.0, 9.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.719646453857422, -20.12316131591797, -19.52667808532715, -18.930192947387695, -18.333709716796875, -17.737224578857422, -17.1407413482666, -16.54425621032715, -15.947772026062012, -15.351287841796875, -14.754803657531738, -14.158319473266602, -13.561834335327148, -12.965351104736328, -12.368865966796875, -11.772381782531738, -11.175897598266602, -10.579413414001465, -9.982929229736328, -9.386445045471191, -8.789960861206055, -8.193475723266602, -7.596991539001465, -7.000507354736328, -6.404023170471191, -5.807538986206055, -5.211054801940918, -4.614570140838623, -4.018085956573486, -3.4216017723083496, -2.825117349624634, -2.228632926940918, -1.6321468353271484, -1.0356625318527222, -0.4391782283782959, 0.15730607509613037, 0.7537903785705566, 1.3502745628356934, 1.9467589855194092, 2.543243408203125, 3.1397275924682617, 3.7362117767333984, 4.332695960998535, 4.92918062210083, 5.525664806365967, 6.1221489906311035, 6.718633651733398, 7.315117835998535, 7.911602020263672, 8.508086204528809, 9.104570388793945, 9.701054573059082, 10.297538757324219, 10.894023895263672, 11.490508079528809, 12.086992263793945, 12.683476448059082, 13.279960632324219, 13.876444816589355, 14.472929000854492, 15.069414138793945, 15.665897369384766, 16.26238250732422, 16.858867645263672, 17.455350875854492]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 9.0, 12.0, 15.0, 10.0, 17.0, 17.0, 20.0, 12.0, 22.0, 23.0, 18.0, 29.0, 35.0, 25.0, 38.0, 35.0, 28.0, 49.0, 37.0, 49.0, 37.0, 44.0, 44.0, 36.0, 40.0, 39.0, 43.0, 30.0, 26.0, 18.0, 12.0, 19.0, 22.0, 23.0, 15.0, 11.0, 7.0, 4.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-8.931053161621094, -8.6801176071167, -8.429181098937988, -8.178245544433594, -7.927309989929199, -7.6763739585876465, -7.425437927246094, -7.174502372741699, -6.9235663414001465, -6.672630310058594, -6.421694755554199, -6.1707587242126465, -5.919822692871094, -5.668887138366699, -5.4179511070251465, -5.167015075683594, -4.916079521179199, -4.6651434898376465, -4.414207935333252, -4.163271903991699, -3.9123361110687256, -3.661400318145752, -3.410464286804199, -3.1595284938812256, -2.908592700958252, -2.6576569080352783, -2.4067211151123047, -2.155785083770752, -1.9048492908477783, -1.6539134979248047, -1.4029775857925415, -1.1520416736602783, -0.9011058807373047, -0.6501700282096863, -0.39923417568206787, -0.14829832315444946, 0.10263752937316895, 0.3535733222961426, 0.6045092344284058, 0.855445146560669, 1.1063809394836426, 1.3573167324066162, 1.6082526445388794, 1.8591885566711426, 2.110124349594116, 2.36106014251709, 2.6119961738586426, 2.862931966781616, 3.11386775970459, 3.3648035526275635, 3.615739345550537, 3.86667537689209, 4.117610931396484, 4.368546962738037, 4.61948299407959, 4.870418548583984, 5.121354579925537, 5.37229061126709, 5.623226165771484, 5.874162197113037, 6.12509822845459, 6.376033782958984, 6.626969814300537, 6.87790584564209, 7.128841400146484]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 5.0, 13.0, 4.0, 10.0, 20.0, 11.0, 22.0, 37.0, 53.0, 79.0, 142.0, 202.0, 308.0, 621.0, 1126.0, 2154.0, 4376.0, 9593.0, 23283.0, 67942.0, 217472.0, 418271.0, 200751.0, 62365.0, 22042.0, 8931.0, 4069.0, 2037.0, 1035.0, 610.0, 370.0, 218.0, 110.0, 74.0, 56.0, 43.0, 28.0, 17.0, 6.0, 10.0, 11.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.00390625, -0.9698333740234375, -0.935760498046875, -0.9016876220703125, -0.86761474609375, -0.8335418701171875, -0.799468994140625, -0.7653961181640625, -0.7313232421875, -0.6972503662109375, -0.663177490234375, -0.6291046142578125, -0.59503173828125, -0.5609588623046875, -0.526885986328125, -0.4928131103515625, -0.458740234375, -0.4246673583984375, -0.390594482421875, -0.3565216064453125, -0.32244873046875, -0.2883758544921875, -0.254302978515625, -0.2202301025390625, -0.1861572265625, -0.1520843505859375, -0.118011474609375, -0.0839385986328125, -0.04986572265625, -0.0157928466796875, 0.018280029296875, 0.0523529052734375, 0.08642578125, 0.1204986572265625, 0.154571533203125, 0.1886444091796875, 0.22271728515625, 0.2567901611328125, 0.290863037109375, 0.3249359130859375, 0.3590087890625, 0.3930816650390625, 0.427154541015625, 0.4612274169921875, 0.49530029296875, 0.5293731689453125, 0.563446044921875, 0.5975189208984375, 0.631591796875, 0.6656646728515625, 0.699737548828125, 0.7338104248046875, 0.76788330078125, 0.8019561767578125, 0.836029052734375, 0.8701019287109375, 0.9041748046875, 0.9382476806640625, 0.972320556640625, 1.0063934326171875, 1.04046630859375, 1.0745391845703125, 1.108612060546875, 1.1426849365234375, 1.1767578125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 5.0, 7.0, 5.0, 8.0, 8.0, 10.0, 7.0, 13.0, 20.0, 23.0, 31.0, 35.0, 30.0, 38.0, 46.0, 44.0, 37.0, 39.0, 48.0, 57.0, 43.0, 36.0, 54.0, 48.0, 35.0, 25.0, 40.0, 34.0, 31.0, 24.0, 14.0, 24.0, 11.0, 18.0, 12.0, 7.0, 12.0, 5.0, 3.0, 2.0, 7.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.232421875, -1.1884613037109375, -1.144500732421875, -1.1005401611328125, -1.05657958984375, -1.0126190185546875, -0.968658447265625, -0.9246978759765625, -0.8807373046875, -0.8367767333984375, -0.792816162109375, -0.7488555908203125, -0.70489501953125, -0.6609344482421875, -0.616973876953125, -0.5730133056640625, -0.529052734375, -0.4850921630859375, -0.441131591796875, -0.3971710205078125, -0.35321044921875, -0.3092498779296875, -0.265289306640625, -0.2213287353515625, -0.1773681640625, -0.1334075927734375, -0.089447021484375, -0.0454864501953125, -0.00152587890625, 0.0424346923828125, 0.086395263671875, 0.1303558349609375, 0.17431640625, 0.2182769775390625, 0.262237548828125, 0.3061981201171875, 0.35015869140625, 0.3941192626953125, 0.438079833984375, 0.4820404052734375, 0.5260009765625, 0.5699615478515625, 0.613922119140625, 0.6578826904296875, 0.70184326171875, 0.7458038330078125, 0.789764404296875, 0.8337249755859375, 0.877685546875, 0.9216461181640625, 0.965606689453125, 1.0095672607421875, 1.05352783203125, 1.0974884033203125, 1.141448974609375, 1.1854095458984375, 1.2293701171875, 1.2733306884765625, 1.317291259765625, 1.3612518310546875, 1.40521240234375, 1.4491729736328125, 1.493133544921875, 1.5370941162109375, 1.5810546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 8.0, 5.0, 12.0, 22.0, 37.0, 55.0, 86.0, 202.0, 362.0, 822.0, 2030.0, 6378.0, 26526.0, 185454.0, 702462.0, 99427.0, 17009.0, 4736.0, 1540.0, 704.0, 288.0, 178.0, 80.0, 48.0, 29.0, 20.0, 13.0, 5.0, 8.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7841796875, -1.72540283203125, -1.6666259765625, -1.60784912109375, -1.549072265625, -1.49029541015625, -1.4315185546875, -1.37274169921875, -1.31396484375, -1.25518798828125, -1.1964111328125, -1.13763427734375, -1.078857421875, -1.02008056640625, -0.9613037109375, -0.90252685546875, -0.84375, -0.78497314453125, -0.7261962890625, -0.66741943359375, -0.608642578125, -0.54986572265625, -0.4910888671875, -0.43231201171875, -0.37353515625, -0.31475830078125, -0.2559814453125, -0.19720458984375, -0.138427734375, -0.07965087890625, -0.0208740234375, 0.03790283203125, 0.0966796875, 0.15545654296875, 0.2142333984375, 0.27301025390625, 0.331787109375, 0.39056396484375, 0.4493408203125, 0.50811767578125, 0.56689453125, 0.62567138671875, 0.6844482421875, 0.74322509765625, 0.802001953125, 0.86077880859375, 0.9195556640625, 0.97833251953125, 1.037109375, 1.09588623046875, 1.1546630859375, 1.21343994140625, 1.272216796875, 1.33099365234375, 1.3897705078125, 1.44854736328125, 1.50732421875, 1.56610107421875, 1.6248779296875, 1.68365478515625, 1.742431640625, 1.80120849609375, 1.8599853515625, 1.91876220703125, 1.9775390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 5.0, 8.0, 11.0, 13.0, 11.0, 21.0, 23.0, 29.0, 31.0, 39.0, 50.0, 67.0, 61.0, 65.0, 67.0, 57.0, 79.0, 60.0, 62.0, 37.0, 45.0, 34.0, 33.0, 17.0, 15.0, 14.0, 11.0, 9.0, 3.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.234375, -3.11407470703125, -2.9937744140625, -2.87347412109375, -2.753173828125, -2.63287353515625, -2.5125732421875, -2.39227294921875, -2.27197265625, -2.15167236328125, -2.0313720703125, -1.91107177734375, -1.790771484375, -1.67047119140625, -1.5501708984375, -1.42987060546875, -1.3095703125, -1.18927001953125, -1.0689697265625, -0.94866943359375, -0.828369140625, -0.70806884765625, -0.5877685546875, -0.46746826171875, -0.34716796875, -0.22686767578125, -0.1065673828125, 0.01373291015625, 0.134033203125, 0.25433349609375, 0.3746337890625, 0.49493408203125, 0.615234375, 0.73553466796875, 0.8558349609375, 0.97613525390625, 1.096435546875, 1.21673583984375, 1.3370361328125, 1.45733642578125, 1.57763671875, 1.69793701171875, 1.8182373046875, 1.93853759765625, 2.058837890625, 2.17913818359375, 2.2994384765625, 2.41973876953125, 2.5400390625, 2.66033935546875, 2.7806396484375, 2.90093994140625, 3.021240234375, 3.14154052734375, 3.2618408203125, 3.38214111328125, 3.50244140625, 3.62274169921875, 3.7430419921875, 3.86334228515625, 3.983642578125, 4.10394287109375, 4.2242431640625, 4.34454345703125, 4.46484375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 8.0, 9.0, 21.0, 24.0, 48.0, 61.0, 78.0, 155.0, 267.0, 499.0, 1081.0, 2651.0, 16902.0, 740104.0, 273149.0, 9446.0, 2071.0, 844.0, 448.0, 262.0, 171.0, 86.0, 54.0, 42.0, 25.0, 14.0, 7.0, 3.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.1552734375, -1.1221542358398438, -1.0890350341796875, -1.0559158325195312, -1.022796630859375, -0.9896774291992188, -0.9565582275390625, -0.9234390258789062, -0.89031982421875, -0.8572006225585938, -0.8240814208984375, -0.7909622192382812, -0.757843017578125, -0.7247238159179688, -0.6916046142578125, -0.6584854125976562, -0.6253662109375, -0.5922470092773438, -0.5591278076171875, -0.5260086059570312, -0.492889404296875, -0.45977020263671875, -0.4266510009765625, -0.39353179931640625, -0.36041259765625, -0.32729339599609375, -0.2941741943359375, -0.26105499267578125, -0.227935791015625, -0.19481658935546875, -0.1616973876953125, -0.12857818603515625, -0.095458984375, -0.06233978271484375, -0.0292205810546875, 0.00389862060546875, 0.037017822265625, 0.07013702392578125, 0.1032562255859375, 0.13637542724609375, 0.16949462890625, 0.20261383056640625, 0.2357330322265625, 0.26885223388671875, 0.301971435546875, 0.33509063720703125, 0.3682098388671875, 0.40132904052734375, 0.4344482421875, 0.46756744384765625, 0.5006866455078125, 0.5338058471679688, 0.566925048828125, 0.6000442504882812, 0.6331634521484375, 0.6662826538085938, 0.69940185546875, 0.7325210571289062, 0.7656402587890625, 0.7987594604492188, 0.831878662109375, 0.8649978637695312, 0.8981170654296875, 0.9312362670898438, 0.96435546875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 8.0, 8.0, 17.0, 18.0, 27.0, 24.0, 58.0, 81.0, 96.0, 126.0, 137.0, 111.0, 90.0, 61.0, 47.0, 29.0, 29.0, 12.0, 7.0, 11.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014853477478027344, -0.00014444347470998764, -0.00014035217463970184, -0.00013626087456941605, -0.00013216957449913025, -0.00012807827442884445, -0.00012398697435855865, -0.00011989567428827286, -0.00011580437421798706, -0.00011171307414770126, -0.00010762177407741547, -0.00010353047400712967, -9.943917393684387e-05, -9.534787386655807e-05, -9.125657379627228e-05, -8.716527372598648e-05, -8.307397365570068e-05, -7.898267358541489e-05, -7.489137351512909e-05, -7.080007344484329e-05, -6.67087733745575e-05, -6.26174733042717e-05, -5.85261732339859e-05, -5.4434873163700104e-05, -5.034357309341431e-05, -4.625227302312851e-05, -4.216097295284271e-05, -3.8069672882556915e-05, -3.397837281227112e-05, -2.988707274198532e-05, -2.5795772671699524e-05, -2.1704472601413727e-05, -1.761317253112793e-05, -1.3521872460842133e-05, -9.430572390556335e-06, -5.339272320270538e-06, -1.2479722499847412e-06, 2.843327820301056e-06, 6.934627890586853e-06, 1.102592796087265e-05, 1.5117228031158447e-05, 1.9208528101444244e-05, 2.329982817173004e-05, 2.739112824201584e-05, 3.1482428312301636e-05, 3.557372838258743e-05, 3.966502845287323e-05, 4.375632852315903e-05, 4.7847628593444824e-05, 5.193892866373062e-05, 5.603022873401642e-05, 6.0121528804302216e-05, 6.421282887458801e-05, 6.830412894487381e-05, 7.239542901515961e-05, 7.64867290854454e-05, 8.05780291557312e-05, 8.4669329226017e-05, 8.87606292963028e-05, 9.285192936658859e-05, 9.694322943687439e-05, 0.00010103452950716019, 0.00010512582957744598, 0.00010921712964773178, 0.00011330842971801758]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 7.0, 10.0, 10.0, 17.0, 32.0, 34.0, 63.0, 113.0, 193.0, 424.0, 1202.0, 6359.0, 154534.0, 858617.0, 22914.0, 2552.0, 774.0, 286.0, 148.0, 85.0, 51.0, 37.0, 22.0, 10.0, 3.0, 9.0, 5.0, 6.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0], "bins": [-1.4892578125, -1.4503173828125, -1.411376953125, -1.3724365234375, -1.33349609375, -1.2945556640625, -1.255615234375, -1.2166748046875, -1.177734375, -1.1387939453125, -1.099853515625, -1.0609130859375, -1.02197265625, -0.9830322265625, -0.944091796875, -0.9051513671875, -0.8662109375, -0.8272705078125, -0.788330078125, -0.7493896484375, -0.71044921875, -0.6715087890625, -0.632568359375, -0.5936279296875, -0.5546875, -0.5157470703125, -0.476806640625, -0.4378662109375, -0.39892578125, -0.3599853515625, -0.321044921875, -0.2821044921875, -0.2431640625, -0.2042236328125, -0.165283203125, -0.1263427734375, -0.08740234375, -0.0484619140625, -0.009521484375, 0.0294189453125, 0.068359375, 0.1072998046875, 0.146240234375, 0.1851806640625, 0.22412109375, 0.2630615234375, 0.302001953125, 0.3409423828125, 0.3798828125, 0.4188232421875, 0.457763671875, 0.4967041015625, 0.53564453125, 0.5745849609375, 0.613525390625, 0.6524658203125, 0.69140625, 0.7303466796875, 0.769287109375, 0.8082275390625, 0.84716796875, 0.8861083984375, 0.925048828125, 0.9639892578125, 1.0029296875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 9.0, 10.0, 11.0, 10.0, 24.0, 33.0, 47.0, 70.0, 80.0, 103.0, 122.0, 121.0, 105.0, 66.0, 42.0, 44.0, 20.0, 27.0, 20.0, 11.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.9794921875, -0.9553985595703125, -0.931304931640625, -0.9072113037109375, -0.88311767578125, -0.8590240478515625, -0.834930419921875, -0.8108367919921875, -0.7867431640625, -0.7626495361328125, -0.738555908203125, -0.7144622802734375, -0.69036865234375, -0.6662750244140625, -0.642181396484375, -0.6180877685546875, -0.593994140625, -0.5699005126953125, -0.545806884765625, -0.5217132568359375, -0.49761962890625, -0.4735260009765625, -0.449432373046875, -0.4253387451171875, -0.4012451171875, -0.3771514892578125, -0.353057861328125, -0.3289642333984375, -0.30487060546875, -0.2807769775390625, -0.256683349609375, -0.2325897216796875, -0.20849609375, -0.1844024658203125, -0.160308837890625, -0.1362152099609375, -0.11212158203125, -0.0880279541015625, -0.063934326171875, -0.0398406982421875, -0.0157470703125, 0.0083465576171875, 0.032440185546875, 0.0565338134765625, 0.08062744140625, 0.1047210693359375, 0.128814697265625, 0.1529083251953125, 0.177001953125, 0.2010955810546875, 0.225189208984375, 0.2492828369140625, 0.27337646484375, 0.2974700927734375, 0.321563720703125, 0.3456573486328125, 0.3697509765625, 0.3938446044921875, 0.417938232421875, 0.4420318603515625, 0.46612548828125, 0.4902191162109375, 0.514312744140625, 0.5384063720703125, 0.5625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 6.0, 11.0, 20.0, 43.0, 111.0, 244.0, 316.0, 162.0, 54.0, 16.0, 6.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.28986358642578, -35.49031066894531, -34.69076156616211, -33.89120864868164, -33.09165573120117, -32.29210662841797, -31.4925537109375, -30.693002700805664, -29.893451690673828, -29.093900680541992, -28.294347763061523, -27.494796752929688, -26.69524574279785, -25.895694732666016, -25.096141815185547, -24.29659080505371, -23.497037887573242, -22.697486877441406, -21.897933959960938, -21.0983829498291, -20.298831939697266, -19.499279022216797, -18.69972801208496, -17.900177001953125, -17.100624084472656, -16.30107307434082, -15.501521110534668, -14.701969146728516, -13.90241813659668, -13.102866172790527, -12.303314208984375, -11.503763198852539, -10.70421314239502, -9.904661178588867, -9.105110168457031, -8.305558204650879, -7.506006717681885, -6.706455230712891, -5.906903266906738, -5.107351779937744, -4.30780029296875, -3.508248805999756, -2.7086970806121826, -1.9091453552246094, -1.1095938682556152, -0.3100423812866211, 0.48950958251953125, 1.2890610694885254, 2.0886125564575195, 2.8881640434265137, 3.687715768814087, 4.48726749420166, 5.286818981170654, 6.086370468139648, 6.885922431945801, 7.685473918914795, 8.485025405883789, 9.284577369689941, 10.084128379821777, 10.88368034362793, 11.683231353759766, 12.482783317565918, 13.28233528137207, 14.081886291503906, 14.881438255310059]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 7.0, 5.0, 6.0, 8.0, 13.0, 18.0, 26.0, 37.0, 43.0, 40.0, 31.0, 42.0, 37.0, 47.0, 68.0, 83.0, 74.0, 68.0, 60.0, 41.0, 30.0, 39.0, 36.0, 32.0, 18.0, 22.0, 17.0, 16.0, 10.0, 7.0, 10.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.752073287963867, -8.444417953491211, -8.136762619018555, -7.82910680770874, -7.521450996398926, -7.2137956619262695, -6.906140327453613, -6.598484516143799, -6.290828704833984, -5.983173370361328, -5.675517559051514, -5.367862224578857, -5.060206413269043, -4.752551078796387, -4.4448957443237305, -4.137239933013916, -3.8295845985412598, -3.5219290256500244, -3.214273452758789, -2.906618118286133, -2.5989623069763184, -2.291306972503662, -1.9836513996124268, -1.6759958267211914, -1.368340253829956, -1.0606846809387207, -0.7530291676521301, -0.44537365436553955, -0.1377180814743042, 0.16993749141693115, 0.47759294509887695, 0.7852485179901123, 1.0929040908813477, 1.400559663772583, 1.7082152366638184, 2.0158705711364746, 2.323526382446289, 2.6311817169189453, 2.9388372898101807, 3.246492862701416, 3.5541484355926514, 3.8618040084838867, 4.169459342956543, 4.477115154266357, 4.784770488739014, 5.092426300048828, 5.400081634521484, 5.707736968994141, 6.015392780303955, 6.323048114776611, 6.630703926086426, 6.938359260559082, 7.2460150718688965, 7.553670406341553, 7.861326217651367, 8.168981552124023, 8.47663688659668, 8.784292221069336, 9.091947555541992, 9.399603843688965, 9.707259178161621, 10.014914512634277, 10.322569847106934, 10.630226135253906, 10.937881469726562]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 5.0, 13.0, 10.0, 17.0, 20.0, 22.0, 31.0, 22.0, 28.0, 29.0, 39.0, 123.0, 213.0, 124.0, 49.0, 33.0, 36.0, 30.0, 20.0, 19.0, 11.0, 11.0, 13.0, 17.0, 15.0, 5.0, 7.0, 3.0, 4.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.302734375, -1.25531005859375, -1.2078857421875, -1.16046142578125, -1.113037109375, -1.06561279296875, -1.0181884765625, -0.97076416015625, -0.92333984375, -0.87591552734375, -0.8284912109375, -0.78106689453125, -0.733642578125, -0.68621826171875, -0.6387939453125, -0.59136962890625, -0.5439453125, -0.49652099609375, -0.4490966796875, -0.40167236328125, -0.354248046875, -0.30682373046875, -0.2593994140625, -0.21197509765625, -0.16455078125, -0.11712646484375, -0.0697021484375, -0.02227783203125, 0.025146484375, 0.07257080078125, 0.1199951171875, 0.16741943359375, 0.21484375, 0.26226806640625, 0.3096923828125, 0.35711669921875, 0.404541015625, 0.45196533203125, 0.4993896484375, 0.54681396484375, 0.59423828125, 0.64166259765625, 0.6890869140625, 0.73651123046875, 0.783935546875, 0.83135986328125, 0.8787841796875, 0.92620849609375, 0.9736328125, 1.02105712890625, 1.0684814453125, 1.11590576171875, 1.163330078125, 1.21075439453125, 1.2581787109375, 1.30560302734375, 1.35302734375, 1.40045166015625, 1.4478759765625, 1.49530029296875, 1.542724609375, 1.59014892578125, 1.6375732421875, 1.68499755859375, 1.732421875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 7.0, 5.0, 6.0, 23.0, 24.0, 44.0, 72.0, 74.0, 117.0, 197.0, 326.0, 658.0, 1108.0, 2417.0, 5673.0, 17454.0, 659029.0, 7669029.0, 20742.0, 6299.0, 2525.0, 1192.0, 622.0, 337.0, 203.0, 121.0, 68.0, 58.0, 40.0, 35.0, 14.0, 17.0, 7.0, 7.0, 13.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.4045233726501465, -4.27524471282959, -4.145966053009033, -4.016687393188477, -3.88740873336792, -3.7581300735473633, -3.6288516521453857, -3.499572992324829, -3.3702943325042725, -3.241015672683716, -3.111737012863159, -2.9824583530426025, -2.853179931640625, -2.7239012718200684, -2.5946226119995117, -2.465343952178955, -2.3360652923583984, -2.206786632537842, -2.077507972717285, -1.948229432106018, -1.8189507722854614, -1.6896721124649048, -1.5603935718536377, -1.431114912033081, -1.3018362522125244, -1.1725575923919678, -1.0432789325714111, -0.914000391960144, -0.7847217321395874, -0.6554430723190308, -0.5261644721031189, -0.39688587188720703, -0.2676074504852295, -0.13832882046699524, -0.009050190448760986, 0.12022843956947327, 0.24950706958770752, 0.37878572940826416, 0.508064329624176, 0.6373429298400879, 0.7666215896606445, 0.8959002494812012, 1.0251789093017578, 1.154457449913025, 1.2837361097335815, 1.4130147695541382, 1.5422933101654053, 1.671571969985962, 1.8008506298065186, 1.9301292896270752, 2.059407949447632, 2.1886866092681885, 2.317965030670166, 2.4472436904907227, 2.5765223503112793, 2.705801010131836, 2.8350796699523926, 2.964358329772949, 3.093636989593506, 3.2229156494140625, 3.352194309234619, 3.481472969055176, 3.6107513904571533, 3.74003005027771, 3.8693087100982666]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 4.0, 1.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 5.0, 6.0, 2.0, 4.0, 3.0, 4.0, 2.0, 9.0, 1.0, 4.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-7.563855171203613, -7.365002632141113, -7.1661505699157715, -6.9672980308532715, -6.7684454917907715, -6.56959342956543, -6.37074089050293, -6.17188835144043, -5.97303581237793, -5.77418327331543, -5.575331211090088, -5.376478672027588, -5.177626132965088, -4.978774070739746, -4.779921531677246, -4.581068992614746, -4.382216930389404, -4.183364391326904, -3.9845120906829834, -3.7856597900390625, -3.5868072509765625, -3.3879549503326416, -3.1891026496887207, -2.9902501106262207, -2.7913978099823, -2.592545509338379, -2.393692970275879, -2.194840669631958, -1.9959882497787476, -1.797135829925537, -1.5982835292816162, -1.3994311094284058, -1.200578212738037, -1.0017257928848267, -0.802873432636261, -0.6040210723876953, -0.40516865253448486, -0.20631623268127441, -0.007463932037353516, 0.19138848781585693, 0.3902409076690674, 0.5890933275222778, 0.7879456877708435, 0.9867980480194092, 1.1856504678726196, 1.38450288772583, 1.583355188369751, 1.7822076082229614, 1.9810600280761719, 2.1799123287200928, 2.3787648677825928, 2.5776171684265137, 2.7764697074890137, 2.9753220081329346, 3.1741743087768555, 3.3730268478393555, 3.5718791484832764, 3.7707314491271973, 3.9695839881896973, 4.168436050415039, 4.367288589477539, 4.566141128540039, 4.764993667602539, 4.963845729827881, 5.162698268890381]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 8.0, 5.0, 8.0, 10.0, 23.0, 18.0, 28.0, 29.0, 45.0, 43.0, 47.0, 57.0, 70.0, 57.0, 75.0, 53.0, 72.0, 58.0, 47.0, 50.0, 40.0, 29.0, 27.0, 26.0, 22.0, 13.0, 14.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3896484375, -1.3551483154296875, -1.320648193359375, -1.2861480712890625, -1.25164794921875, -1.2171478271484375, -1.182647705078125, -1.1481475830078125, -1.1136474609375, -1.0791473388671875, -1.044647216796875, -1.0101470947265625, -0.97564697265625, -0.9411468505859375, -0.906646728515625, -0.8721466064453125, -0.837646484375, -0.8031463623046875, -0.768646240234375, -0.7341461181640625, -0.69964599609375, -0.6651458740234375, -0.630645751953125, -0.5961456298828125, -0.5616455078125, -0.5271453857421875, -0.492645263671875, -0.4581451416015625, -0.42364501953125, -0.3891448974609375, -0.354644775390625, -0.3201446533203125, -0.28564453125, -0.2511444091796875, -0.216644287109375, -0.1821441650390625, -0.14764404296875, -0.1131439208984375, -0.078643798828125, -0.0441436767578125, -0.0096435546875, 0.0248565673828125, 0.059356689453125, 0.0938568115234375, 0.12835693359375, 0.1628570556640625, 0.197357177734375, 0.2318572998046875, 0.266357421875, 0.3008575439453125, 0.335357666015625, 0.3698577880859375, 0.40435791015625, 0.4388580322265625, 0.473358154296875, 0.5078582763671875, 0.5423583984375, 0.5768585205078125, 0.611358642578125, 0.6458587646484375, 0.68035888671875, 0.7148590087890625, 0.749359130859375, 0.7838592529296875, 0.818359375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 8.0, 8.0, 13.0, 18.0, 38.0, 50.0, 93.0, 144.0, 239.0, 388.0, 739.0, 1199.0, 2194.0, 4119.0, 8239.0, 17643.0, 44071.0, 145268.0, 192464.0, 62959.0, 22654.0, 10375.0, 5107.0, 2740.0, 1465.0, 788.0, 509.0, 271.0, 156.0, 108.0, 68.0, 37.0, 39.0, 22.0, 22.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.171875, -14.7276611328125, -14.283447265625, -13.8392333984375, -13.39501953125, -12.9508056640625, -12.506591796875, -12.0623779296875, -11.6181640625, -11.1739501953125, -10.729736328125, -10.2855224609375, -9.84130859375, -9.3970947265625, -8.952880859375, -8.5086669921875, -8.064453125, -7.6202392578125, -7.176025390625, -6.7318115234375, -6.28759765625, -5.8433837890625, -5.399169921875, -4.9549560546875, -4.5107421875, -4.0665283203125, -3.622314453125, -3.1781005859375, -2.73388671875, -2.2896728515625, -1.845458984375, -1.4012451171875, -0.95703125, -0.5128173828125, -0.068603515625, 0.3756103515625, 0.81982421875, 1.2640380859375, 1.708251953125, 2.1524658203125, 2.5966796875, 3.0408935546875, 3.485107421875, 3.9293212890625, 4.37353515625, 4.8177490234375, 5.261962890625, 5.7061767578125, 6.150390625, 6.5946044921875, 7.038818359375, 7.4830322265625, 7.92724609375, 8.3714599609375, 8.815673828125, 9.2598876953125, 9.7041015625, 10.1483154296875, 10.592529296875, 11.0367431640625, 11.48095703125, 11.9251708984375, 12.369384765625, 12.8135986328125, 13.2578125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 9.0, 5.0, 13.0, 13.0, 20.0, 25.0, 25.0, 27.0, 31.0, 50.0, 36.0, 43.0, 50.0, 52.0, 43.0, 48.0, 47.0, 62.0, 56.0, 58.0, 48.0, 37.0, 37.0, 25.0, 19.0, 19.0, 18.0, 19.0, 15.0, 9.0, 11.0, 5.0, 6.0, 2.0, 1.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.203125, -1.16070556640625, -1.1182861328125, -1.07586669921875, -1.033447265625, -0.99102783203125, -0.9486083984375, -0.90618896484375, -0.86376953125, -0.82135009765625, -0.7789306640625, -0.73651123046875, -0.694091796875, -0.65167236328125, -0.6092529296875, -0.56683349609375, -0.5244140625, -0.48199462890625, -0.4395751953125, -0.39715576171875, -0.354736328125, -0.31231689453125, -0.2698974609375, -0.22747802734375, -0.18505859375, -0.14263916015625, -0.1002197265625, -0.05780029296875, -0.015380859375, 0.02703857421875, 0.0694580078125, 0.11187744140625, 0.154296875, 0.19671630859375, 0.2391357421875, 0.28155517578125, 0.323974609375, 0.36639404296875, 0.4088134765625, 0.45123291015625, 0.49365234375, 0.53607177734375, 0.5784912109375, 0.62091064453125, 0.663330078125, 0.70574951171875, 0.7481689453125, 0.79058837890625, 0.8330078125, 0.87542724609375, 0.9178466796875, 0.96026611328125, 1.002685546875, 1.04510498046875, 1.0875244140625, 1.12994384765625, 1.17236328125, 1.21478271484375, 1.2572021484375, 1.29962158203125, 1.342041015625, 1.38446044921875, 1.4268798828125, 1.46929931640625, 1.51171875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 3.0, 12.0, 17.0, 19.0, 20.0, 29.0, 34.0, 41.0, 50.0, 40.0, 38.0, 33.0, 26.0, 17.0, 12.0, 13.0, 9.0, 10.0, 6.0, 9.0, 4.0, 5.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.3350343704223633, -3.226881742477417, -3.1187291145324707, -3.0105764865875244, -2.902423858642578, -2.794271230697632, -2.6861186027526855, -2.5779659748077393, -2.469813346862793, -2.3616607189178467, -2.2535080909729004, -2.145355463027954, -2.037202835083008, -1.9290502071380615, -1.8208975791931152, -1.712744951248169, -1.6045923233032227, -1.4964396953582764, -1.38828706741333, -1.2801344394683838, -1.1719818115234375, -1.0638291835784912, -0.9556765556335449, -0.8475239276885986, -0.7393712997436523, -0.631218671798706, -0.5230660438537598, -0.4149134159088135, -0.3067607879638672, -0.1986081600189209, -0.09045553207397461, 0.01769709587097168, 0.12584972381591797, 0.23400235176086426, 0.34215497970581055, 0.45030760765075684, 0.5584602355957031, 0.6666128635406494, 0.7747654914855957, 0.882918119430542, 0.9910707473754883, 1.0992233753204346, 1.2073760032653809, 1.3155286312103271, 1.4236812591552734, 1.5318338871002197, 1.639986515045166, 1.7481391429901123, 1.8562917709350586, 1.9644443988800049, 2.072597026824951, 2.1807496547698975, 2.2889022827148438, 2.39705491065979, 2.5052075386047363, 2.6133601665496826, 2.721512794494629, 2.829665422439575, 2.9378180503845215, 3.0459706783294678, 3.154123306274414, 3.2622759342193604, 3.3704285621643066, 3.478581190109253, 3.586733818054199]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 3.0, 6.0, 15.0, 6.0, 10.0, 10.0, 8.0, 15.0, 12.0, 15.0, 46.0, 105.0, 96.0, 41.0, 16.0, 11.0, 17.0, 6.0, 9.0, 8.0, 7.0, 7.0, 0.0, 3.0, 3.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.415047645568848, -6.2262067794799805, -6.037365913391113, -5.848525047302246, -5.659684181213379, -5.4708428382873535, -5.282001972198486, -5.093161106109619, -4.904320240020752, -4.715479373931885, -4.526638507843018, -4.33779764175415, -4.148956298828125, -3.960115671157837, -3.7712745666503906, -3.5824337005615234, -3.3935928344726562, -3.204751968383789, -3.015911102294922, -2.8270699977874756, -2.6382291316986084, -2.449388265609741, -2.260547161102295, -2.0717062950134277, -1.8828654289245605, -1.6940245628356934, -1.5051835775375366, -1.3163425922393799, -1.1275017261505127, -0.9386608004570007, -0.7498198747634888, -0.560978889465332, -0.37213802337646484, -0.18329709768295288, 0.005543828010559082, 0.19438475370407104, 0.383225679397583, 0.572066605091095, 0.7609075307846069, 0.9497485160827637, 1.1385893821716309, 1.327430248260498, 1.5162712335586548, 1.7051122188568115, 1.8939530849456787, 2.082793951034546, 2.271635055541992, 2.4604759216308594, 2.6493167877197266, 2.8381576538085938, 3.026998519897461, 3.2158396244049072, 3.4046804904937744, 3.5935213565826416, 3.782362461090088, 3.971203327178955, 4.160044193267822, 4.3488850593566895, 4.537725925445557, 4.726566791534424, 4.915408134460449, 5.104249000549316, 5.293089866638184, 5.481930732727051, 5.670771598815918]}, "eval/loss": 1.6609143018722534, "eval/bleu": 5.1478661845701255e-14, "eval/runtime": 2612.2734, "eval/samples_per_second": 5.65, "eval/steps_per_second": 0.706} \ No newline at end of file +{"train/loss": 0.908, "train/learning_rate": 3.0503265250974577e-06, "train/epoch": 2.93, "train/global_step": 9500, "_runtime": 94011, "_timestamp": 1651768100, "_step": 9518, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 13.0, 22.0, 81.0, 150.0, 184.0, 242.0, 156.0, 102.0, 44.0, 13.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-30.62371826171875, -30.05805778503418, -29.492395401000977, -28.926734924316406, -28.361074447631836, -27.795413970947266, -27.229751586914062, -26.664091110229492, -26.098430633544922, -25.53277015686035, -24.96710777282715, -24.401447296142578, -23.835786819458008, -23.270126342773438, -22.704463958740234, -22.138803482055664, -21.573143005371094, -21.007482528686523, -20.44182014465332, -19.87615966796875, -19.31049919128418, -18.74483871459961, -18.179176330566406, -17.613515853881836, -17.047853469848633, -16.482192993164062, -15.916531562805176, -15.350870132446289, -14.785209655761719, -14.219548225402832, -13.653886795043945, -13.088226318359375, -12.522565841674805, -11.956904411315918, -11.391243934631348, -10.825582504272461, -10.25992202758789, -9.694260597229004, -9.128599166870117, -8.562938690185547, -7.997278213500977, -7.431617259979248, -6.8659563064575195, -6.300294876098633, -5.7346343994140625, -5.168972969055176, -4.603312015533447, -4.037651062011719, -3.4719901084899902, -2.9063291549682617, -2.340668201446533, -1.7750070095062256, -1.209346055984497, -0.6436851024627686, -0.07802391052246094, 0.4876370429992676, 1.053297996520996, 1.6189589500427246, 2.184619903564453, 2.7502810955047607, 3.3159420490264893, 3.8816030025482178, 4.447264194488525, 5.012925148010254, 5.578586101531982]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 2.0, 5.0, 8.0, 11.0, 10.0, 13.0, 19.0, 13.0, 21.0, 28.0, 27.0, 26.0, 29.0, 32.0, 43.0, 50.0, 52.0, 44.0, 41.0, 37.0, 51.0, 51.0, 40.0, 36.0, 44.0, 34.0, 38.0, 17.0, 29.0, 20.0, 29.0, 11.0, 20.0, 13.0, 12.0, 10.0, 11.0, 5.0, 10.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.229267120361328, -6.004997730255127, -5.780728816986084, -5.556459426879883, -5.33219051361084, -5.107921123504639, -4.8836517333984375, -4.6593828201293945, -4.435113430023193, -4.210844039916992, -3.986575126647949, -3.762305736541748, -3.538036584854126, -3.313767433166504, -3.0894980430603027, -2.8652288913726807, -2.6409597396850586, -2.4166905879974365, -2.1924214363098145, -1.9681520462036133, -1.7438828945159912, -1.5196137428283691, -1.2953444719314575, -1.071075201034546, -0.8468060493469238, -0.622536838054657, -0.39826762676239014, -0.1739984154701233, 0.050270795822143555, 0.2745399475097656, 0.49880921840667725, 0.7230784893035889, 0.9473476409912109, 1.171616792678833, 1.3958860635757446, 1.6201553344726562, 1.8444244861602783, 2.0686936378479004, 2.2929630279541016, 2.5172321796417236, 2.7415013313293457, 2.9657704830169678, 3.19003963470459, 3.414309024810791, 3.638578176498413, 3.862847328186035, 4.087116718292236, 4.3113861083984375, 4.5356550216674805, 4.759924411773682, 4.984193325042725, 5.208462715148926, 5.432731628417969, 5.65700101852417, 5.881270408630371, 6.105539321899414, 6.329808712005615, 6.554078102111816, 6.778347015380859, 7.0026164054870605, 7.226885795593262, 7.451154708862305, 7.675424098968506, 7.899693489074707, 8.12396240234375]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 12.0, 17.0, 26.0, 30.0, 41.0, 76.0, 90.0, 122.0, 228.0, 310.0, 546.0, 819.0, 1287.0, 2034.0, 3442.0, 5938.0, 10669.0, 20185.0, 39049.0, 77009.0, 154675.0, 310051.0, 608790.0, 1069765.0, 911496.0, 488875.0, 246628.0, 120103.0, 58066.0, 28317.0, 14933.0, 8355.0, 4649.0, 2758.0, 1751.0, 1063.0, 704.0, 467.0, 293.0, 192.0, 146.0, 92.0, 60.0, 39.0, 22.0, 20.0, 13.0, 14.0, 5.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0], "bins": [-6.4296875, -6.23370361328125, -6.0377197265625, -5.84173583984375, -5.645751953125, -5.44976806640625, -5.2537841796875, -5.05780029296875, -4.86181640625, -4.66583251953125, -4.4698486328125, -4.27386474609375, -4.077880859375, -3.88189697265625, -3.6859130859375, -3.48992919921875, -3.2939453125, -3.09796142578125, -2.9019775390625, -2.70599365234375, -2.510009765625, -2.31402587890625, -2.1180419921875, -1.92205810546875, -1.72607421875, -1.53009033203125, -1.3341064453125, -1.13812255859375, -0.942138671875, -0.74615478515625, -0.5501708984375, -0.35418701171875, -0.158203125, 0.03778076171875, 0.2337646484375, 0.42974853515625, 0.625732421875, 0.82171630859375, 1.0177001953125, 1.21368408203125, 1.40966796875, 1.60565185546875, 1.8016357421875, 1.99761962890625, 2.193603515625, 2.38958740234375, 2.5855712890625, 2.78155517578125, 2.9775390625, 3.17352294921875, 3.3695068359375, 3.56549072265625, 3.761474609375, 3.95745849609375, 4.1534423828125, 4.34942626953125, 4.54541015625, 4.74139404296875, 4.9373779296875, 5.13336181640625, 5.329345703125, 5.52532958984375, 5.7213134765625, 5.91729736328125, 6.11328125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 7.0, 11.0, 17.0, 14.0, 14.0, 26.0, 21.0, 20.0, 26.0, 36.0, 30.0, 37.0, 44.0, 48.0, 49.0, 38.0, 60.0, 45.0, 50.0, 41.0, 48.0, 38.0, 33.0, 38.0, 37.0, 26.0, 33.0, 27.0, 14.0, 12.0, 11.0, 9.0, 10.0, 5.0, 5.0, 6.0, 4.0, 0.0, 4.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7734375, -10.416748046875, -10.06005859375, -9.703369140625, -9.3466796875, -8.989990234375, -8.63330078125, -8.276611328125, -7.919921875, -7.563232421875, -7.20654296875, -6.849853515625, -6.4931640625, -6.136474609375, -5.77978515625, -5.423095703125, -5.06640625, -4.709716796875, -4.35302734375, -3.996337890625, -3.6396484375, -3.282958984375, -2.92626953125, -2.569580078125, -2.212890625, -1.856201171875, -1.49951171875, -1.142822265625, -0.7861328125, -0.429443359375, -0.07275390625, 0.283935546875, 0.640625, 0.997314453125, 1.35400390625, 1.710693359375, 2.0673828125, 2.424072265625, 2.78076171875, 3.137451171875, 3.494140625, 3.850830078125, 4.20751953125, 4.564208984375, 4.9208984375, 5.277587890625, 5.63427734375, 5.990966796875, 6.34765625, 6.704345703125, 7.06103515625, 7.417724609375, 7.7744140625, 8.131103515625, 8.48779296875, 8.844482421875, 9.201171875, 9.557861328125, 9.91455078125, 10.271240234375, 10.6279296875, 10.984619140625, 11.34130859375, 11.697998046875, 12.0546875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 5.0, 17.0, 17.0, 13.0, 29.0, 38.0, 82.0, 105.0, 153.0, 257.0, 659.0, 10506.0, 4178921.0, 2338.0, 508.0, 212.0, 112.0, 79.0, 72.0, 34.0, 29.0, 23.0, 18.0, 10.0, 8.0, 7.0, 6.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.0, -134.703125, -130.40625, -126.109375, -121.8125, -117.515625, -113.21875, -108.921875, -104.625, -100.328125, -96.03125, -91.734375, -87.4375, -83.140625, -78.84375, -74.546875, -70.25, -65.953125, -61.65625, -57.359375, -53.0625, -48.765625, -44.46875, -40.171875, -35.875, -31.578125, -27.28125, -22.984375, -18.6875, -14.390625, -10.09375, -5.796875, -1.5, 2.796875, 7.09375, 11.390625, 15.6875, 19.984375, 24.28125, 28.578125, 32.875, 37.171875, 41.46875, 45.765625, 50.0625, 54.359375, 58.65625, 62.953125, 67.25, 71.546875, 75.84375, 80.140625, 84.4375, 88.734375, 93.03125, 97.328125, 101.625, 105.921875, 110.21875, 114.515625, 118.8125, 123.109375, 127.40625, 131.703125, 136.0]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 4.0, 3.0, 3.0, 9.0, 16.0, 17.0, 15.0, 23.0, 34.0, 60.0, 87.0, 118.0, 175.0, 278.0, 419.0, 713.0, 776.0, 462.0, 286.0, 166.0, 112.0, 82.0, 63.0, 39.0, 33.0, 24.0, 12.0, 10.0, 15.0, 10.0, 5.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.3828125, -5.23345947265625, -5.0841064453125, -4.93475341796875, -4.785400390625, -4.63604736328125, -4.4866943359375, -4.33734130859375, -4.18798828125, -4.03863525390625, -3.8892822265625, -3.73992919921875, -3.590576171875, -3.44122314453125, -3.2918701171875, -3.14251708984375, -2.9931640625, -2.84381103515625, -2.6944580078125, -2.54510498046875, -2.395751953125, -2.24639892578125, -2.0970458984375, -1.94769287109375, -1.79833984375, -1.64898681640625, -1.4996337890625, -1.35028076171875, -1.200927734375, -1.05157470703125, -0.9022216796875, -0.75286865234375, -0.603515625, -0.45416259765625, -0.3048095703125, -0.15545654296875, -0.006103515625, 0.14324951171875, 0.2926025390625, 0.44195556640625, 0.59130859375, 0.74066162109375, 0.8900146484375, 1.03936767578125, 1.188720703125, 1.33807373046875, 1.4874267578125, 1.63677978515625, 1.7861328125, 1.93548583984375, 2.0848388671875, 2.23419189453125, 2.383544921875, 2.53289794921875, 2.6822509765625, 2.83160400390625, 2.98095703125, 3.13031005859375, 3.2796630859375, 3.42901611328125, 3.578369140625, 3.72772216796875, 3.8770751953125, 4.02642822265625, 4.17578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 2.0, 9.0, 23.0, 14.0, 22.0, 31.0, 35.0, 38.0, 47.0, 52.0, 50.0, 38.0, 70.0, 56.0, 59.0, 60.0, 50.0, 42.0, 50.0, 43.0, 23.0, 39.0, 30.0, 23.0, 23.0, 10.0, 10.0, 9.0, 10.0, 8.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.198989868164062, -12.84326171875, -12.487532615661621, -12.131804466247559, -11.77607536315918, -11.420347213745117, -11.064619064331055, -10.708890914916992, -10.353161811828613, -9.99743366241455, -9.641704559326172, -9.28597640991211, -8.930248260498047, -8.574519157409668, -8.218791007995605, -7.863062381744385, -7.507333755493164, -7.151605129241943, -6.795876502990723, -6.44014835357666, -6.0844197273254395, -5.728691101074219, -5.372962951660156, -5.0172343254089355, -4.661505699157715, -4.305777072906494, -3.9500486850738525, -3.594320297241211, -3.2385916709899902, -2.8828630447387695, -2.527134656906128, -2.1714062690734863, -1.815678596496582, -1.4599500894546509, -1.1042215824127197, -0.7484930753707886, -0.3927645683288574, -0.03703606128692627, 0.3186924457550049, 0.6744208335876465, 1.0301494598388672, 1.3858779668807983, 1.7416064739227295, 2.097334861755371, 2.453063488006592, 2.8087921142578125, 3.164520502090454, 3.5202488899230957, 3.8759775161743164, 4.231706142425537, 4.587434768676758, 4.94316291809082, 5.298891544342041, 5.654620170593262, 6.010348320007324, 6.366076946258545, 6.721805572509766, 7.077534198760986, 7.433262825012207, 7.7889909744262695, 8.144720077514648, 8.500448226928711, 8.856176376342773, 9.211904525756836, 9.567633628845215]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 4.0, 8.0, 13.0, 11.0, 15.0, 14.0, 16.0, 20.0, 21.0, 34.0, 36.0, 30.0, 43.0, 38.0, 41.0, 47.0, 45.0, 49.0, 43.0, 52.0, 33.0, 42.0, 41.0, 51.0, 40.0, 37.0, 30.0, 22.0, 28.0, 20.0, 13.0, 11.0, 12.0, 7.0, 12.0, 11.0, 8.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-11.600353240966797, -11.251921653747559, -10.903491020202637, -10.555059432983398, -10.206628799438477, -9.858197212219238, -9.509765625, -9.161334991455078, -8.81290340423584, -8.464471817016602, -8.11604118347168, -7.767609596252441, -7.419178485870361, -7.070747375488281, -6.722316265106201, -6.373885154724121, -6.025454044342041, -5.677022933959961, -5.328591823577881, -4.980160713195801, -4.6317291259765625, -4.283298015594482, -3.9348669052124023, -3.586435556411743, -3.238004446029663, -2.889573335647583, -2.541141986846924, -2.1927108764648438, -1.8442796468734741, -1.4958484172821045, -1.1474173069000244, -0.7989859580993652, -0.45055484771728516, -0.10212364792823792, 0.24630755186080933, 0.5947387218475342, 0.9431699514389038, 1.2916011810302734, 1.6400322914123535, 1.9884636402130127, 2.3368947505950928, 2.685325860977173, 3.033757209777832, 3.382188320159912, 3.730619430541992, 4.0790510177612305, 4.427481651306152, 4.775913238525391, 5.124344348907471, 5.472775459289551, 5.821206569671631, 6.169637680053711, 6.518069267272949, 6.866500377655029, 7.214931488037109, 7.563363075256348, 7.9117937088012695, 8.260225296020508, 8.60865592956543, 8.957087516784668, 9.30551815032959, 9.653949737548828, 10.00238037109375, 10.350811958312988, 10.699243545532227]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 4.0, 12.0, 19.0, 26.0, 58.0, 60.0, 95.0, 137.0, 225.0, 320.0, 508.0, 710.0, 1149.0, 1730.0, 2759.0, 4249.0, 6709.0, 10602.0, 17128.0, 27559.0, 45057.0, 73945.0, 115451.0, 160245.0, 175343.0, 143473.0, 99357.0, 61945.0, 37495.0, 23056.0, 14292.0, 8964.0, 5635.0, 3571.0, 2305.0, 1518.0, 971.0, 645.0, 388.0, 276.0, 209.0, 133.0, 96.0, 43.0, 25.0, 18.0, 9.0, 12.0, 10.0, 6.0, 5.0, 0.0, 1.0, 3.0, 2.0], "bins": [-2.74609375, -2.663665771484375, -2.58123779296875, -2.498809814453125, -2.4163818359375, -2.333953857421875, -2.25152587890625, -2.169097900390625, -2.086669921875, -2.004241943359375, -1.92181396484375, -1.839385986328125, -1.7569580078125, -1.674530029296875, -1.59210205078125, -1.509674072265625, -1.42724609375, -1.344818115234375, -1.26239013671875, -1.179962158203125, -1.0975341796875, -1.015106201171875, -0.93267822265625, -0.850250244140625, -0.767822265625, -0.685394287109375, -0.60296630859375, -0.520538330078125, -0.4381103515625, -0.355682373046875, -0.27325439453125, -0.190826416015625, -0.1083984375, -0.025970458984375, 0.05645751953125, 0.138885498046875, 0.2213134765625, 0.303741455078125, 0.38616943359375, 0.468597412109375, 0.551025390625, 0.633453369140625, 0.71588134765625, 0.798309326171875, 0.8807373046875, 0.963165283203125, 1.04559326171875, 1.128021240234375, 1.21044921875, 1.292877197265625, 1.37530517578125, 1.457733154296875, 1.5401611328125, 1.622589111328125, 1.70501708984375, 1.787445068359375, 1.869873046875, 1.952301025390625, 2.03472900390625, 2.117156982421875, 2.1995849609375, 2.282012939453125, 2.36444091796875, 2.446868896484375, 2.529296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 9.0, 10.0, 8.0, 7.0, 8.0, 7.0, 20.0, 20.0, 25.0, 17.0, 41.0, 30.0, 33.0, 43.0, 35.0, 37.0, 44.0, 49.0, 45.0, 53.0, 39.0, 44.0, 42.0, 45.0, 28.0, 34.0, 30.0, 30.0, 27.0, 23.0, 18.0, 17.0, 15.0, 14.0, 10.0, 8.0, 5.0, 8.0, 7.0, 3.0, 4.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66796875, -7.4281005859375, -7.188232421875, -6.9483642578125, -6.70849609375, -6.4686279296875, -6.228759765625, -5.9888916015625, -5.7490234375, -5.5091552734375, -5.269287109375, -5.0294189453125, -4.78955078125, -4.5496826171875, -4.309814453125, -4.0699462890625, -3.830078125, -3.5902099609375, -3.350341796875, -3.1104736328125, -2.87060546875, -2.6307373046875, -2.390869140625, -2.1510009765625, -1.9111328125, -1.6712646484375, -1.431396484375, -1.1915283203125, -0.95166015625, -0.7117919921875, -0.471923828125, -0.2320556640625, 0.0078125, 0.2476806640625, 0.487548828125, 0.7274169921875, 0.96728515625, 1.2071533203125, 1.447021484375, 1.6868896484375, 1.9267578125, 2.1666259765625, 2.406494140625, 2.6463623046875, 2.88623046875, 3.1260986328125, 3.365966796875, 3.6058349609375, 3.845703125, 4.0855712890625, 4.325439453125, 4.5653076171875, 4.80517578125, 5.0450439453125, 5.284912109375, 5.5247802734375, 5.7646484375, 6.0045166015625, 6.244384765625, 6.4842529296875, 6.72412109375, 6.9639892578125, 7.203857421875, 7.4437255859375, 7.68359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 8.0, 8.0, 6.0, 14.0, 20.0, 25.0, 31.0, 44.0, 71.0, 74.0, 134.0, 212.0, 380.0, 652.0, 1352.0, 2888.0, 7689.0, 22490.0, 73174.0, 251760.0, 419760.0, 186638.0, 53352.0, 16922.0, 5950.0, 2387.0, 1083.0, 561.0, 303.0, 172.0, 109.0, 75.0, 62.0, 46.0, 28.0, 20.0, 16.0, 7.0, 11.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.359375, -5.18853759765625, -5.0177001953125, -4.84686279296875, -4.676025390625, -4.50518798828125, -4.3343505859375, -4.16351318359375, -3.99267578125, -3.82183837890625, -3.6510009765625, -3.48016357421875, -3.309326171875, -3.13848876953125, -2.9676513671875, -2.79681396484375, -2.6259765625, -2.45513916015625, -2.2843017578125, -2.11346435546875, -1.942626953125, -1.77178955078125, -1.6009521484375, -1.43011474609375, -1.25927734375, -1.08843994140625, -0.9176025390625, -0.74676513671875, -0.575927734375, -0.40509033203125, -0.2342529296875, -0.06341552734375, 0.107421875, 0.27825927734375, 0.4490966796875, 0.61993408203125, 0.790771484375, 0.96160888671875, 1.1324462890625, 1.30328369140625, 1.47412109375, 1.64495849609375, 1.8157958984375, 1.98663330078125, 2.157470703125, 2.32830810546875, 2.4991455078125, 2.66998291015625, 2.8408203125, 3.01165771484375, 3.1824951171875, 3.35333251953125, 3.524169921875, 3.69500732421875, 3.8658447265625, 4.03668212890625, 4.20751953125, 4.37835693359375, 4.5491943359375, 4.72003173828125, 4.890869140625, 5.06170654296875, 5.2325439453125, 5.40338134765625, 5.57421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 2.0, 5.0, 5.0, 6.0, 10.0, 9.0, 13.0, 15.0, 20.0, 20.0, 22.0, 29.0, 33.0, 33.0, 47.0, 46.0, 52.0, 51.0, 44.0, 54.0, 43.0, 46.0, 62.0, 46.0, 51.0, 25.0, 35.0, 37.0, 20.0, 23.0, 17.0, 19.0, 11.0, 16.0, 7.0, 10.0, 6.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.671875, -17.1103515625, -16.548828125, -15.9873046875, -15.42578125, -14.8642578125, -14.302734375, -13.7412109375, -13.1796875, -12.6181640625, -12.056640625, -11.4951171875, -10.93359375, -10.3720703125, -9.810546875, -9.2490234375, -8.6875, -8.1259765625, -7.564453125, -7.0029296875, -6.44140625, -5.8798828125, -5.318359375, -4.7568359375, -4.1953125, -3.6337890625, -3.072265625, -2.5107421875, -1.94921875, -1.3876953125, -0.826171875, -0.2646484375, 0.296875, 0.8583984375, 1.419921875, 1.9814453125, 2.54296875, 3.1044921875, 3.666015625, 4.2275390625, 4.7890625, 5.3505859375, 5.912109375, 6.4736328125, 7.03515625, 7.5966796875, 8.158203125, 8.7197265625, 9.28125, 9.8427734375, 10.404296875, 10.9658203125, 11.52734375, 12.0888671875, 12.650390625, 13.2119140625, 13.7734375, 14.3349609375, 14.896484375, 15.4580078125, 16.01953125, 16.5810546875, 17.142578125, 17.7041015625, 18.265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 9.0, 18.0, 30.0, 41.0, 54.0, 58.0, 95.0, 154.0, 246.0, 423.0, 676.0, 1163.0, 2464.0, 5336.0, 14670.0, 57175.0, 332256.0, 504095.0, 94617.0, 21142.0, 7214.0, 3028.0, 1476.0, 833.0, 462.0, 289.0, 171.0, 93.0, 70.0, 55.0, 42.0, 25.0, 15.0, 16.0, 9.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.6640625, -2.565948486328125, -2.46783447265625, -2.369720458984375, -2.2716064453125, -2.173492431640625, -2.07537841796875, -1.977264404296875, -1.879150390625, -1.781036376953125, -1.68292236328125, -1.584808349609375, -1.4866943359375, -1.388580322265625, -1.29046630859375, -1.192352294921875, -1.09423828125, -0.996124267578125, -0.89801025390625, -0.799896240234375, -0.7017822265625, -0.603668212890625, -0.50555419921875, -0.407440185546875, -0.309326171875, -0.211212158203125, -0.11309814453125, -0.014984130859375, 0.0831298828125, 0.181243896484375, 0.27935791015625, 0.377471923828125, 0.4755859375, 0.573699951171875, 0.67181396484375, 0.769927978515625, 0.8680419921875, 0.966156005859375, 1.06427001953125, 1.162384033203125, 1.260498046875, 1.358612060546875, 1.45672607421875, 1.554840087890625, 1.6529541015625, 1.751068115234375, 1.84918212890625, 1.947296142578125, 2.04541015625, 2.143524169921875, 2.24163818359375, 2.339752197265625, 2.4378662109375, 2.535980224609375, 2.63409423828125, 2.732208251953125, 2.830322265625, 2.928436279296875, 3.02655029296875, 3.124664306640625, 3.2227783203125, 3.320892333984375, 3.41900634765625, 3.517120361328125, 3.615234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 6.0, 7.0, 11.0, 7.0, 21.0, 23.0, 35.0, 33.0, 60.0, 81.0, 95.0, 121.0, 119.0, 86.0, 77.0, 54.0, 59.0, 23.0, 12.0, 21.0, 11.0, 14.0, 7.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001224517822265625, -0.0011822134256362915, -0.001139909029006958, -0.0010976046323776245, -0.001055300235748291, -0.0010129958391189575, -0.000970691442489624, -0.0009283870458602905, -0.000886082649230957, -0.0008437782526016235, -0.00080147385597229, -0.0007591694593429565, -0.000716865062713623, -0.0006745606660842896, -0.0006322562694549561, -0.0005899518728256226, -0.0005476474761962891, -0.0005053430795669556, -0.00046303868293762207, -0.0004207342863082886, -0.0003784298896789551, -0.0003361254930496216, -0.0002938210964202881, -0.0002515166997909546, -0.0002092123031616211, -0.0001669079065322876, -0.0001246035099029541, -8.22991132736206e-05, -3.999471664428711e-05, 2.3096799850463867e-06, 4.461407661437988e-05, 8.691847324371338e-05, 0.00012922286987304688, 0.00017152726650238037, 0.00021383166313171387, 0.00025613605976104736, 0.00029844045639038086, 0.00034074485301971436, 0.00038304924964904785, 0.00042535364627838135, 0.00046765804290771484, 0.0005099624395370483, 0.0005522668361663818, 0.0005945712327957153, 0.0006368756294250488, 0.0006791800260543823, 0.0007214844226837158, 0.0007637888193130493, 0.0008060932159423828, 0.0008483976125717163, 0.0008907020092010498, 0.0009330064058303833, 0.0009753108024597168, 0.0010176151990890503, 0.0010599195957183838, 0.0011022239923477173, 0.0011445283889770508, 0.0011868327856063843, 0.0012291371822357178, 0.0012714415788650513, 0.0013137459754943848, 0.0013560503721237183, 0.0013983547687530518, 0.0014406591653823853, 0.0014829635620117188]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 1.0, 5.0, 3.0, 7.0, 5.0, 10.0, 19.0, 23.0, 29.0, 30.0, 73.0, 140.0, 367.0, 1396.0, 7620.0, 117273.0, 865077.0, 49959.0, 4902.0, 985.0, 276.0, 135.0, 61.0, 43.0, 29.0, 16.0, 12.0, 13.0, 8.0, 8.0, 3.0, 3.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.80078125, -7.54400634765625, -7.2872314453125, -7.03045654296875, -6.773681640625, -6.51690673828125, -6.2601318359375, -6.00335693359375, -5.74658203125, -5.48980712890625, -5.2330322265625, -4.97625732421875, -4.719482421875, -4.46270751953125, -4.2059326171875, -3.94915771484375, -3.6923828125, -3.43560791015625, -3.1788330078125, -2.92205810546875, -2.665283203125, -2.40850830078125, -2.1517333984375, -1.89495849609375, -1.63818359375, -1.38140869140625, -1.1246337890625, -0.86785888671875, -0.611083984375, -0.35430908203125, -0.0975341796875, 0.15924072265625, 0.416015625, 0.67279052734375, 0.9295654296875, 1.18634033203125, 1.443115234375, 1.69989013671875, 1.9566650390625, 2.21343994140625, 2.47021484375, 2.72698974609375, 2.9837646484375, 3.24053955078125, 3.497314453125, 3.75408935546875, 4.0108642578125, 4.26763916015625, 4.5244140625, 4.78118896484375, 5.0379638671875, 5.29473876953125, 5.551513671875, 5.80828857421875, 6.0650634765625, 6.32183837890625, 6.57861328125, 6.83538818359375, 7.0921630859375, 7.34893798828125, 7.605712890625, 7.86248779296875, 8.1192626953125, 8.37603759765625, 8.6328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 0.0, 5.0, 18.0, 8.0, 16.0, 11.0, 21.0, 38.0, 42.0, 69.0, 65.0, 78.0, 90.0, 71.0, 83.0, 62.0, 70.0, 57.0, 42.0, 34.0, 42.0, 19.0, 9.0, 11.0, 7.0, 4.0, 1.0, 1.0, 1.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.92236328125, -0.8938751220703125, -0.865386962890625, -0.8368988037109375, -0.80841064453125, -0.7799224853515625, -0.751434326171875, -0.7229461669921875, -0.6944580078125, -0.6659698486328125, -0.637481689453125, -0.6089935302734375, -0.58050537109375, -0.5520172119140625, -0.523529052734375, -0.4950408935546875, -0.466552734375, -0.4380645751953125, -0.409576416015625, -0.3810882568359375, -0.35260009765625, -0.3241119384765625, -0.295623779296875, -0.2671356201171875, -0.2386474609375, -0.2101593017578125, -0.181671142578125, -0.1531829833984375, -0.12469482421875, -0.0962066650390625, -0.067718505859375, -0.0392303466796875, -0.0107421875, 0.0177459716796875, 0.046234130859375, 0.0747222900390625, 0.10321044921875, 0.1316986083984375, 0.160186767578125, 0.1886749267578125, 0.2171630859375, 0.2456512451171875, 0.274139404296875, 0.3026275634765625, 0.33111572265625, 0.3596038818359375, 0.388092041015625, 0.4165802001953125, 0.445068359375, 0.4735565185546875, 0.502044677734375, 0.5305328369140625, 0.55902099609375, 0.5875091552734375, 0.615997314453125, 0.6444854736328125, 0.6729736328125, 0.7014617919921875, 0.729949951171875, 0.7584381103515625, 0.78692626953125, 0.8154144287109375, 0.843902587890625, 0.8723907470703125, 0.90087890625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 15.0, 14.0, 32.0, 58.0, 77.0, 103.0, 127.0, 132.0, 118.0, 105.0, 87.0, 55.0, 33.0, 19.0, 9.0, 7.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.282350540161133, -18.724084854125977, -18.16581916809082, -17.607553482055664, -17.049287796020508, -16.49102210998535, -15.932756423950195, -15.374490737915039, -14.816225051879883, -14.257959365844727, -13.69969367980957, -13.141427993774414, -12.583162307739258, -12.024896621704102, -11.466630935668945, -10.908365249633789, -10.350098609924316, -9.79183292388916, -9.233567237854004, -8.675301551818848, -8.117035865783691, -7.558770179748535, -7.000504016876221, -6.4422383308410645, -5.883972644805908, -5.325706958770752, -4.767441272735596, -4.209175109863281, -3.650909662246704, -3.092643976211548, -2.5343780517578125, -1.9761123657226562, -1.4178466796875, -0.859580934047699, -0.30131518840789795, 0.25695061683654785, 0.8152163028717041, 1.3734819889068604, 1.9317479133605957, 2.490013599395752, 3.048279285430908, 3.6065449714660645, 4.164810657501221, 4.723076820373535, 5.281342506408691, 5.839608192443848, 6.397873878479004, 6.95613956451416, 7.514405250549316, 8.072670936584473, 8.630936622619629, 9.189202308654785, 9.747467994689941, 10.305733680725098, 10.86400032043457, 11.422266006469727, 11.980531692504883, 12.538797378540039, 13.097063064575195, 13.655328750610352, 14.213594436645508, 14.771860122680664, 15.33012580871582, 15.888391494750977, 16.446657180786133]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 8.0, 10.0, 8.0, 10.0, 13.0, 15.0, 19.0, 21.0, 19.0, 25.0, 36.0, 26.0, 45.0, 45.0, 44.0, 57.0, 34.0, 48.0, 40.0, 40.0, 47.0, 39.0, 51.0, 44.0, 44.0, 27.0, 38.0, 26.0, 21.0, 19.0, 16.0, 13.0, 15.0, 12.0, 7.0, 10.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.861129283905029, -7.603972911834717, -7.346816062927246, -7.089659690856934, -6.832503318786621, -6.575346946716309, -6.318190097808838, -6.061033725738525, -5.803876876831055, -5.546720504760742, -5.2895636558532715, -5.032407283782959, -4.7752509117126465, -4.518094062805176, -4.260937690734863, -4.003781318664551, -3.7466249465942383, -3.4894683361053467, -3.232311964035034, -2.9751553535461426, -2.71799898147583, -2.4608423709869385, -2.203685760498047, -1.9465292692184448, -1.6893727779388428, -1.4322162866592407, -1.1750597953796387, -0.9179031848907471, -0.660746693611145, -0.40359020233154297, -0.14643359184265137, 0.11072289943695068, 0.36787891387939453, 0.6250354051589966, 0.8821919560432434, 1.1393485069274902, 1.3965049982070923, 1.6536614894866943, 1.910818099975586, 2.1679744720458984, 2.42513108253479, 2.6822876930236816, 2.939444065093994, 3.1966006755828857, 3.4537572860717773, 3.71091365814209, 3.9680702686309814, 4.225226879119873, 4.4823832511901855, 4.739539623260498, 4.996696472167969, 5.253852844238281, 5.511009216308594, 5.768165588378906, 6.025322437286377, 6.2824788093566895, 6.53963565826416, 6.796792030334473, 7.053948879241943, 7.311105251312256, 7.568261623382568, 7.825418472290039, 8.082574844360352, 8.339731216430664, 8.596887588500977]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 8.0, 2.0, 11.0, 10.0, 21.0, 25.0, 49.0, 63.0, 103.0, 154.0, 214.0, 345.0, 593.0, 979.0, 1739.0, 3168.0, 6462.0, 13816.0, 31793.0, 74445.0, 167827.0, 290936.0, 243097.0, 118940.0, 50712.0, 22383.0, 9986.0, 4756.0, 2425.0, 1414.0, 769.0, 449.0, 270.0, 180.0, 145.0, 87.0, 66.0, 35.0, 27.0, 12.0, 16.0, 7.0, 9.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.81640625, -4.673828125, -4.53125, -4.388671875, -4.24609375, -4.103515625, -3.9609375, -3.818359375, -3.67578125, -3.533203125, -3.390625, -3.248046875, -3.10546875, -2.962890625, -2.8203125, -2.677734375, -2.53515625, -2.392578125, -2.25, -2.107421875, -1.96484375, -1.822265625, -1.6796875, -1.537109375, -1.39453125, -1.251953125, -1.109375, -0.966796875, -0.82421875, -0.681640625, -0.5390625, -0.396484375, -0.25390625, -0.111328125, 0.03125, 0.173828125, 0.31640625, 0.458984375, 0.6015625, 0.744140625, 0.88671875, 1.029296875, 1.171875, 1.314453125, 1.45703125, 1.599609375, 1.7421875, 1.884765625, 2.02734375, 2.169921875, 2.3125, 2.455078125, 2.59765625, 2.740234375, 2.8828125, 3.025390625, 3.16796875, 3.310546875, 3.453125, 3.595703125, 3.73828125, 3.880859375, 4.0234375, 4.166015625, 4.30859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 3.0, 5.0, 9.0, 6.0, 10.0, 12.0, 13.0, 11.0, 24.0, 15.0, 22.0, 23.0, 39.0, 36.0, 38.0, 32.0, 37.0, 41.0, 55.0, 48.0, 38.0, 41.0, 37.0, 43.0, 32.0, 39.0, 36.0, 45.0, 24.0, 27.0, 27.0, 19.0, 13.0, 13.0, 22.0, 14.0, 11.0, 11.0, 5.0, 4.0, 2.0, 4.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0], "bins": [-40.59375, -39.3583984375, -38.123046875, -36.8876953125, -35.65234375, -34.4169921875, -33.181640625, -31.9462890625, -30.7109375, -29.4755859375, -28.240234375, -27.0048828125, -25.76953125, -24.5341796875, -23.298828125, -22.0634765625, -20.828125, -19.5927734375, -18.357421875, -17.1220703125, -15.88671875, -14.6513671875, -13.416015625, -12.1806640625, -10.9453125, -9.7099609375, -8.474609375, -7.2392578125, -6.00390625, -4.7685546875, -3.533203125, -2.2978515625, -1.0625, 0.1728515625, 1.408203125, 2.6435546875, 3.87890625, 5.1142578125, 6.349609375, 7.5849609375, 8.8203125, 10.0556640625, 11.291015625, 12.5263671875, 13.76171875, 14.9970703125, 16.232421875, 17.4677734375, 18.703125, 19.9384765625, 21.173828125, 22.4091796875, 23.64453125, 24.8798828125, 26.115234375, 27.3505859375, 28.5859375, 29.8212890625, 31.056640625, 32.2919921875, 33.52734375, 34.7626953125, 35.998046875, 37.2333984375, 38.46875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 10.0, 5.0, 19.0, 18.0, 21.0, 31.0, 36.0, 44.0, 53.0, 51.0, 76.0, 103.0, 127.0, 181.0, 284.0, 592.0, 1568.0, 20507.0, 694046.0, 320358.0, 7900.0, 1048.0, 449.0, 283.0, 174.0, 131.0, 101.0, 71.0, 57.0, 45.0, 27.0, 23.0, 25.0, 27.0, 10.0, 14.0, 13.0, 8.0, 6.0, 3.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0], "bins": [-21.0, -20.43017578125, -19.8603515625, -19.29052734375, -18.720703125, -18.15087890625, -17.5810546875, -17.01123046875, -16.44140625, -15.87158203125, -15.3017578125, -14.73193359375, -14.162109375, -13.59228515625, -13.0224609375, -12.45263671875, -11.8828125, -11.31298828125, -10.7431640625, -10.17333984375, -9.603515625, -9.03369140625, -8.4638671875, -7.89404296875, -7.32421875, -6.75439453125, -6.1845703125, -5.61474609375, -5.044921875, -4.47509765625, -3.9052734375, -3.33544921875, -2.765625, -2.19580078125, -1.6259765625, -1.05615234375, -0.486328125, 0.08349609375, 0.6533203125, 1.22314453125, 1.79296875, 2.36279296875, 2.9326171875, 3.50244140625, 4.072265625, 4.64208984375, 5.2119140625, 5.78173828125, 6.3515625, 6.92138671875, 7.4912109375, 8.06103515625, 8.630859375, 9.20068359375, 9.7705078125, 10.34033203125, 10.91015625, 11.47998046875, 12.0498046875, 12.61962890625, 13.189453125, 13.75927734375, 14.3291015625, 14.89892578125, 15.46875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 6.0, 5.0, 16.0, 14.0, 13.0, 21.0, 19.0, 17.0, 28.0, 37.0, 33.0, 31.0, 38.0, 42.0, 52.0, 54.0, 54.0, 53.0, 42.0, 44.0, 47.0, 59.0, 40.0, 34.0, 33.0, 23.0, 36.0, 18.0, 20.0, 13.0, 11.0, 11.0, 9.0, 9.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.75, -48.37255859375, -46.9951171875, -45.61767578125, -44.240234375, -42.86279296875, -41.4853515625, -40.10791015625, -38.73046875, -37.35302734375, -35.9755859375, -34.59814453125, -33.220703125, -31.84326171875, -30.4658203125, -29.08837890625, -27.7109375, -26.33349609375, -24.9560546875, -23.57861328125, -22.201171875, -20.82373046875, -19.4462890625, -18.06884765625, -16.69140625, -15.31396484375, -13.9365234375, -12.55908203125, -11.181640625, -9.80419921875, -8.4267578125, -7.04931640625, -5.671875, -4.29443359375, -2.9169921875, -1.53955078125, -0.162109375, 1.21533203125, 2.5927734375, 3.97021484375, 5.34765625, 6.72509765625, 8.1025390625, 9.47998046875, 10.857421875, 12.23486328125, 13.6123046875, 14.98974609375, 16.3671875, 17.74462890625, 19.1220703125, 20.49951171875, 21.876953125, 23.25439453125, 24.6318359375, 26.00927734375, 27.38671875, 28.76416015625, 30.1416015625, 31.51904296875, 32.896484375, 34.27392578125, 35.6513671875, 37.02880859375, 38.40625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 8.0, 6.0, 11.0, 20.0, 37.0, 53.0, 141.0, 299.0, 733.0, 2619.0, 15310.0, 238372.0, 741515.0, 42386.0, 5009.0, 1214.0, 426.0, 181.0, 80.0, 45.0, 27.0, 14.0, 15.0, 14.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.392578125, -2.29376220703125, -2.1949462890625, -2.09613037109375, -1.997314453125, -1.89849853515625, -1.7996826171875, -1.70086669921875, -1.60205078125, -1.50323486328125, -1.4044189453125, -1.30560302734375, -1.206787109375, -1.10797119140625, -1.0091552734375, -0.91033935546875, -0.8115234375, -0.71270751953125, -0.6138916015625, -0.51507568359375, -0.416259765625, -0.31744384765625, -0.2186279296875, -0.11981201171875, -0.02099609375, 0.07781982421875, 0.1766357421875, 0.27545166015625, 0.374267578125, 0.47308349609375, 0.5718994140625, 0.67071533203125, 0.76953125, 0.86834716796875, 0.9671630859375, 1.06597900390625, 1.164794921875, 1.26361083984375, 1.3624267578125, 1.46124267578125, 1.56005859375, 1.65887451171875, 1.7576904296875, 1.85650634765625, 1.955322265625, 2.05413818359375, 2.1529541015625, 2.25177001953125, 2.3505859375, 2.44940185546875, 2.5482177734375, 2.64703369140625, 2.745849609375, 2.84466552734375, 2.9434814453125, 3.04229736328125, 3.14111328125, 3.23992919921875, 3.3387451171875, 3.43756103515625, 3.536376953125, 3.63519287109375, 3.7340087890625, 3.83282470703125, 3.931640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 7.0, 5.0, 10.0, 8.0, 15.0, 14.0, 15.0, 24.0, 24.0, 37.0, 39.0, 60.0, 90.0, 85.0, 90.0, 96.0, 80.0, 71.0, 48.0, 45.0, 27.0, 25.0, 19.0, 14.0, 11.0, 8.0, 5.0, 10.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021982192993164062, -0.00021214038133621216, -0.0002044588327407837, -0.00019677728414535522, -0.00018909573554992676, -0.0001814141869544983, -0.00017373263835906982, -0.00016605108976364136, -0.0001583695411682129, -0.00015068799257278442, -0.00014300644397735596, -0.0001353248953819275, -0.00012764334678649902, -0.00011996179819107056, -0.00011228024959564209, -0.00010459870100021362, -9.691715240478516e-05, -8.923560380935669e-05, -8.155405521392822e-05, -7.387250661849976e-05, -6.619095802307129e-05, -5.850940942764282e-05, -5.0827860832214355e-05, -4.314631223678589e-05, -3.546476364135742e-05, -2.7783215045928955e-05, -2.0101666450500488e-05, -1.2420117855072021e-05, -4.738569259643555e-06, 2.942979335784912e-06, 1.0624527931213379e-05, 1.8306076526641846e-05, 2.5987625122070312e-05, 3.366917371749878e-05, 4.1350722312927246e-05, 4.903227090835571e-05, 5.671381950378418e-05, 6.439536809921265e-05, 7.207691669464111e-05, 7.975846529006958e-05, 8.744001388549805e-05, 9.512156248092651e-05, 0.00010280311107635498, 0.00011048465967178345, 0.00011816620826721191, 0.00012584775686264038, 0.00013352930545806885, 0.00014121085405349731, 0.00014889240264892578, 0.00015657395124435425, 0.00016425549983978271, 0.00017193704843521118, 0.00017961859703063965, 0.00018730014562606812, 0.00019498169422149658, 0.00020266324281692505, 0.00021034479141235352, 0.00021802634000778198, 0.00022570788860321045, 0.00023338943719863892, 0.00024107098579406738, 0.00024875253438949585, 0.0002564340829849243, 0.0002641156315803528, 0.00027179718017578125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 20.0, 5.0, 12.0, 39.0, 72.0, 158.0, 359.0, 1463.0, 9394.0, 175905.0, 816026.0, 40217.0, 3676.0, 748.0, 251.0, 73.0, 53.0, 28.0, 20.0, 13.0, 4.0, 7.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.880859375, -2.762176513671875, -2.64349365234375, -2.524810791015625, -2.4061279296875, -2.287445068359375, -2.16876220703125, -2.050079345703125, -1.931396484375, -1.812713623046875, -1.69403076171875, -1.575347900390625, -1.4566650390625, -1.337982177734375, -1.21929931640625, -1.100616455078125, -0.98193359375, -0.863250732421875, -0.74456787109375, -0.625885009765625, -0.5072021484375, -0.388519287109375, -0.26983642578125, -0.151153564453125, -0.032470703125, 0.086212158203125, 0.20489501953125, 0.323577880859375, 0.4422607421875, 0.560943603515625, 0.67962646484375, 0.798309326171875, 0.9169921875, 1.035675048828125, 1.15435791015625, 1.273040771484375, 1.3917236328125, 1.510406494140625, 1.62908935546875, 1.747772216796875, 1.866455078125, 1.985137939453125, 2.10382080078125, 2.222503662109375, 2.3411865234375, 2.459869384765625, 2.57855224609375, 2.697235107421875, 2.81591796875, 2.934600830078125, 3.05328369140625, 3.171966552734375, 3.2906494140625, 3.409332275390625, 3.52801513671875, 3.646697998046875, 3.765380859375, 3.884063720703125, 4.00274658203125, 4.121429443359375, 4.2401123046875, 4.358795166015625, 4.47747802734375, 4.596160888671875, 4.71484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 4.0, 13.0, 9.0, 15.0, 24.0, 28.0, 35.0, 64.0, 67.0, 94.0, 122.0, 98.0, 95.0, 71.0, 80.0, 37.0, 28.0, 29.0, 16.0, 12.0, 11.0, 10.0, 10.0, 7.0, 6.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66162109375, -0.6354446411132812, -0.6092681884765625, -0.5830917358398438, -0.556915283203125, -0.5307388305664062, -0.5045623779296875, -0.47838592529296875, -0.45220947265625, -0.42603302001953125, -0.3998565673828125, -0.37368011474609375, -0.347503662109375, -0.32132720947265625, -0.2951507568359375, -0.26897430419921875, -0.2427978515625, -0.21662139892578125, -0.1904449462890625, -0.16426849365234375, -0.138092041015625, -0.11191558837890625, -0.0857391357421875, -0.05956268310546875, -0.03338623046875, -0.00720977783203125, 0.0189666748046875, 0.04514312744140625, 0.071319580078125, 0.09749603271484375, 0.1236724853515625, 0.14984893798828125, 0.176025390625, 0.20220184326171875, 0.2283782958984375, 0.25455474853515625, 0.280731201171875, 0.30690765380859375, 0.3330841064453125, 0.35926055908203125, 0.38543701171875, 0.41161346435546875, 0.4377899169921875, 0.46396636962890625, 0.490142822265625, 0.5163192749023438, 0.5424957275390625, 0.5686721801757812, 0.5948486328125, 0.6210250854492188, 0.6472015380859375, 0.6733779907226562, 0.699554443359375, 0.7257308959960938, 0.7519073486328125, 0.7780838012695312, 0.80426025390625, 0.8304367065429688, 0.8566131591796875, 0.8827896118164062, 0.908966064453125, 0.9351425170898438, 0.9613189697265625, 0.9874954223632812, 1.013671875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 61.0, 622.0, 307.0, 26.0, 2.0, 1.0], "bins": [-334.67333984375, -329.0771484375, -323.48095703125, -317.884765625, -312.2886047363281, -306.6924133300781, -301.0962219238281, -295.5000305175781, -289.9038391113281, -284.3076477050781, -278.7114562988281, -273.11529541015625, -267.51910400390625, -261.92291259765625, -256.32672119140625, -250.73052978515625, -245.1343536376953, -239.5381622314453, -233.94198608398438, -228.34579467773438, -222.74960327148438, -217.15341186523438, -211.55723571777344, -205.96104431152344, -200.3648681640625, -194.7686767578125, -189.17250061035156, -183.57630920410156, -177.98011779785156, -172.38394165039062, -166.78775024414062, -161.19155883789062, -155.5953826904297, -149.9991912841797, -144.40301513671875, -138.80682373046875, -133.21063232421875, -127.61444854736328, -122.01826477050781, -116.42207336425781, -110.82588195800781, -105.22969818115234, -99.63350677490234, -94.03732299804688, -88.44113159179688, -82.8449478149414, -77.24876403808594, -71.65257263183594, -66.05638885498047, -60.460201263427734, -54.864013671875, -49.26782989501953, -43.6716423034668, -38.07545471191406, -32.479270935058594, -26.88308334350586, -21.286897659301758, -15.69071102142334, -10.094524383544922, -4.49833869934082, 1.097848892211914, 6.694036483764648, 12.290220260620117, 17.88640785217285, 23.482595443725586]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 0.0, 2.0, 6.0, 6.0, 9.0, 14.0, 10.0, 17.0, 16.0, 16.0, 16.0, 20.0, 23.0, 37.0, 36.0, 30.0, 36.0, 31.0, 40.0, 50.0, 40.0, 29.0, 38.0, 43.0, 31.0, 38.0, 36.0, 36.0, 40.0, 24.0, 25.0, 22.0, 27.0, 18.0, 24.0, 12.0, 18.0, 13.0, 20.0, 11.0, 6.0, 5.0, 12.0, 7.0, 4.0, 3.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-56.334320068359375, -54.55524826049805, -52.77617645263672, -50.99710464477539, -49.21803283691406, -47.43896484375, -45.659889221191406, -43.880821228027344, -42.101749420166016, -40.32267761230469, -38.54360580444336, -36.76453399658203, -34.9854621887207, -33.206390380859375, -31.42732048034668, -29.648250579833984, -27.869176864624023, -26.090105056762695, -24.311033248901367, -22.531963348388672, -20.752891540527344, -18.973819732666016, -17.194747924804688, -15.415677070617676, -13.636605262756348, -11.85753345489502, -10.078462600708008, -8.29939079284668, -6.52031946182251, -4.74124813079834, -2.9621763229370117, -1.18310546875, 0.5959663391113281, 2.375037670135498, 4.154109001159668, 5.933180809020996, 7.712252140045166, 9.491323471069336, 11.270395278930664, 13.049466133117676, 14.828537940979004, 16.607608795166016, 18.386680603027344, 20.165752410888672, 21.94482421875, 23.723896026611328, 25.502967834472656, 27.28203773498535, 29.06110954284668, 30.840181350708008, 32.6192512512207, 34.39832305908203, 36.17739486694336, 37.95646667480469, 39.735538482666016, 41.514610290527344, 43.29368209838867, 45.07275390625, 46.85182571411133, 48.630897521972656, 50.409969329833984, 52.18904113769531, 53.968109130859375, 55.7471809387207, 57.52625274658203]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 5.0, 3.0, 3.0, 8.0, 8.0, 10.0, 11.0, 15.0, 18.0, 21.0, 32.0, 30.0, 34.0, 69.0, 91.0, 181.0, 385.0, 784.0, 1973.0, 5675.0, 18332.0, 85238.0, 589995.0, 2442823.0, 895133.0, 118425.0, 23609.0, 6968.0, 2546.0, 931.0, 406.0, 197.0, 98.0, 56.0, 32.0, 26.0, 21.0, 14.0, 14.0, 13.0, 9.0, 10.0, 12.0, 5.0, 5.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6875, -12.2589111328125, -11.830322265625, -11.4017333984375, -10.97314453125, -10.5445556640625, -10.115966796875, -9.6873779296875, -9.2587890625, -8.8302001953125, -8.401611328125, -7.9730224609375, -7.54443359375, -7.1158447265625, -6.687255859375, -6.2586669921875, -5.830078125, -5.4014892578125, -4.972900390625, -4.5443115234375, -4.11572265625, -3.6871337890625, -3.258544921875, -2.8299560546875, -2.4013671875, -1.9727783203125, -1.544189453125, -1.1156005859375, -0.68701171875, -0.2584228515625, 0.170166015625, 0.5987548828125, 1.02734375, 1.4559326171875, 1.884521484375, 2.3131103515625, 2.74169921875, 3.1702880859375, 3.598876953125, 4.0274658203125, 4.4560546875, 4.8846435546875, 5.313232421875, 5.7418212890625, 6.17041015625, 6.5989990234375, 7.027587890625, 7.4561767578125, 7.884765625, 8.3133544921875, 8.741943359375, 9.1705322265625, 9.59912109375, 10.0277099609375, 10.456298828125, 10.8848876953125, 11.3134765625, 11.7420654296875, 12.170654296875, 12.5992431640625, 13.02783203125, 13.4564208984375, 13.885009765625, 14.3135986328125, 14.7421875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 8.0, 5.0, 11.0, 10.0, 12.0, 19.0, 13.0, 18.0, 19.0, 18.0, 26.0, 26.0, 30.0, 48.0, 48.0, 48.0, 41.0, 42.0, 47.0, 44.0, 46.0, 29.0, 46.0, 49.0, 46.0, 40.0, 32.0, 24.0, 20.0, 26.0, 11.0, 12.0, 21.0, 13.0, 9.0, 11.0, 6.0, 3.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.45703125, -7.18463134765625, -6.9122314453125, -6.63983154296875, -6.367431640625, -6.09503173828125, -5.8226318359375, -5.55023193359375, -5.27783203125, -5.00543212890625, -4.7330322265625, -4.46063232421875, -4.188232421875, -3.91583251953125, -3.6434326171875, -3.37103271484375, -3.0986328125, -2.82623291015625, -2.5538330078125, -2.28143310546875, -2.009033203125, -1.73663330078125, -1.4642333984375, -1.19183349609375, -0.91943359375, -0.64703369140625, -0.3746337890625, -0.10223388671875, 0.170166015625, 0.44256591796875, 0.7149658203125, 0.98736572265625, 1.259765625, 1.53216552734375, 1.8045654296875, 2.07696533203125, 2.349365234375, 2.62176513671875, 2.8941650390625, 3.16656494140625, 3.43896484375, 3.71136474609375, 3.9837646484375, 4.25616455078125, 4.528564453125, 4.80096435546875, 5.0733642578125, 5.34576416015625, 5.6181640625, 5.89056396484375, 6.1629638671875, 6.43536376953125, 6.707763671875, 6.98016357421875, 7.2525634765625, 7.52496337890625, 7.79736328125, 8.06976318359375, 8.3421630859375, 8.61456298828125, 8.886962890625, 9.15936279296875, 9.4317626953125, 9.70416259765625, 9.9765625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 8.0, 12.0, 30.0, 72.0, 283.0, 4172484.0, 21111.0, 188.0, 48.0, 26.0, 6.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-399.75, -390.642578125, -381.53515625, -372.427734375, -363.3203125, -354.212890625, -345.10546875, -335.998046875, -326.890625, -317.783203125, -308.67578125, -299.568359375, -290.4609375, -281.353515625, -272.24609375, -263.138671875, -254.03125, -244.923828125, -235.81640625, -226.708984375, -217.6015625, -208.494140625, -199.38671875, -190.279296875, -181.171875, -172.064453125, -162.95703125, -153.849609375, -144.7421875, -135.634765625, -126.52734375, -117.419921875, -108.3125, -99.205078125, -90.09765625, -80.990234375, -71.8828125, -62.775390625, -53.66796875, -44.560546875, -35.453125, -26.345703125, -17.23828125, -8.130859375, 0.9765625, 10.083984375, 19.19140625, 28.298828125, 37.40625, 46.513671875, 55.62109375, 64.728515625, 73.8359375, 82.943359375, 92.05078125, 101.158203125, 110.265625, 119.373046875, 128.48046875, 137.587890625, 146.6953125, 155.802734375, 164.91015625, 174.017578125, 183.125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 10.0, 7.0, 14.0, 17.0, 38.0, 39.0, 55.0, 98.0, 120.0, 192.0, 280.0, 420.0, 639.0, 708.0, 468.0, 334.0, 211.0, 149.0, 78.0, 59.0, 33.0, 33.0, 17.0, 14.0, 13.0, 9.0, 3.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.72265625, -4.588226318359375, -4.45379638671875, -4.319366455078125, -4.1849365234375, -4.050506591796875, -3.91607666015625, -3.781646728515625, -3.647216796875, -3.512786865234375, -3.37835693359375, -3.243927001953125, -3.1094970703125, -2.975067138671875, -2.84063720703125, -2.706207275390625, -2.57177734375, -2.437347412109375, -2.30291748046875, -2.168487548828125, -2.0340576171875, -1.899627685546875, -1.76519775390625, -1.630767822265625, -1.496337890625, -1.361907958984375, -1.22747802734375, -1.093048095703125, -0.9586181640625, -0.824188232421875, -0.68975830078125, -0.555328369140625, -0.4208984375, -0.286468505859375, -0.15203857421875, -0.017608642578125, 0.1168212890625, 0.251251220703125, 0.38568115234375, 0.520111083984375, 0.654541015625, 0.788970947265625, 0.92340087890625, 1.057830810546875, 1.1922607421875, 1.326690673828125, 1.46112060546875, 1.595550537109375, 1.72998046875, 1.864410400390625, 1.99884033203125, 2.133270263671875, 2.2677001953125, 2.402130126953125, 2.53656005859375, 2.670989990234375, 2.805419921875, 2.939849853515625, 3.07427978515625, 3.208709716796875, 3.3431396484375, 3.477569580078125, 3.61199951171875, 3.746429443359375, 3.880859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 6.0, 12.0, 19.0, 25.0, 27.0, 30.0, 52.0, 45.0, 50.0, 79.0, 79.0, 70.0, 62.0, 65.0, 59.0, 60.0, 56.0, 46.0, 41.0, 26.0, 16.0, 17.0, 18.0, 8.0, 9.0, 3.0, 9.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.305008888244629, -9.923867225646973, -9.542725563049316, -9.161582946777344, -8.780441284179688, -8.399299621582031, -8.018157958984375, -7.637016296386719, -7.2558746337890625, -6.874732971191406, -6.493590831756592, -6.1124491691589355, -5.731307506561279, -5.350165367126465, -4.969023704528809, -4.587882041931152, -4.206739902496338, -3.8255980014801025, -3.4444563388824463, -3.063314437866211, -2.6821727752685547, -2.3010308742523193, -1.919888973236084, -1.5387473106384277, -1.1576054096221924, -0.7764636278152466, -0.395321786403656, -0.01417994499206543, 0.36696183681488037, 0.7481036186218262, 1.1292455196380615, 1.5103871822357178, 1.8915290832519531, 2.2726709842681885, 2.6538126468658447, 3.03495454788208, 3.4160962104797363, 3.7972381114959717, 4.178380012512207, 4.559521675109863, 4.9406633377075195, 5.321805000305176, 5.70294713973999, 6.0840888023376465, 6.465230464935303, 6.846372604370117, 7.227514266967773, 7.60865592956543, 7.989798069000244, 8.370940208435059, 8.752081871032715, 9.133223533630371, 9.514365196228027, 9.895506858825684, 10.276649475097656, 10.657791137695312, 11.038932800292969, 11.420074462890625, 11.801216125488281, 12.182357788085938, 12.56350040435791, 12.944642066955566, 13.325783729553223, 13.706925392150879, 14.088067054748535]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 6.0, 2.0, 7.0, 10.0, 7.0, 12.0, 16.0, 11.0, 21.0, 33.0, 25.0, 33.0, 28.0, 42.0, 47.0, 36.0, 46.0, 33.0, 49.0, 51.0, 55.0, 40.0, 34.0, 36.0, 37.0, 45.0, 22.0, 33.0, 30.0, 18.0, 29.0, 17.0, 16.0, 17.0, 7.0, 17.0, 10.0, 7.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.32935905456543, -9.036792755126953, -8.74422550201416, -8.451659202575684, -8.159092903137207, -7.866526126861572, -7.5739593505859375, -7.281393051147461, -6.988826274871826, -6.696259498596191, -6.403693199157715, -6.11112642288208, -5.818559646606445, -5.525993347167969, -5.233426570892334, -4.940859794616699, -4.648293495178223, -4.355726718902588, -4.063160419464111, -3.7705936431884766, -3.478027105331421, -3.1854605674743652, -2.8928937911987305, -2.600327253341675, -2.307760715484619, -2.0151941776275635, -1.7226275205612183, -1.430060863494873, -1.1374943256378174, -0.8449277877807617, -0.5523611307144165, -0.2597944736480713, 0.032772064208984375, 0.3253386616706848, 0.6179052591323853, 0.9104718565940857, 1.2030384540557861, 1.4956049919128418, 1.788171648979187, 2.0807383060455322, 2.373304843902588, 2.6658713817596436, 2.958437919616699, 3.251004695892334, 3.5435712337493896, 3.8361377716064453, 4.12870454788208, 4.421271324157715, 4.713837623596191, 5.006404399871826, 5.298970699310303, 5.5915374755859375, 5.884103775024414, 6.176670551300049, 6.469237327575684, 6.76180362701416, 7.054370403289795, 7.34693717956543, 7.639503479003906, 7.932070255279541, 8.224637031555176, 8.517203330993652, 8.809769630432129, 9.102336883544922, 9.394903182983398]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 9.0, 8.0, 13.0, 28.0, 46.0, 61.0, 106.0, 171.0, 245.0, 389.0, 654.0, 1102.0, 1798.0, 3166.0, 5740.0, 11810.0, 24824.0, 55501.0, 122546.0, 245700.0, 282392.0, 156735.0, 72029.0, 32061.0, 14759.0, 7324.0, 3906.0, 2130.0, 1254.0, 739.0, 481.0, 296.0, 196.0, 109.0, 76.0, 59.0, 28.0, 17.0, 15.0, 9.0, 10.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-4.07421875, -3.9549560546875, -3.835693359375, -3.7164306640625, -3.59716796875, -3.4779052734375, -3.358642578125, -3.2393798828125, -3.1201171875, -3.0008544921875, -2.881591796875, -2.7623291015625, -2.64306640625, -2.5238037109375, -2.404541015625, -2.2852783203125, -2.166015625, -2.0467529296875, -1.927490234375, -1.8082275390625, -1.68896484375, -1.5697021484375, -1.450439453125, -1.3311767578125, -1.2119140625, -1.0926513671875, -0.973388671875, -0.8541259765625, -0.73486328125, -0.6156005859375, -0.496337890625, -0.3770751953125, -0.2578125, -0.1385498046875, -0.019287109375, 0.0999755859375, 0.21923828125, 0.3385009765625, 0.457763671875, 0.5770263671875, 0.6962890625, 0.8155517578125, 0.934814453125, 1.0540771484375, 1.17333984375, 1.2926025390625, 1.411865234375, 1.5311279296875, 1.650390625, 1.7696533203125, 1.888916015625, 2.0081787109375, 2.12744140625, 2.2467041015625, 2.365966796875, 2.4852294921875, 2.6044921875, 2.7237548828125, 2.843017578125, 2.9622802734375, 3.08154296875, 3.2008056640625, 3.320068359375, 3.4393310546875, 3.55859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 2.0, 5.0, 8.0, 8.0, 11.0, 13.0, 17.0, 19.0, 26.0, 24.0, 32.0, 36.0, 38.0, 42.0, 42.0, 52.0, 41.0, 44.0, 40.0, 58.0, 57.0, 34.0, 40.0, 36.0, 33.0, 31.0, 41.0, 33.0, 23.0, 20.0, 13.0, 16.0, 15.0, 16.0, 4.0, 7.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.18359375, -6.9703369140625, -6.757080078125, -6.5438232421875, -6.33056640625, -6.1173095703125, -5.904052734375, -5.6907958984375, -5.4775390625, -5.2642822265625, -5.051025390625, -4.8377685546875, -4.62451171875, -4.4112548828125, -4.197998046875, -3.9847412109375, -3.771484375, -3.5582275390625, -3.344970703125, -3.1317138671875, -2.91845703125, -2.7052001953125, -2.491943359375, -2.2786865234375, -2.0654296875, -1.8521728515625, -1.638916015625, -1.4256591796875, -1.21240234375, -0.9991455078125, -0.785888671875, -0.5726318359375, -0.359375, -0.1461181640625, 0.067138671875, 0.2803955078125, 0.49365234375, 0.7069091796875, 0.920166015625, 1.1334228515625, 1.3466796875, 1.5599365234375, 1.773193359375, 1.9864501953125, 2.19970703125, 2.4129638671875, 2.626220703125, 2.8394775390625, 3.052734375, 3.2659912109375, 3.479248046875, 3.6925048828125, 3.90576171875, 4.1190185546875, 4.332275390625, 4.5455322265625, 4.7587890625, 4.9720458984375, 5.185302734375, 5.3985595703125, 5.61181640625, 5.8250732421875, 6.038330078125, 6.2515869140625, 6.46484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 5.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 8.0, 13.0, 8.0, 18.0, 25.0, 38.0, 39.0, 53.0, 74.0, 116.0, 129.0, 182.0, 307.0, 431.0, 736.0, 1243.0, 2295.0, 4324.0, 9121.0, 19814.0, 46795.0, 114000.0, 260727.0, 316576.0, 155884.0, 64177.0, 26816.0, 11930.0, 5579.0, 2846.0, 1578.0, 894.0, 539.0, 380.0, 241.0, 142.0, 97.0, 93.0, 64.0, 46.0, 45.0, 21.0, 28.0, 12.0, 10.0, 15.0, 3.0, 7.0, 9.0, 3.0, 4.0, 2.0, 1.0, 6.0], "bins": [-3.7109375, -3.599090576171875, -3.48724365234375, -3.375396728515625, -3.2635498046875, -3.151702880859375, -3.03985595703125, -2.928009033203125, -2.816162109375, -2.704315185546875, -2.59246826171875, -2.480621337890625, -2.3687744140625, -2.256927490234375, -2.14508056640625, -2.033233642578125, -1.92138671875, -1.809539794921875, -1.69769287109375, -1.585845947265625, -1.4739990234375, -1.362152099609375, -1.25030517578125, -1.138458251953125, -1.026611328125, -0.914764404296875, -0.80291748046875, -0.691070556640625, -0.5792236328125, -0.467376708984375, -0.35552978515625, -0.243682861328125, -0.1318359375, -0.019989013671875, 0.09185791015625, 0.203704833984375, 0.3155517578125, 0.427398681640625, 0.53924560546875, 0.651092529296875, 0.762939453125, 0.874786376953125, 0.98663330078125, 1.098480224609375, 1.2103271484375, 1.322174072265625, 1.43402099609375, 1.545867919921875, 1.65771484375, 1.769561767578125, 1.88140869140625, 1.993255615234375, 2.1051025390625, 2.216949462890625, 2.32879638671875, 2.440643310546875, 2.552490234375, 2.664337158203125, 2.77618408203125, 2.888031005859375, 2.9998779296875, 3.111724853515625, 3.22357177734375, 3.335418701171875, 3.447265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 8.0, 6.0, 5.0, 5.0, 9.0, 7.0, 10.0, 12.0, 18.0, 6.0, 26.0, 29.0, 14.0, 31.0, 31.0, 28.0, 51.0, 42.0, 41.0, 44.0, 50.0, 43.0, 49.0, 53.0, 33.0, 39.0, 35.0, 38.0, 43.0, 23.0, 18.0, 28.0, 12.0, 16.0, 24.0, 17.0, 9.0, 9.0, 7.0, 7.0, 5.0, 5.0, 2.0, 3.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.140625, -10.769775390625, -10.39892578125, -10.028076171875, -9.6572265625, -9.286376953125, -8.91552734375, -8.544677734375, -8.173828125, -7.802978515625, -7.43212890625, -7.061279296875, -6.6904296875, -6.319580078125, -5.94873046875, -5.577880859375, -5.20703125, -4.836181640625, -4.46533203125, -4.094482421875, -3.7236328125, -3.352783203125, -2.98193359375, -2.611083984375, -2.240234375, -1.869384765625, -1.49853515625, -1.127685546875, -0.7568359375, -0.385986328125, -0.01513671875, 0.355712890625, 0.7265625, 1.097412109375, 1.46826171875, 1.839111328125, 2.2099609375, 2.580810546875, 2.95166015625, 3.322509765625, 3.693359375, 4.064208984375, 4.43505859375, 4.805908203125, 5.1767578125, 5.547607421875, 5.91845703125, 6.289306640625, 6.66015625, 7.031005859375, 7.40185546875, 7.772705078125, 8.1435546875, 8.514404296875, 8.88525390625, 9.256103515625, 9.626953125, 9.997802734375, 10.36865234375, 10.739501953125, 11.1103515625, 11.481201171875, 11.85205078125, 12.222900390625, 12.59375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 8.0, 8.0, 20.0, 14.0, 38.0, 48.0, 67.0, 117.0, 204.0, 317.0, 603.0, 1248.0, 2849.0, 7287.0, 22206.0, 84827.0, 384538.0, 412889.0, 93961.0, 23783.0, 7637.0, 3031.0, 1305.0, 679.0, 347.0, 181.0, 119.0, 75.0, 40.0, 35.0, 22.0, 20.0, 9.0, 7.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.318359375, -2.2521820068359375, -2.186004638671875, -2.1198272705078125, -2.05364990234375, -1.9874725341796875, -1.921295166015625, -1.8551177978515625, -1.7889404296875, -1.7227630615234375, -1.656585693359375, -1.5904083251953125, -1.52423095703125, -1.4580535888671875, -1.391876220703125, -1.3256988525390625, -1.259521484375, -1.1933441162109375, -1.127166748046875, -1.0609893798828125, -0.99481201171875, -0.9286346435546875, -0.862457275390625, -0.7962799072265625, -0.7301025390625, -0.6639251708984375, -0.597747802734375, -0.5315704345703125, -0.46539306640625, -0.3992156982421875, -0.333038330078125, -0.2668609619140625, -0.20068359375, -0.1345062255859375, -0.068328857421875, -0.0021514892578125, 0.06402587890625, 0.1302032470703125, 0.196380615234375, 0.2625579833984375, 0.3287353515625, 0.3949127197265625, 0.461090087890625, 0.5272674560546875, 0.59344482421875, 0.6596221923828125, 0.725799560546875, 0.7919769287109375, 0.858154296875, 0.9243316650390625, 0.990509033203125, 1.0566864013671875, 1.12286376953125, 1.1890411376953125, 1.255218505859375, 1.3213958740234375, 1.3875732421875, 1.4537506103515625, 1.519927978515625, 1.5861053466796875, 1.65228271484375, 1.7184600830078125, 1.784637451171875, 1.8508148193359375, 1.9169921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 11.0, 8.0, 10.0, 8.0, 11.0, 12.0, 26.0, 28.0, 32.0, 66.0, 53.0, 71.0, 84.0, 93.0, 100.0, 65.0, 75.0, 61.0, 46.0, 39.0, 19.0, 14.0, 14.0, 9.0, 8.0, 6.0, 9.0, 4.0, 4.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007658004760742188, -0.0007382184267044067, -0.0007106363773345947, -0.0006830543279647827, -0.0006554722785949707, -0.0006278902292251587, -0.0006003081798553467, -0.0005727261304855347, -0.0005451440811157227, -0.0005175620317459106, -0.0004899799823760986, -0.0004623979330062866, -0.0004348158836364746, -0.0004072338342666626, -0.0003796517848968506, -0.0003520697355270386, -0.00032448768615722656, -0.00029690563678741455, -0.00026932358741760254, -0.00024174153804779053, -0.00021415948867797852, -0.0001865774393081665, -0.0001589953899383545, -0.00013141334056854248, -0.00010383129119873047, -7.624924182891846e-05, -4.8667192459106445e-05, -2.1085143089294434e-05, 6.496906280517578e-06, 3.407895565032959e-05, 6.16610050201416e-05, 8.924305438995361e-05, 0.00011682510375976562, 0.00014440715312957764, 0.00017198920249938965, 0.00019957125186920166, 0.00022715330123901367, 0.0002547353506088257, 0.0002823173999786377, 0.0003098994493484497, 0.0003374814987182617, 0.00036506354808807373, 0.00039264559745788574, 0.00042022764682769775, 0.00044780969619750977, 0.0004753917455673218, 0.0005029737949371338, 0.0005305558443069458, 0.0005581378936767578, 0.0005857199430465698, 0.0006133019924163818, 0.0006408840417861938, 0.0006684660911560059, 0.0006960481405258179, 0.0007236301898956299, 0.0007512122392654419, 0.0007787942886352539, 0.0008063763380050659, 0.0008339583873748779, 0.0008615404367446899, 0.000889122486114502, 0.000916704535484314, 0.000944286584854126, 0.000971868634223938, 0.00099945068359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 7.0, 5.0, 5.0, 6.0, 12.0, 12.0, 6.0, 14.0, 22.0, 32.0, 50.0, 99.0, 376.0, 2827.0, 133202.0, 897065.0, 13581.0, 789.0, 182.0, 79.0, 45.0, 29.0, 20.0, 13.0, 18.0, 15.0, 7.0, 6.0, 9.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.4375, -8.1837158203125, -7.929931640625, -7.6761474609375, -7.42236328125, -7.1685791015625, -6.914794921875, -6.6610107421875, -6.4072265625, -6.1534423828125, -5.899658203125, -5.6458740234375, -5.39208984375, -5.1383056640625, -4.884521484375, -4.6307373046875, -4.376953125, -4.1231689453125, -3.869384765625, -3.6156005859375, -3.36181640625, -3.1080322265625, -2.854248046875, -2.6004638671875, -2.3466796875, -2.0928955078125, -1.839111328125, -1.5853271484375, -1.33154296875, -1.0777587890625, -0.823974609375, -0.5701904296875, -0.31640625, -0.0626220703125, 0.191162109375, 0.4449462890625, 0.69873046875, 0.9525146484375, 1.206298828125, 1.4600830078125, 1.7138671875, 1.9676513671875, 2.221435546875, 2.4752197265625, 2.72900390625, 2.9827880859375, 3.236572265625, 3.4903564453125, 3.744140625, 3.9979248046875, 4.251708984375, 4.5054931640625, 4.75927734375, 5.0130615234375, 5.266845703125, 5.5206298828125, 5.7744140625, 6.0281982421875, 6.281982421875, 6.5357666015625, 6.78955078125, 7.0433349609375, 7.297119140625, 7.5509033203125, 7.8046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 6.0, 5.0, 7.0, 8.0, 11.0, 14.0, 20.0, 22.0, 43.0, 44.0, 56.0, 74.0, 93.0, 82.0, 97.0, 83.0, 74.0, 68.0, 51.0, 28.0, 24.0, 22.0, 16.0, 14.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.72705078125, -0.7067184448242188, -0.6863861083984375, -0.6660537719726562, -0.645721435546875, -0.6253890991210938, -0.6050567626953125, -0.5847244262695312, -0.56439208984375, -0.5440597534179688, -0.5237274169921875, -0.5033950805664062, -0.483062744140625, -0.46273040771484375, -0.4423980712890625, -0.42206573486328125, -0.4017333984375, -0.38140106201171875, -0.3610687255859375, -0.34073638916015625, -0.320404052734375, -0.30007171630859375, -0.2797393798828125, -0.25940704345703125, -0.23907470703125, -0.21874237060546875, -0.1984100341796875, -0.17807769775390625, -0.157745361328125, -0.13741302490234375, -0.1170806884765625, -0.09674835205078125, -0.076416015625, -0.05608367919921875, -0.0357513427734375, -0.01541900634765625, 0.004913330078125, 0.02524566650390625, 0.0455780029296875, 0.06591033935546875, 0.08624267578125, 0.10657501220703125, 0.1269073486328125, 0.14723968505859375, 0.167572021484375, 0.18790435791015625, 0.2082366943359375, 0.22856903076171875, 0.2489013671875, 0.26923370361328125, 0.2895660400390625, 0.30989837646484375, 0.330230712890625, 0.35056304931640625, 0.3708953857421875, 0.39122772216796875, 0.41156005859375, 0.43189239501953125, 0.4522247314453125, 0.47255706787109375, 0.492889404296875, 0.5132217407226562, 0.5335540771484375, 0.5538864135742188, 0.57421875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 6.0, 16.0, 21.0, 39.0, 56.0, 77.0, 114.0, 124.0, 144.0, 110.0, 94.0, 72.0, 54.0, 25.0, 23.0, 9.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.561568260192871, -8.159334182739258, -7.757099628448486, -7.354865550994873, -6.952630996704102, -6.550396919250488, -6.148162841796875, -5.745928764343262, -5.34369421005249, -4.941460132598877, -4.5392255783081055, -4.136991500854492, -3.7347571849823, -3.3325228691101074, -2.930288791656494, -2.5280544757843018, -2.1258201599121094, -1.723585844039917, -1.3213516473770142, -0.9191174507141113, -0.516883134841919, -0.11464881896972656, 0.2875852584838867, 0.6898195743560791, 1.0920538902282715, 1.4942882061004639, 1.8965224027633667, 2.2987565994262695, 2.700990915298462, 3.1032252311706543, 3.5054593086242676, 3.90769362449646, 4.309926986694336, 4.712161064147949, 5.114395618438721, 5.516629695892334, 5.9188642501831055, 6.321098327636719, 6.723332405090332, 7.125566482543945, 7.527801036834717, 7.93003511428833, 8.332269668579102, 8.734503746032715, 9.136737823486328, 9.538972854614258, 9.941205978393555, 10.343441009521484, 10.745675086975098, 11.147909164428711, 11.550143241882324, 11.952377319335938, 12.354612350463867, 12.75684642791748, 13.159080505371094, 13.561314582824707, 13.96354866027832, 14.365782737731934, 14.768016815185547, 15.170251846313477, 15.57248592376709, 15.974720001220703, 16.376953125, 16.77918815612793, 17.18142318725586]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 5.0, 7.0, 6.0, 9.0, 10.0, 9.0, 23.0, 17.0, 23.0, 26.0, 25.0, 37.0, 28.0, 32.0, 37.0, 44.0, 43.0, 45.0, 56.0, 46.0, 44.0, 42.0, 41.0, 36.0, 45.0, 30.0, 23.0, 33.0, 16.0, 25.0, 28.0, 19.0, 18.0, 13.0, 10.0, 15.0, 13.0, 7.0, 6.0, 5.0, 2.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.409859657287598, -6.216553211212158, -6.023246765136719, -5.829940319061279, -5.63663387298584, -5.4433274269104, -5.250020980834961, -5.056714057922363, -4.863408088684082, -4.670101642608643, -4.476795196533203, -4.283488750457764, -4.090182304382324, -3.8968758583068848, -3.703569173812866, -3.5102627277374268, -3.316956043243408, -3.1236495971679688, -2.9303431510925293, -2.73703670501709, -2.5437302589416504, -2.350423812866211, -2.1571171283721924, -1.963810682296753, -1.7705042362213135, -1.577197790145874, -1.3838913440704346, -1.1905847787857056, -0.9972783327102661, -0.8039718866348267, -0.6106653213500977, -0.4173588752746582, -0.22405195236206055, -0.030745476484298706, 0.16256099939346313, 0.35586750507354736, 0.5491739511489868, 0.7424803972244263, 0.9357869625091553, 1.1290934085845947, 1.3223998546600342, 1.5157063007354736, 1.709012746810913, 1.902319312095642, 2.095625877380371, 2.2889323234558105, 2.48223876953125, 2.6755452156066895, 2.868851661682129, 3.0621581077575684, 3.255464553833008, 3.4487709999084473, 3.6420774459838867, 3.835383892059326, 4.028690338134766, 4.221997261047363, 4.4153032302856445, 4.608609676361084, 4.801916122436523, 4.995222568511963, 5.188529014587402, 5.381835460662842, 5.575141906738281, 5.768448829650879, 5.961755275726318]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 10.0, 8.0, 11.0, 26.0, 36.0, 40.0, 71.0, 85.0, 153.0, 241.0, 337.0, 530.0, 800.0, 1352.0, 2257.0, 3738.0, 6298.0, 11085.0, 20127.0, 38608.0, 79584.0, 179303.0, 306662.0, 207702.0, 92877.0, 44014.0, 22649.0, 12352.0, 6946.0, 4198.0, 2401.0, 1508.0, 915.0, 525.0, 366.0, 238.0, 154.0, 103.0, 72.0, 48.0, 26.0, 31.0, 16.0, 15.0, 11.0, 10.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.869140625, -3.75396728515625, -3.6387939453125, -3.52362060546875, -3.408447265625, -3.29327392578125, -3.1781005859375, -3.06292724609375, -2.94775390625, -2.83258056640625, -2.7174072265625, -2.60223388671875, -2.487060546875, -2.37188720703125, -2.2567138671875, -2.14154052734375, -2.0263671875, -1.91119384765625, -1.7960205078125, -1.68084716796875, -1.565673828125, -1.45050048828125, -1.3353271484375, -1.22015380859375, -1.10498046875, -0.98980712890625, -0.8746337890625, -0.75946044921875, -0.644287109375, -0.52911376953125, -0.4139404296875, -0.29876708984375, -0.18359375, -0.06842041015625, 0.0467529296875, 0.16192626953125, 0.277099609375, 0.39227294921875, 0.5074462890625, 0.62261962890625, 0.73779296875, 0.85296630859375, 0.9681396484375, 1.08331298828125, 1.198486328125, 1.31365966796875, 1.4288330078125, 1.54400634765625, 1.6591796875, 1.77435302734375, 1.8895263671875, 2.00469970703125, 2.119873046875, 2.23504638671875, 2.3502197265625, 2.46539306640625, 2.58056640625, 2.69573974609375, 2.8109130859375, 2.92608642578125, 3.041259765625, 3.15643310546875, 3.2716064453125, 3.38677978515625, 3.501953125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 3.0, 4.0, 9.0, 8.0, 15.0, 14.0, 14.0, 21.0, 20.0, 31.0, 28.0, 36.0, 33.0, 42.0, 51.0, 38.0, 45.0, 39.0, 43.0, 53.0, 37.0, 44.0, 34.0, 40.0, 32.0, 27.0, 37.0, 19.0, 29.0, 25.0, 20.0, 16.0, 15.0, 9.0, 12.0, 11.0, 13.0, 12.0, 6.0, 2.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.359375, -16.853271484375, -16.34716796875, -15.841064453125, -15.3349609375, -14.828857421875, -14.32275390625, -13.816650390625, -13.310546875, -12.804443359375, -12.29833984375, -11.792236328125, -11.2861328125, -10.780029296875, -10.27392578125, -9.767822265625, -9.26171875, -8.755615234375, -8.24951171875, -7.743408203125, -7.2373046875, -6.731201171875, -6.22509765625, -5.718994140625, -5.212890625, -4.706787109375, -4.20068359375, -3.694580078125, -3.1884765625, -2.682373046875, -2.17626953125, -1.670166015625, -1.1640625, -0.657958984375, -0.15185546875, 0.354248046875, 0.8603515625, 1.366455078125, 1.87255859375, 2.378662109375, 2.884765625, 3.390869140625, 3.89697265625, 4.403076171875, 4.9091796875, 5.415283203125, 5.92138671875, 6.427490234375, 6.93359375, 7.439697265625, 7.94580078125, 8.451904296875, 8.9580078125, 9.464111328125, 9.97021484375, 10.476318359375, 10.982421875, 11.488525390625, 11.99462890625, 12.500732421875, 13.0068359375, 13.512939453125, 14.01904296875, 14.525146484375, 15.03125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 7.0, 5.0, 8.0, 7.0, 12.0, 15.0, 17.0, 26.0, 29.0, 30.0, 39.0, 55.0, 58.0, 73.0, 113.0, 486.0, 715179.0, 331386.0, 436.0, 129.0, 81.0, 62.0, 62.0, 38.0, 27.0, 34.0, 32.0, 21.0, 10.0, 12.0, 12.0, 10.0, 10.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-66.5, -64.48291015625, -62.4658203125, -60.44873046875, -58.431640625, -56.41455078125, -54.3974609375, -52.38037109375, -50.36328125, -48.34619140625, -46.3291015625, -44.31201171875, -42.294921875, -40.27783203125, -38.2607421875, -36.24365234375, -34.2265625, -32.20947265625, -30.1923828125, -28.17529296875, -26.158203125, -24.14111328125, -22.1240234375, -20.10693359375, -18.08984375, -16.07275390625, -14.0556640625, -12.03857421875, -10.021484375, -8.00439453125, -5.9873046875, -3.97021484375, -1.953125, 0.06396484375, 2.0810546875, 4.09814453125, 6.115234375, 8.13232421875, 10.1494140625, 12.16650390625, 14.18359375, 16.20068359375, 18.2177734375, 20.23486328125, 22.251953125, 24.26904296875, 26.2861328125, 28.30322265625, 30.3203125, 32.33740234375, 34.3544921875, 36.37158203125, 38.388671875, 40.40576171875, 42.4228515625, 44.43994140625, 46.45703125, 48.47412109375, 50.4912109375, 52.50830078125, 54.525390625, 56.54248046875, 58.5595703125, 60.57666015625, 62.59375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 4.0, 7.0, 13.0, 8.0, 17.0, 23.0, 23.0, 32.0, 26.0, 33.0, 49.0, 40.0, 60.0, 47.0, 42.0, 60.0, 64.0, 51.0, 45.0, 40.0, 51.0, 43.0, 28.0, 25.0, 36.0, 25.0, 19.0, 15.0, 11.0, 10.0, 13.0, 5.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.203125, -22.51416015625, -21.8251953125, -21.13623046875, -20.447265625, -19.75830078125, -19.0693359375, -18.38037109375, -17.69140625, -17.00244140625, -16.3134765625, -15.62451171875, -14.935546875, -14.24658203125, -13.5576171875, -12.86865234375, -12.1796875, -11.49072265625, -10.8017578125, -10.11279296875, -9.423828125, -8.73486328125, -8.0458984375, -7.35693359375, -6.66796875, -5.97900390625, -5.2900390625, -4.60107421875, -3.912109375, -3.22314453125, -2.5341796875, -1.84521484375, -1.15625, -0.46728515625, 0.2216796875, 0.91064453125, 1.599609375, 2.28857421875, 2.9775390625, 3.66650390625, 4.35546875, 5.04443359375, 5.7333984375, 6.42236328125, 7.111328125, 7.80029296875, 8.4892578125, 9.17822265625, 9.8671875, 10.55615234375, 11.2451171875, 11.93408203125, 12.623046875, 13.31201171875, 14.0009765625, 14.68994140625, 15.37890625, 16.06787109375, 16.7568359375, 17.44580078125, 18.134765625, 18.82373046875, 19.5126953125, 20.20166015625, 20.890625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 10.0, 11.0, 14.0, 40.0, 86.0, 177.0, 509.0, 2281.0, 20370.0, 928310.0, 90281.0, 5169.0, 844.0, 248.0, 72.0, 44.0, 22.0, 12.0, 13.0, 12.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3046875, -5.0355224609375, -4.766357421875, -4.4971923828125, -4.22802734375, -3.9588623046875, -3.689697265625, -3.4205322265625, -3.1513671875, -2.8822021484375, -2.613037109375, -2.3438720703125, -2.07470703125, -1.8055419921875, -1.536376953125, -1.2672119140625, -0.998046875, -0.7288818359375, -0.459716796875, -0.1905517578125, 0.07861328125, 0.3477783203125, 0.616943359375, 0.8861083984375, 1.1552734375, 1.4244384765625, 1.693603515625, 1.9627685546875, 2.23193359375, 2.5010986328125, 2.770263671875, 3.0394287109375, 3.30859375, 3.5777587890625, 3.846923828125, 4.1160888671875, 4.38525390625, 4.6544189453125, 4.923583984375, 5.1927490234375, 5.4619140625, 5.7310791015625, 6.000244140625, 6.2694091796875, 6.53857421875, 6.8077392578125, 7.076904296875, 7.3460693359375, 7.615234375, 7.8843994140625, 8.153564453125, 8.4227294921875, 8.69189453125, 8.9610595703125, 9.230224609375, 9.4993896484375, 9.7685546875, 10.0377197265625, 10.306884765625, 10.5760498046875, 10.84521484375, 11.1143798828125, 11.383544921875, 11.6527099609375, 11.921875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 8.0, 11.0, 7.0, 12.0, 23.0, 26.0, 28.0, 40.0, 75.0, 112.0, 185.0, 146.0, 99.0, 72.0, 39.0, 43.0, 21.0, 18.0, 13.0, 7.0, 2.0, 0.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006022453308105469, -0.0005833804607391357, -0.0005645155906677246, -0.0005456507205963135, -0.0005267858505249023, -0.0005079209804534912, -0.0004890561103820801, -0.00047019124031066895, -0.0004513263702392578, -0.0004324615001678467, -0.00041359663009643555, -0.0003947317600250244, -0.0003758668899536133, -0.00035700201988220215, -0.000338137149810791, -0.0003192722797393799, -0.00030040740966796875, -0.0002815425395965576, -0.0002626776695251465, -0.00024381279945373535, -0.00022494792938232422, -0.00020608305931091309, -0.00018721818923950195, -0.00016835331916809082, -0.0001494884490966797, -0.00013062357902526855, -0.00011175870895385742, -9.289383888244629e-05, -7.402896881103516e-05, -5.5164098739624023e-05, -3.629922866821289e-05, -1.7434358596801758e-05, 1.430511474609375e-06, 2.0295381546020508e-05, 3.916025161743164e-05, 5.8025121688842773e-05, 7.68899917602539e-05, 9.575486183166504e-05, 0.00011461973190307617, 0.0001334846019744873, 0.00015234947204589844, 0.00017121434211730957, 0.0001900792121887207, 0.00020894408226013184, 0.00022780895233154297, 0.0002466738224029541, 0.00026553869247436523, 0.00028440356254577637, 0.0003032684326171875, 0.00032213330268859863, 0.00034099817276000977, 0.0003598630428314209, 0.00037872791290283203, 0.00039759278297424316, 0.0004164576530456543, 0.00043532252311706543, 0.00045418739318847656, 0.0004730522632598877, 0.0004919171333312988, 0.00051078200340271, 0.0005296468734741211, 0.0005485117435455322, 0.0005673766136169434, 0.0005862414836883545, 0.0006051063537597656]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 12.0, 10.0, 11.0, 23.0, 39.0, 69.0, 222.0, 838.0, 3990.0, 27626.0, 686302.0, 308397.0, 17324.0, 2697.0, 635.0, 175.0, 78.0, 33.0, 15.0, 10.0, 9.0, 2.0, 3.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.65234375, -5.47509765625, -5.2978515625, -5.12060546875, -4.943359375, -4.76611328125, -4.5888671875, -4.41162109375, -4.234375, -4.05712890625, -3.8798828125, -3.70263671875, -3.525390625, -3.34814453125, -3.1708984375, -2.99365234375, -2.81640625, -2.63916015625, -2.4619140625, -2.28466796875, -2.107421875, -1.93017578125, -1.7529296875, -1.57568359375, -1.3984375, -1.22119140625, -1.0439453125, -0.86669921875, -0.689453125, -0.51220703125, -0.3349609375, -0.15771484375, 0.01953125, 0.19677734375, 0.3740234375, 0.55126953125, 0.728515625, 0.90576171875, 1.0830078125, 1.26025390625, 1.4375, 1.61474609375, 1.7919921875, 1.96923828125, 2.146484375, 2.32373046875, 2.5009765625, 2.67822265625, 2.85546875, 3.03271484375, 3.2099609375, 3.38720703125, 3.564453125, 3.74169921875, 3.9189453125, 4.09619140625, 4.2734375, 4.45068359375, 4.6279296875, 4.80517578125, 4.982421875, 5.15966796875, 5.3369140625, 5.51416015625, 5.69140625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 11.0, 7.0, 9.0, 1.0, 15.0, 7.0, 11.0, 18.0, 17.0, 27.0, 38.0, 44.0, 49.0, 63.0, 90.0, 112.0, 86.0, 79.0, 58.0, 50.0, 42.0, 24.0, 28.0, 18.0, 20.0, 19.0, 14.0, 11.0, 6.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69677734375, -0.670745849609375, -0.64471435546875, -0.618682861328125, -0.5926513671875, -0.566619873046875, -0.54058837890625, -0.514556884765625, -0.488525390625, -0.462493896484375, -0.43646240234375, -0.410430908203125, -0.3843994140625, -0.358367919921875, -0.33233642578125, -0.306304931640625, -0.2802734375, -0.254241943359375, -0.22821044921875, -0.202178955078125, -0.1761474609375, -0.150115966796875, -0.12408447265625, -0.098052978515625, -0.072021484375, -0.045989990234375, -0.01995849609375, 0.006072998046875, 0.0321044921875, 0.058135986328125, 0.08416748046875, 0.110198974609375, 0.13623046875, 0.162261962890625, 0.18829345703125, 0.214324951171875, 0.2403564453125, 0.266387939453125, 0.29241943359375, 0.318450927734375, 0.344482421875, 0.370513916015625, 0.39654541015625, 0.422576904296875, 0.4486083984375, 0.474639892578125, 0.50067138671875, 0.526702880859375, 0.552734375, 0.578765869140625, 0.60479736328125, 0.630828857421875, 0.6568603515625, 0.682891845703125, 0.70892333984375, 0.734954833984375, 0.760986328125, 0.787017822265625, 0.81304931640625, 0.839080810546875, 0.8651123046875, 0.891143798828125, 0.91717529296875, 0.943206787109375, 0.96923828125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 13.0, 121.0, 593.0, 272.0, 18.0, 2.0, 2.0], "bins": [-250.4321746826172, -246.23536682128906, -242.03855895996094, -237.8417510986328, -233.6449432373047, -229.44813537597656, -225.25132751464844, -221.05453491210938, -216.85772705078125, -212.66091918945312, -208.464111328125, -204.26730346679688, -200.07049560546875, -195.87368774414062, -191.6768798828125, -187.48007202148438, -183.28326416015625, -179.08645629882812, -174.8896484375, -170.69284057617188, -166.49603271484375, -162.29922485351562, -158.1024169921875, -153.90560913085938, -149.70880126953125, -145.51199340820312, -141.315185546875, -137.11837768554688, -132.92156982421875, -128.72476196289062, -124.52796173095703, -120.3311538696289, -116.13436126708984, -111.93755340576172, -107.7407455444336, -103.54393768310547, -99.34713745117188, -95.15032958984375, -90.95352172851562, -86.7567138671875, -82.55990600585938, -78.36309814453125, -74.16629028320312, -69.969482421875, -65.77267456054688, -61.575870513916016, -57.379066467285156, -53.18225860595703, -48.985450744628906, -44.78864288330078, -40.591835021972656, -36.3950309753418, -32.19822311401367, -28.001415252685547, -23.804609298706055, -19.607803344726562, -15.41099739074707, -11.214190483093262, -7.017383575439453, -2.8205766677856445, 1.376230239868164, 5.573038101196289, 9.769844055175781, 13.966650009155273, 18.1634578704834]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 6.0, 5.0, 6.0, 9.0, 11.0, 7.0, 7.0, 12.0, 8.0, 16.0, 14.0, 27.0, 20.0, 16.0, 24.0, 29.0, 31.0, 35.0, 43.0, 33.0, 28.0, 45.0, 42.0, 41.0, 35.0, 31.0, 31.0, 38.0, 34.0, 28.0, 32.0, 25.0, 27.0, 22.0, 24.0, 10.0, 28.0, 26.0, 12.0, 10.0, 14.0, 15.0, 7.0, 11.0, 4.0, 7.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-21.16127586364746, -20.47144317626953, -19.7816104888916, -19.091777801513672, -18.401945114135742, -17.712112426757812, -17.022281646728516, -16.332447052001953, -15.64261531829834, -14.95278263092041, -14.26294994354248, -13.573118209838867, -12.883285522460938, -12.193452835083008, -11.503620147705078, -10.813787460327148, -10.123954772949219, -9.434122085571289, -8.74428939819336, -8.05445671081543, -7.364624500274658, -6.6747918128967285, -5.984959602355957, -5.295126914978027, -4.605294227600098, -3.915461540222168, -3.2256290912628174, -2.535796642303467, -1.845963954925537, -1.1561312675476074, -0.46629905700683594, 0.22353363037109375, 0.9133682250976562, 1.6032007932662964, 2.2930333614349365, 2.982865810394287, 3.672698497772217, 4.3625311851501465, 5.052363395690918, 5.742196083068848, 6.432028770446777, 7.121861457824707, 7.811694145202637, 8.50152587890625, 9.19135856628418, 9.88119125366211, 10.571023941040039, 11.260856628417969, 11.950689315795898, 12.640522003173828, 13.330354690551758, 14.020187377929688, 14.710020065307617, 15.399852752685547, 16.089683532714844, 16.779518127441406, 17.469348907470703, 18.159181594848633, 18.849014282226562, 19.538846969604492, 20.228679656982422, 20.91851234436035, 21.60834503173828, 22.298175811767578, 22.98801040649414]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 11.0, 4.0, 9.0, 7.0, 16.0, 17.0, 33.0, 45.0, 42.0, 60.0, 104.0, 217.0, 455.0, 1282.0, 4600.0, 22958.0, 219807.0, 2653575.0, 1200587.0, 75381.0, 10789.0, 2703.0, 812.0, 338.0, 144.0, 87.0, 45.0, 38.0, 19.0, 24.0, 9.0, 13.0, 13.0, 13.0, 1.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.875, -17.34619140625, -16.8173828125, -16.28857421875, -15.759765625, -15.23095703125, -14.7021484375, -14.17333984375, -13.64453125, -13.11572265625, -12.5869140625, -12.05810546875, -11.529296875, -11.00048828125, -10.4716796875, -9.94287109375, -9.4140625, -8.88525390625, -8.3564453125, -7.82763671875, -7.298828125, -6.77001953125, -6.2412109375, -5.71240234375, -5.18359375, -4.65478515625, -4.1259765625, -3.59716796875, -3.068359375, -2.53955078125, -2.0107421875, -1.48193359375, -0.953125, -0.42431640625, 0.1044921875, 0.63330078125, 1.162109375, 1.69091796875, 2.2197265625, 2.74853515625, 3.27734375, 3.80615234375, 4.3349609375, 4.86376953125, 5.392578125, 5.92138671875, 6.4501953125, 6.97900390625, 7.5078125, 8.03662109375, 8.5654296875, 9.09423828125, 9.623046875, 10.15185546875, 10.6806640625, 11.20947265625, 11.73828125, 12.26708984375, 12.7958984375, 13.32470703125, 13.853515625, 14.38232421875, 14.9111328125, 15.43994140625, 15.96875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 7.0, 4.0, 4.0, 6.0, 10.0, 12.0, 20.0, 25.0, 19.0, 23.0, 26.0, 28.0, 26.0, 35.0, 31.0, 37.0, 48.0, 44.0, 48.0, 42.0, 54.0, 44.0, 41.0, 38.0, 47.0, 32.0, 41.0, 28.0, 24.0, 26.0, 16.0, 24.0, 14.0, 15.0, 15.0, 15.0, 7.0, 3.0, 10.0, 5.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.796875, -6.5836181640625, -6.370361328125, -6.1571044921875, -5.94384765625, -5.7305908203125, -5.517333984375, -5.3040771484375, -5.0908203125, -4.8775634765625, -4.664306640625, -4.4510498046875, -4.23779296875, -4.0245361328125, -3.811279296875, -3.5980224609375, -3.384765625, -3.1715087890625, -2.958251953125, -2.7449951171875, -2.53173828125, -2.3184814453125, -2.105224609375, -1.8919677734375, -1.6787109375, -1.4654541015625, -1.252197265625, -1.0389404296875, -0.82568359375, -0.6124267578125, -0.399169921875, -0.1859130859375, 0.02734375, 0.2406005859375, 0.453857421875, 0.6671142578125, 0.88037109375, 1.0936279296875, 1.306884765625, 1.5201416015625, 1.7333984375, 1.9466552734375, 2.159912109375, 2.3731689453125, 2.58642578125, 2.7996826171875, 3.012939453125, 3.2261962890625, 3.439453125, 3.6527099609375, 3.865966796875, 4.0792236328125, 4.29248046875, 4.5057373046875, 4.718994140625, 4.9322509765625, 5.1455078125, 5.3587646484375, 5.572021484375, 5.7852783203125, 5.99853515625, 6.2117919921875, 6.425048828125, 6.6383056640625, 6.8515625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 2.0, 6.0, 8.0, 17.0, 24.0, 49.0, 116.0, 418.0, 6999.0, 4184786.0, 1412.0, 260.0, 69.0, 33.0, 16.0, 9.0, 10.0, 11.0, 6.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-132.75, -128.8837890625, -125.017578125, -121.1513671875, -117.28515625, -113.4189453125, -109.552734375, -105.6865234375, -101.8203125, -97.9541015625, -94.087890625, -90.2216796875, -86.35546875, -82.4892578125, -78.623046875, -74.7568359375, -70.890625, -67.0244140625, -63.158203125, -59.2919921875, -55.42578125, -51.5595703125, -47.693359375, -43.8271484375, -39.9609375, -36.0947265625, -32.228515625, -28.3623046875, -24.49609375, -20.6298828125, -16.763671875, -12.8974609375, -9.03125, -5.1650390625, -1.298828125, 2.5673828125, 6.43359375, 10.2998046875, 14.166015625, 18.0322265625, 21.8984375, 25.7646484375, 29.630859375, 33.4970703125, 37.36328125, 41.2294921875, 45.095703125, 48.9619140625, 52.828125, 56.6943359375, 60.560546875, 64.4267578125, 68.29296875, 72.1591796875, 76.025390625, 79.8916015625, 83.7578125, 87.6240234375, 91.490234375, 95.3564453125, 99.22265625, 103.0888671875, 106.955078125, 110.8212890625, 114.6875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 6.0, 7.0, 5.0, 11.0, 8.0, 15.0, 28.0, 30.0, 45.0, 76.0, 102.0, 137.0, 209.0, 292.0, 468.0, 553.0, 609.0, 455.0, 310.0, 214.0, 146.0, 97.0, 82.0, 41.0, 32.0, 27.0, 22.0, 16.0, 15.0, 12.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.47265625, -4.3580322265625, -4.243408203125, -4.1287841796875, -4.01416015625, -3.8995361328125, -3.784912109375, -3.6702880859375, -3.5556640625, -3.4410400390625, -3.326416015625, -3.2117919921875, -3.09716796875, -2.9825439453125, -2.867919921875, -2.7532958984375, -2.638671875, -2.5240478515625, -2.409423828125, -2.2947998046875, -2.18017578125, -2.0655517578125, -1.950927734375, -1.8363037109375, -1.7216796875, -1.6070556640625, -1.492431640625, -1.3778076171875, -1.26318359375, -1.1485595703125, -1.033935546875, -0.9193115234375, -0.8046875, -0.6900634765625, -0.575439453125, -0.4608154296875, -0.34619140625, -0.2315673828125, -0.116943359375, -0.0023193359375, 0.1123046875, 0.2269287109375, 0.341552734375, 0.4561767578125, 0.57080078125, 0.6854248046875, 0.800048828125, 0.9146728515625, 1.029296875, 1.1439208984375, 1.258544921875, 1.3731689453125, 1.48779296875, 1.6024169921875, 1.717041015625, 1.8316650390625, 1.9462890625, 2.0609130859375, 2.175537109375, 2.2901611328125, 2.40478515625, 2.5194091796875, 2.634033203125, 2.7486572265625, 2.86328125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 8.0, 0.0, 6.0, 10.0, 14.0, 13.0, 10.0, 17.0, 30.0, 29.0, 54.0, 54.0, 73.0, 60.0, 65.0, 76.0, 77.0, 71.0, 55.0, 39.0, 51.0, 38.0, 38.0, 30.0, 20.0, 16.0, 10.0, 12.0, 7.0, 2.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.781278610229492, -9.463096618652344, -9.144915580749512, -8.826733589172363, -8.508551597595215, -8.190370559692383, -7.872188568115234, -7.554007053375244, -7.235825538635254, -6.917644023895264, -6.599462032318115, -6.281280517578125, -5.963099002838135, -5.6449174880981445, -5.326735496520996, -5.008553981781006, -4.690371990203857, -4.372190475463867, -4.054008483886719, -3.7358269691467285, -3.4176454544067383, -3.099463701248169, -2.7812819480895996, -2.4631004333496094, -2.14491868019104, -1.8267370462417603, -1.5085554122924805, -1.1903736591339111, -0.8721920251846313, -0.5540103912353516, -0.23582863807678223, 0.08235287666320801, 0.40053462982177734, 0.7187162637710571, 1.036897897720337, 1.3550796508789062, 1.673261284828186, 1.9914429187774658, 2.309624671936035, 2.6278061866760254, 2.9459879398345947, 3.264169692993164, 3.5823512077331543, 3.9005329608917236, 4.218714714050293, 4.536896228790283, 4.855077743530273, 5.173259735107422, 5.491441249847412, 5.809622764587402, 6.127804756164551, 6.445986270904541, 6.764167785644531, 7.08234977722168, 7.40053129196167, 7.71871280670166, 8.036894798278809, 8.355076789855957, 8.673257827758789, 8.991439819335938, 9.309621810913086, 9.627802848815918, 9.945984840393066, 10.264165878295898, 10.582347869873047]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 6.0, 11.0, 12.0, 12.0, 11.0, 15.0, 14.0, 17.0, 14.0, 24.0, 35.0, 22.0, 37.0, 27.0, 32.0, 27.0, 46.0, 47.0, 48.0, 39.0, 35.0, 35.0, 50.0, 36.0, 40.0, 38.0, 34.0, 24.0, 30.0, 26.0, 21.0, 26.0, 15.0, 12.0, 17.0, 7.0, 10.0, 10.0, 5.0, 5.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.5965094566345215, -6.381587028503418, -6.1666646003723145, -5.951742172241211, -5.736819744110107, -5.521897315979004, -5.306974411010742, -5.092051982879639, -4.877129554748535, -4.662207126617432, -4.447284698486328, -4.232362270355225, -4.017439842224121, -3.8025171756744385, -3.587594747543335, -3.3726720809936523, -3.157749891281128, -2.9428274631500244, -2.727905035018921, -2.5129823684692383, -2.2980599403381348, -2.0831375122070312, -1.8682150840759277, -1.6532925367355347, -1.4383701086044312, -1.2234476804733276, -1.0085251331329346, -0.793602705001831, -0.5786802172660828, -0.3637577295303345, -0.14883530139923096, 0.06608724594116211, 0.2810096740722656, 0.4959321618080139, 0.7108546495437622, 0.9257770776748657, 1.1406996250152588, 1.3556220531463623, 1.5705444812774658, 1.7854670286178589, 2.000389575958252, 2.2153120040893555, 2.430234432220459, 2.6451568603515625, 2.860079526901245, 3.0750019550323486, 3.289924383163452, 3.5048470497131348, 3.719769239425659, 3.9346916675567627, 4.149614334106445, 4.364536762237549, 4.579459190368652, 4.794381618499756, 5.009304046630859, 5.224226474761963, 5.439148902893066, 5.65407133102417, 5.868993759155273, 6.083916187286377, 6.2988386154174805, 6.513761520385742, 6.7286834716796875, 6.943606376647949, 7.158528804779053]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 5.0, 4.0, 4.0, 4.0, 5.0, 12.0, 26.0, 33.0, 75.0, 146.0, 311.0, 823.0, 2364.0, 7073.0, 26793.0, 118941.0, 412872.0, 357838.0, 91128.0, 20990.0, 5889.0, 1924.0, 733.0, 294.0, 118.0, 57.0, 36.0, 14.0, 12.0, 6.0, 8.0, 5.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.453125, -5.29693603515625, -5.1407470703125, -4.98455810546875, -4.828369140625, -4.67218017578125, -4.5159912109375, -4.35980224609375, -4.20361328125, -4.04742431640625, -3.8912353515625, -3.73504638671875, -3.578857421875, -3.42266845703125, -3.2664794921875, -3.11029052734375, -2.9541015625, -2.79791259765625, -2.6417236328125, -2.48553466796875, -2.329345703125, -2.17315673828125, -2.0169677734375, -1.86077880859375, -1.70458984375, -1.54840087890625, -1.3922119140625, -1.23602294921875, -1.079833984375, -0.92364501953125, -0.7674560546875, -0.61126708984375, -0.455078125, -0.29888916015625, -0.1427001953125, 0.01348876953125, 0.169677734375, 0.32586669921875, 0.4820556640625, 0.63824462890625, 0.79443359375, 0.95062255859375, 1.1068115234375, 1.26300048828125, 1.419189453125, 1.57537841796875, 1.7315673828125, 1.88775634765625, 2.0439453125, 2.20013427734375, 2.3563232421875, 2.51251220703125, 2.668701171875, 2.82489013671875, 2.9810791015625, 3.13726806640625, 3.29345703125, 3.44964599609375, 3.6058349609375, 3.76202392578125, 3.918212890625, 4.07440185546875, 4.2305908203125, 4.38677978515625, 4.54296875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 7.0, 9.0, 8.0, 11.0, 11.0, 21.0, 21.0, 18.0, 16.0, 20.0, 33.0, 26.0, 32.0, 36.0, 31.0, 39.0, 49.0, 35.0, 46.0, 32.0, 35.0, 42.0, 50.0, 38.0, 35.0, 36.0, 32.0, 30.0, 29.0, 27.0, 15.0, 23.0, 11.0, 17.0, 16.0, 11.0, 7.0, 5.0, 10.0, 6.0, 5.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.38671875, -4.255950927734375, -4.12518310546875, -3.994415283203125, -3.8636474609375, -3.732879638671875, -3.60211181640625, -3.471343994140625, -3.340576171875, -3.209808349609375, -3.07904052734375, -2.948272705078125, -2.8175048828125, -2.686737060546875, -2.55596923828125, -2.425201416015625, -2.29443359375, -2.163665771484375, -2.03289794921875, -1.902130126953125, -1.7713623046875, -1.640594482421875, -1.50982666015625, -1.379058837890625, -1.248291015625, -1.117523193359375, -0.98675537109375, -0.855987548828125, -0.7252197265625, -0.594451904296875, -0.46368408203125, -0.332916259765625, -0.2021484375, -0.071380615234375, 0.05938720703125, 0.190155029296875, 0.3209228515625, 0.451690673828125, 0.58245849609375, 0.713226318359375, 0.843994140625, 0.974761962890625, 1.10552978515625, 1.236297607421875, 1.3670654296875, 1.497833251953125, 1.62860107421875, 1.759368896484375, 1.89013671875, 2.020904541015625, 2.15167236328125, 2.282440185546875, 2.4132080078125, 2.543975830078125, 2.67474365234375, 2.805511474609375, 2.936279296875, 3.067047119140625, 3.19781494140625, 3.328582763671875, 3.4593505859375, 3.590118408203125, 3.72088623046875, 3.851654052734375, 3.982421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 4.0, 2.0, 7.0, 13.0, 18.0, 37.0, 48.0, 76.0, 105.0, 160.0, 227.0, 501.0, 873.0, 1856.0, 4526.0, 11979.0, 36067.0, 124516.0, 347909.0, 343399.0, 120933.0, 35446.0, 11596.0, 4333.0, 1861.0, 875.0, 476.0, 242.0, 159.0, 112.0, 62.0, 49.0, 25.0, 24.0, 11.0, 5.0, 13.0, 7.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.80859375, -2.70452880859375, -2.6004638671875, -2.49639892578125, -2.392333984375, -2.28826904296875, -2.1842041015625, -2.08013916015625, -1.97607421875, -1.87200927734375, -1.7679443359375, -1.66387939453125, -1.559814453125, -1.45574951171875, -1.3516845703125, -1.24761962890625, -1.1435546875, -1.03948974609375, -0.9354248046875, -0.83135986328125, -0.727294921875, -0.62322998046875, -0.5191650390625, -0.41510009765625, -0.31103515625, -0.20697021484375, -0.1029052734375, 0.00115966796875, 0.105224609375, 0.20928955078125, 0.3133544921875, 0.41741943359375, 0.521484375, 0.62554931640625, 0.7296142578125, 0.83367919921875, 0.937744140625, 1.04180908203125, 1.1458740234375, 1.24993896484375, 1.35400390625, 1.45806884765625, 1.5621337890625, 1.66619873046875, 1.770263671875, 1.87432861328125, 1.9783935546875, 2.08245849609375, 2.1865234375, 2.29058837890625, 2.3946533203125, 2.49871826171875, 2.602783203125, 2.70684814453125, 2.8109130859375, 2.91497802734375, 3.01904296875, 3.12310791015625, 3.2271728515625, 3.33123779296875, 3.435302734375, 3.53936767578125, 3.6434326171875, 3.74749755859375, 3.8515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 5.0, 6.0, 5.0, 10.0, 11.0, 14.0, 21.0, 19.0, 6.0, 35.0, 41.0, 47.0, 42.0, 42.0, 57.0, 57.0, 34.0, 47.0, 40.0, 50.0, 47.0, 39.0, 38.0, 51.0, 32.0, 24.0, 22.0, 25.0, 24.0, 16.0, 11.0, 22.0, 11.0, 13.0, 6.0, 9.0, 9.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.671875, -8.390869140625, -8.10986328125, -7.828857421875, -7.5478515625, -7.266845703125, -6.98583984375, -6.704833984375, -6.423828125, -6.142822265625, -5.86181640625, -5.580810546875, -5.2998046875, -5.018798828125, -4.73779296875, -4.456787109375, -4.17578125, -3.894775390625, -3.61376953125, -3.332763671875, -3.0517578125, -2.770751953125, -2.48974609375, -2.208740234375, -1.927734375, -1.646728515625, -1.36572265625, -1.084716796875, -0.8037109375, -0.522705078125, -0.24169921875, 0.039306640625, 0.3203125, 0.601318359375, 0.88232421875, 1.163330078125, 1.4443359375, 1.725341796875, 2.00634765625, 2.287353515625, 2.568359375, 2.849365234375, 3.13037109375, 3.411376953125, 3.6923828125, 3.973388671875, 4.25439453125, 4.535400390625, 4.81640625, 5.097412109375, 5.37841796875, 5.659423828125, 5.9404296875, 6.221435546875, 6.50244140625, 6.783447265625, 7.064453125, 7.345458984375, 7.62646484375, 7.907470703125, 8.1884765625, 8.469482421875, 8.75048828125, 9.031494140625, 9.3125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 10.0, 12.0, 17.0, 16.0, 31.0, 43.0, 60.0, 96.0, 179.0, 287.0, 449.0, 798.0, 1584.0, 3134.0, 6822.0, 17188.0, 53366.0, 208552.0, 469180.0, 204301.0, 51859.0, 16974.0, 6795.0, 3204.0, 1554.0, 840.0, 488.0, 275.0, 152.0, 93.0, 74.0, 38.0, 27.0, 24.0, 6.0, 10.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.8359375, -1.784210205078125, -1.73248291015625, -1.680755615234375, -1.6290283203125, -1.577301025390625, -1.52557373046875, -1.473846435546875, -1.422119140625, -1.370391845703125, -1.31866455078125, -1.266937255859375, -1.2152099609375, -1.163482666015625, -1.11175537109375, -1.060028076171875, -1.00830078125, -0.956573486328125, -0.90484619140625, -0.853118896484375, -0.8013916015625, -0.749664306640625, -0.69793701171875, -0.646209716796875, -0.594482421875, -0.542755126953125, -0.49102783203125, -0.439300537109375, -0.3875732421875, -0.335845947265625, -0.28411865234375, -0.232391357421875, -0.1806640625, -0.128936767578125, -0.07720947265625, -0.025482177734375, 0.0262451171875, 0.077972412109375, 0.12969970703125, 0.181427001953125, 0.233154296875, 0.284881591796875, 0.33660888671875, 0.388336181640625, 0.4400634765625, 0.491790771484375, 0.54351806640625, 0.595245361328125, 0.64697265625, 0.698699951171875, 0.75042724609375, 0.802154541015625, 0.8538818359375, 0.905609130859375, 0.95733642578125, 1.009063720703125, 1.060791015625, 1.112518310546875, 1.16424560546875, 1.215972900390625, 1.2677001953125, 1.319427490234375, 1.37115478515625, 1.422882080078125, 1.474609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 5.0, 17.0, 16.0, 21.0, 40.0, 54.0, 87.0, 113.0, 131.0, 126.0, 100.0, 78.0, 57.0, 45.0, 24.0, 19.0, 12.0, 10.0, 4.0, 7.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010061264038085938, -0.0009714365005493164, -0.0009367465972900391, -0.0009020566940307617, -0.0008673667907714844, -0.000832676887512207, -0.0007979869842529297, -0.0007632970809936523, -0.000728607177734375, -0.0006939172744750977, -0.0006592273712158203, -0.000624537467956543, -0.0005898475646972656, -0.0005551576614379883, -0.0005204677581787109, -0.0004857778549194336, -0.00045108795166015625, -0.0004163980484008789, -0.00038170814514160156, -0.0003470182418823242, -0.0003123283386230469, -0.00027763843536376953, -0.0002429485321044922, -0.00020825862884521484, -0.0001735687255859375, -0.00013887882232666016, -0.00010418891906738281, -6.949901580810547e-05, -3.4809112548828125e-05, -1.1920928955078125e-07, 3.457069396972656e-05, 6.92605972290039e-05, 0.00010395050048828125, 0.0001386404037475586, 0.00017333030700683594, 0.00020802021026611328, 0.00024271011352539062, 0.00027740001678466797, 0.0003120899200439453, 0.00034677982330322266, 0.0003814697265625, 0.00041615962982177734, 0.0004508495330810547, 0.00048553943634033203, 0.0005202293395996094, 0.0005549192428588867, 0.0005896091461181641, 0.0006242990493774414, 0.0006589889526367188, 0.0006936788558959961, 0.0007283687591552734, 0.0007630586624145508, 0.0007977485656738281, 0.0008324384689331055, 0.0008671283721923828, 0.0009018182754516602, 0.0009365081787109375, 0.0009711980819702148, 0.0010058879852294922, 0.0010405778884887695, 0.0010752677917480469, 0.0011099576950073242, 0.0011446475982666016, 0.001179337501525879, 0.0012140274047851562]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 7.0, 6.0, 7.0, 9.0, 12.0, 18.0, 24.0, 51.0, 70.0, 189.0, 427.0, 1286.0, 5317.0, 46516.0, 679223.0, 293484.0, 17530.0, 2955.0, 754.0, 327.0, 151.0, 65.0, 45.0, 22.0, 15.0, 11.0, 10.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.40625, -4.289703369140625, -4.17315673828125, -4.056610107421875, -3.9400634765625, -3.823516845703125, -3.70697021484375, -3.590423583984375, -3.473876953125, -3.357330322265625, -3.24078369140625, -3.124237060546875, -3.0076904296875, -2.891143798828125, -2.77459716796875, -2.658050537109375, -2.54150390625, -2.424957275390625, -2.30841064453125, -2.191864013671875, -2.0753173828125, -1.958770751953125, -1.84222412109375, -1.725677490234375, -1.609130859375, -1.492584228515625, -1.37603759765625, -1.259490966796875, -1.1429443359375, -1.026397705078125, -0.90985107421875, -0.793304443359375, -0.6767578125, -0.560211181640625, -0.44366455078125, -0.327117919921875, -0.2105712890625, -0.094024658203125, 0.02252197265625, 0.139068603515625, 0.255615234375, 0.372161865234375, 0.48870849609375, 0.605255126953125, 0.7218017578125, 0.838348388671875, 0.95489501953125, 1.071441650390625, 1.18798828125, 1.304534912109375, 1.42108154296875, 1.537628173828125, 1.6541748046875, 1.770721435546875, 1.88726806640625, 2.003814697265625, 2.120361328125, 2.236907958984375, 2.35345458984375, 2.470001220703125, 2.5865478515625, 2.703094482421875, 2.81964111328125, 2.936187744140625, 3.052734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 7.0, 3.0, 4.0, 10.0, 7.0, 3.0, 14.0, 13.0, 25.0, 17.0, 21.0, 42.0, 45.0, 51.0, 54.0, 55.0, 73.0, 76.0, 86.0, 61.0, 54.0, 45.0, 44.0, 40.0, 33.0, 26.0, 15.0, 11.0, 14.0, 15.0, 10.0, 4.0, 5.0, 6.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.367431640625, -0.3549079895019531, -0.34238433837890625, -0.3298606872558594, -0.3173370361328125, -0.3048133850097656, -0.29228973388671875, -0.2797660827636719, -0.267242431640625, -0.2547187805175781, -0.24219512939453125, -0.22967147827148438, -0.2171478271484375, -0.20462417602539062, -0.19210052490234375, -0.17957687377929688, -0.16705322265625, -0.15452957153320312, -0.14200592041015625, -0.12948226928710938, -0.1169586181640625, -0.10443496704101562, -0.09191131591796875, -0.07938766479492188, -0.066864013671875, -0.054340362548828125, -0.04181671142578125, -0.029293060302734375, -0.0167694091796875, -0.004245758056640625, 0.00827789306640625, 0.020801544189453125, 0.0333251953125, 0.045848846435546875, 0.05837249755859375, 0.07089614868164062, 0.0834197998046875, 0.09594345092773438, 0.10846710205078125, 0.12099075317382812, 0.133514404296875, 0.14603805541992188, 0.15856170654296875, 0.17108535766601562, 0.1836090087890625, 0.19613265991210938, 0.20865631103515625, 0.22117996215820312, 0.23370361328125, 0.24622726440429688, 0.25875091552734375, 0.2712745666503906, 0.2837982177734375, 0.2963218688964844, 0.30884552001953125, 0.3213691711425781, 0.333892822265625, 0.3464164733886719, 0.35894012451171875, 0.3714637756347656, 0.3839874267578125, 0.3965110778808594, 0.40903472900390625, 0.4215583801269531, 0.43408203125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 4.0, 11.0, 15.0, 16.0, 16.0, 33.0, 40.0, 48.0, 71.0, 90.0, 93.0, 98.0, 78.0, 82.0, 57.0, 64.0, 49.0, 32.0, 35.0, 19.0, 12.0, 11.0, 4.0, 2.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.510340690612793, -7.27992057800293, -7.049500942230225, -6.8190813064575195, -6.588661193847656, -6.358241081237793, -6.127821445465088, -5.897401809692383, -5.6669816970825195, -5.436561584472656, -5.206141948699951, -4.975722312927246, -4.745302200317383, -4.5148820877075195, -4.2844624519348145, -4.054042816162109, -3.823622703552246, -3.593202829360962, -3.3627829551696777, -3.1323630809783936, -2.9019432067871094, -2.671523332595825, -2.441103458404541, -2.210683584213257, -1.9802637100219727, -1.7498438358306885, -1.5194239616394043, -1.2890040874481201, -1.058584213256836, -0.8281643390655518, -0.5977444648742676, -0.3673245906829834, -0.13690471649169922, 0.09351515769958496, 0.32393503189086914, 0.5543549060821533, 0.7847747802734375, 1.0151946544647217, 1.2456145286560059, 1.47603440284729, 1.7064542770385742, 1.9368741512298584, 2.1672940254211426, 2.3977138996124268, 2.628133773803711, 2.858553647994995, 3.0889735221862793, 3.3193933963775635, 3.5498132705688477, 3.780233144760132, 4.010653018951416, 4.241072654724121, 4.471492767333984, 4.701912879943848, 4.932332515716553, 5.162752151489258, 5.393172264099121, 5.623592376708984, 5.8540120124816895, 6.0844316482543945, 6.314851760864258, 6.545271873474121, 6.775691509246826, 7.006111145019531, 7.2365312576293945]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 1.0, 3.0, 4.0, 5.0, 7.0, 16.0, 11.0, 15.0, 14.0, 18.0, 36.0, 31.0, 32.0, 34.0, 37.0, 42.0, 47.0, 42.0, 46.0, 51.0, 47.0, 55.0, 41.0, 54.0, 46.0, 42.0, 48.0, 37.0, 26.0, 25.0, 14.0, 10.0, 16.0, 10.0, 12.0, 7.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.022800445556641, -4.865961074829102, -4.709122180938721, -4.552282810211182, -4.395443916320801, -4.238604545593262, -4.081765174865723, -3.9249260425567627, -3.7680869102478027, -3.6112477779388428, -3.454408645629883, -3.2975692749023438, -3.140730142593384, -2.983891010284424, -2.8270516395568848, -2.670212507247925, -2.513373374938965, -2.356534242630005, -2.199695110321045, -2.042855739593506, -1.886016607284546, -1.729177474975586, -1.5723382234573364, -1.415498971939087, -1.258659839630127, -1.101820707321167, -0.9449814558029175, -0.7881422638893127, -0.631303071975708, -0.47446388006210327, -0.31762468814849854, -0.16078543663024902, -0.003946781158447266, 0.15289241075515747, 0.3097316026687622, 0.46657079458236694, 0.6234099864959717, 0.7802491784095764, 0.9370883703231812, 1.0939276218414307, 1.2507667541503906, 1.4076058864593506, 1.5644451379776, 1.7212843894958496, 1.8781235218048096, 2.0349626541137695, 2.1918020248413086, 2.3486411571502686, 2.5054802894592285, 2.6623194217681885, 2.8191585540771484, 2.9759979248046875, 3.1328370571136475, 3.2896761894226074, 3.4465155601501465, 3.6033546924591064, 3.7601938247680664, 3.9170329570770264, 4.073872089385986, 4.230711460113525, 4.387550354003906, 4.544389724731445, 4.701229095458984, 4.858068466186523, 5.014907360076904]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 1.0, 3.0, 2.0, 3.0, 2.0, 16.0, 18.0, 23.0, 30.0, 48.0, 96.0, 181.0, 392.0, 836.0, 1921.0, 5112.0, 14827.0, 47143.0, 181423.0, 573605.0, 158986.0, 42449.0, 13428.0, 4635.0, 1878.0, 720.0, 340.0, 187.0, 89.0, 57.0, 27.0, 19.0, 13.0, 12.0, 8.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.515625, -6.31488037109375, -6.1141357421875, -5.91339111328125, -5.712646484375, -5.51190185546875, -5.3111572265625, -5.11041259765625, -4.90966796875, -4.70892333984375, -4.5081787109375, -4.30743408203125, -4.106689453125, -3.90594482421875, -3.7052001953125, -3.50445556640625, -3.3037109375, -3.10296630859375, -2.9022216796875, -2.70147705078125, -2.500732421875, -2.29998779296875, -2.0992431640625, -1.89849853515625, -1.69775390625, -1.49700927734375, -1.2962646484375, -1.09552001953125, -0.894775390625, -0.69403076171875, -0.4932861328125, -0.29254150390625, -0.091796875, 0.10894775390625, 0.3096923828125, 0.51043701171875, 0.711181640625, 0.91192626953125, 1.1126708984375, 1.31341552734375, 1.51416015625, 1.71490478515625, 1.9156494140625, 2.11639404296875, 2.317138671875, 2.51788330078125, 2.7186279296875, 2.91937255859375, 3.1201171875, 3.32086181640625, 3.5216064453125, 3.72235107421875, 3.923095703125, 4.12384033203125, 4.3245849609375, 4.52532958984375, 4.72607421875, 4.92681884765625, 5.1275634765625, 5.32830810546875, 5.529052734375, 5.72979736328125, 5.9305419921875, 6.13128662109375, 6.33203125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 4.0, 8.0, 14.0, 9.0, 16.0, 17.0, 20.0, 24.0, 39.0, 36.0, 42.0, 38.0, 40.0, 50.0, 68.0, 58.0, 53.0, 42.0, 58.0, 42.0, 49.0, 51.0, 42.0, 32.0, 31.0, 29.0, 13.0, 16.0, 21.0, 12.0, 9.0, 7.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2109375, -11.8074951171875, -11.404052734375, -11.0006103515625, -10.59716796875, -10.1937255859375, -9.790283203125, -9.3868408203125, -8.9833984375, -8.5799560546875, -8.176513671875, -7.7730712890625, -7.36962890625, -6.9661865234375, -6.562744140625, -6.1593017578125, -5.755859375, -5.3524169921875, -4.948974609375, -4.5455322265625, -4.14208984375, -3.7386474609375, -3.335205078125, -2.9317626953125, -2.5283203125, -2.1248779296875, -1.721435546875, -1.3179931640625, -0.91455078125, -0.5111083984375, -0.107666015625, 0.2957763671875, 0.69921875, 1.1026611328125, 1.506103515625, 1.9095458984375, 2.31298828125, 2.7164306640625, 3.119873046875, 3.5233154296875, 3.9267578125, 4.3302001953125, 4.733642578125, 5.1370849609375, 5.54052734375, 5.9439697265625, 6.347412109375, 6.7508544921875, 7.154296875, 7.5577392578125, 7.961181640625, 8.3646240234375, 8.76806640625, 9.1715087890625, 9.574951171875, 9.9783935546875, 10.3818359375, 10.7852783203125, 11.188720703125, 11.5921630859375, 11.99560546875, 12.3990478515625, 12.802490234375, 13.2059326171875, 13.609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 6.0, 10.0, 13.0, 5.0, 11.0, 19.0, 18.0, 25.0, 29.0, 29.0, 31.0, 25.0, 41.0, 47.0, 42.0, 60.0, 262.0, 39092.0, 1006874.0, 1415.0, 96.0, 57.0, 53.0, 44.0, 40.0, 36.0, 25.0, 33.0, 17.0, 18.0, 25.0, 6.0, 9.0, 4.0, 4.0, 12.0, 5.0, 3.0, 3.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-42.78125, -41.45458984375, -40.1279296875, -38.80126953125, -37.474609375, -36.14794921875, -34.8212890625, -33.49462890625, -32.16796875, -30.84130859375, -29.5146484375, -28.18798828125, -26.861328125, -25.53466796875, -24.2080078125, -22.88134765625, -21.5546875, -20.22802734375, -18.9013671875, -17.57470703125, -16.248046875, -14.92138671875, -13.5947265625, -12.26806640625, -10.94140625, -9.61474609375, -8.2880859375, -6.96142578125, -5.634765625, -4.30810546875, -2.9814453125, -1.65478515625, -0.328125, 0.99853515625, 2.3251953125, 3.65185546875, 4.978515625, 6.30517578125, 7.6318359375, 8.95849609375, 10.28515625, 11.61181640625, 12.9384765625, 14.26513671875, 15.591796875, 16.91845703125, 18.2451171875, 19.57177734375, 20.8984375, 22.22509765625, 23.5517578125, 24.87841796875, 26.205078125, 27.53173828125, 28.8583984375, 30.18505859375, 31.51171875, 32.83837890625, 34.1650390625, 35.49169921875, 36.818359375, 38.14501953125, 39.4716796875, 40.79833984375, 42.125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 14.0, 9.0, 12.0, 15.0, 15.0, 13.0, 24.0, 25.0, 27.0, 29.0, 31.0, 31.0, 37.0, 36.0, 39.0, 47.0, 49.0, 34.0, 42.0, 43.0, 46.0, 46.0, 45.0, 45.0, 40.0, 26.0, 23.0, 29.0, 24.0, 24.0, 15.0, 13.0, 9.0, 5.0, 7.0, 6.0, 3.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.234375, -10.882080078125, -10.52978515625, -10.177490234375, -9.8251953125, -9.472900390625, -9.12060546875, -8.768310546875, -8.416015625, -8.063720703125, -7.71142578125, -7.359130859375, -7.0068359375, -6.654541015625, -6.30224609375, -5.949951171875, -5.59765625, -5.245361328125, -4.89306640625, -4.540771484375, -4.1884765625, -3.836181640625, -3.48388671875, -3.131591796875, -2.779296875, -2.427001953125, -2.07470703125, -1.722412109375, -1.3701171875, -1.017822265625, -0.66552734375, -0.313232421875, 0.0390625, 0.391357421875, 0.74365234375, 1.095947265625, 1.4482421875, 1.800537109375, 2.15283203125, 2.505126953125, 2.857421875, 3.209716796875, 3.56201171875, 3.914306640625, 4.2666015625, 4.618896484375, 4.97119140625, 5.323486328125, 5.67578125, 6.028076171875, 6.38037109375, 6.732666015625, 7.0849609375, 7.437255859375, 7.78955078125, 8.141845703125, 8.494140625, 8.846435546875, 9.19873046875, 9.551025390625, 9.9033203125, 10.255615234375, 10.60791015625, 10.960205078125, 11.3125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 0.0, 4.0, 4.0, 7.0, 5.0, 12.0, 15.0, 36.0, 43.0, 93.0, 243.0, 735.0, 3053.0, 26955.0, 756438.0, 246382.0, 11907.0, 1837.0, 435.0, 172.0, 71.0, 50.0, 19.0, 13.0, 10.0, 6.0, 4.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.609375, -3.46405029296875, -3.3187255859375, -3.17340087890625, -3.028076171875, -2.88275146484375, -2.7374267578125, -2.59210205078125, -2.44677734375, -2.30145263671875, -2.1561279296875, -2.01080322265625, -1.865478515625, -1.72015380859375, -1.5748291015625, -1.42950439453125, -1.2841796875, -1.13885498046875, -0.9935302734375, -0.84820556640625, -0.702880859375, -0.55755615234375, -0.4122314453125, -0.26690673828125, -0.12158203125, 0.02374267578125, 0.1690673828125, 0.31439208984375, 0.459716796875, 0.60504150390625, 0.7503662109375, 0.89569091796875, 1.041015625, 1.18634033203125, 1.3316650390625, 1.47698974609375, 1.622314453125, 1.76763916015625, 1.9129638671875, 2.05828857421875, 2.20361328125, 2.34893798828125, 2.4942626953125, 2.63958740234375, 2.784912109375, 2.93023681640625, 3.0755615234375, 3.22088623046875, 3.3662109375, 3.51153564453125, 3.6568603515625, 3.80218505859375, 3.947509765625, 4.09283447265625, 4.2381591796875, 4.38348388671875, 4.52880859375, 4.67413330078125, 4.8194580078125, 4.96478271484375, 5.110107421875, 5.25543212890625, 5.4007568359375, 5.54608154296875, 5.69140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 9.0, 10.0, 18.0, 27.0, 28.0, 36.0, 64.0, 105.0, 136.0, 164.0, 127.0, 79.0, 48.0, 51.0, 29.0, 24.0, 15.0, 9.0, 8.0, 6.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003349781036376953, -0.00032065436244010925, -0.0003063306212425232, -0.00029200688004493713, -0.0002776831388473511, -0.000263359397649765, -0.00024903565645217896, -0.0002347119152545929, -0.00022038817405700684, -0.00020606443285942078, -0.00019174069166183472, -0.00017741695046424866, -0.0001630932092666626, -0.00014876946806907654, -0.00013444572687149048, -0.00012012198567390442, -0.00010579824447631836, -9.14745032787323e-05, -7.715076208114624e-05, -6.282702088356018e-05, -4.850327968597412e-05, -3.417953848838806e-05, -1.9855797290802002e-05, -5.532056093215942e-06, 8.791685104370117e-06, 2.3115426301956177e-05, 3.7439167499542236e-05, 5.1762908697128296e-05, 6.608664989471436e-05, 8.041039109230042e-05, 9.473413228988647e-05, 0.00010905787348747253, 0.0001233816146850586, 0.00013770535588264465, 0.0001520290970802307, 0.00016635283827781677, 0.00018067657947540283, 0.0001950003206729889, 0.00020932406187057495, 0.000223647803068161, 0.00023797154426574707, 0.00025229528546333313, 0.0002666190266609192, 0.00028094276785850525, 0.0002952665090560913, 0.00030959025025367737, 0.00032391399145126343, 0.0003382377326488495, 0.00035256147384643555, 0.0003668852150440216, 0.00038120895624160767, 0.0003955326974391937, 0.0004098564386367798, 0.00042418017983436584, 0.0004385039210319519, 0.00045282766222953796, 0.000467151403427124, 0.0004814751446247101, 0.0004957988858222961, 0.0005101226270198822, 0.0005244463682174683, 0.0005387701094150543, 0.0005530938506126404, 0.0005674175918102264, 0.0005817413330078125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 12.0, 15.0, 18.0, 18.0, 42.0, 64.0, 132.0, 232.0, 443.0, 993.0, 2236.0, 5778.0, 17144.0, 62981.0, 283357.0, 529318.0, 104923.0, 26783.0, 8363.0, 3043.0, 1377.0, 598.0, 300.0, 154.0, 74.0, 62.0, 31.0, 21.0, 12.0, 12.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9736328125, -1.914154052734375, -1.85467529296875, -1.795196533203125, -1.7357177734375, -1.676239013671875, -1.61676025390625, -1.557281494140625, -1.497802734375, -1.438323974609375, -1.37884521484375, -1.319366455078125, -1.2598876953125, -1.200408935546875, -1.14093017578125, -1.081451416015625, -1.02197265625, -0.962493896484375, -0.90301513671875, -0.843536376953125, -0.7840576171875, -0.724578857421875, -0.66510009765625, -0.605621337890625, -0.546142578125, -0.486663818359375, -0.42718505859375, -0.367706298828125, -0.3082275390625, -0.248748779296875, -0.18927001953125, -0.129791259765625, -0.0703125, -0.010833740234375, 0.04864501953125, 0.108123779296875, 0.1676025390625, 0.227081298828125, 0.28656005859375, 0.346038818359375, 0.405517578125, 0.464996337890625, 0.52447509765625, 0.583953857421875, 0.6434326171875, 0.702911376953125, 0.76239013671875, 0.821868896484375, 0.88134765625, 0.940826416015625, 1.00030517578125, 1.059783935546875, 1.1192626953125, 1.178741455078125, 1.23822021484375, 1.297698974609375, 1.357177734375, 1.416656494140625, 1.47613525390625, 1.535614013671875, 1.5950927734375, 1.654571533203125, 1.71405029296875, 1.773529052734375, 1.8330078125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 9.0, 12.0, 20.0, 31.0, 26.0, 56.0, 70.0, 95.0, 167.0, 145.0, 99.0, 66.0, 50.0, 31.0, 22.0, 24.0, 19.0, 8.0, 8.0, 7.0, 2.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90283203125, -0.8706130981445312, -0.8383941650390625, -0.8061752319335938, -0.773956298828125, -0.7417373657226562, -0.7095184326171875, -0.6772994995117188, -0.64508056640625, -0.6128616333007812, -0.5806427001953125, -0.5484237670898438, -0.516204833984375, -0.48398590087890625, -0.4517669677734375, -0.41954803466796875, -0.3873291015625, -0.35511016845703125, -0.3228912353515625, -0.29067230224609375, -0.258453369140625, -0.22623443603515625, -0.1940155029296875, -0.16179656982421875, -0.12957763671875, -0.09735870361328125, -0.0651397705078125, -0.03292083740234375, -0.000701904296875, 0.03151702880859375, 0.0637359619140625, 0.09595489501953125, 0.128173828125, 0.16039276123046875, 0.1926116943359375, 0.22483062744140625, 0.257049560546875, 0.28926849365234375, 0.3214874267578125, 0.35370635986328125, 0.38592529296875, 0.41814422607421875, 0.4503631591796875, 0.48258209228515625, 0.514801025390625, 0.5470199584960938, 0.5792388916015625, 0.6114578247070312, 0.6436767578125, 0.6758956909179688, 0.7081146240234375, 0.7403335571289062, 0.772552490234375, 0.8047714233398438, 0.8369903564453125, 0.8692092895507812, 0.90142822265625, 0.9336471557617188, 0.9658660888671875, 0.9980850219726562, 1.030303955078125, 1.0625228881835938, 1.0947418212890625, 1.1269607543945312, 1.1591796875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 22.0, 198.0, 597.0, 173.0, 23.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.588369369506836, -18.250732421875, -14.913095474243164, -11.575459480285645, -8.237822532653809, -4.900186538696289, -1.5625495910644531, 1.7750873565673828, 5.112724304199219, 8.450361251831055, 11.78799819946289, 15.12563419342041, 18.463272094726562, 21.800907135009766, 25.1385440826416, 28.476181030273438, 31.813817977905273, 35.15145492553711, 38.48908996582031, 41.82672882080078, 45.164363861083984, 48.50199890136719, 51.839637756347656, 55.177276611328125, 58.51491165161133, 61.85254669189453, 65.190185546875, 68.52782440185547, 71.8654556274414, 75.20309448242188, 78.54073333740234, 81.87837219238281, 85.21601104736328, 88.55364990234375, 91.89128112792969, 95.22891998291016, 98.56655883789062, 101.90419006347656, 105.24182891845703, 108.5794677734375, 111.91710662841797, 115.25474548339844, 118.59237670898438, 121.93001556396484, 125.26765441894531, 128.60528564453125, 131.94293212890625, 135.2805633544922, 138.61819458007812, 141.95582580566406, 145.29347229003906, 148.631103515625, 151.96873474121094, 155.30638122558594, 158.64401245117188, 161.98165893554688, 165.3192901611328, 168.65692138671875, 171.99456787109375, 175.3321990966797, 178.66983032226562, 182.00747680664062, 185.34510803222656, 188.6827392578125, 192.0203857421875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 0.0, 5.0, 8.0, 4.0, 12.0, 7.0, 20.0, 14.0, 24.0, 26.0, 26.0, 24.0, 37.0, 30.0, 27.0, 47.0, 47.0, 45.0, 50.0, 33.0, 45.0, 42.0, 48.0, 41.0, 43.0, 37.0, 28.0, 43.0, 36.0, 25.0, 20.0, 23.0, 16.0, 16.0, 12.0, 8.0, 9.0, 9.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.859529495239258, -16.338594436645508, -15.817657470703125, -15.296721458435059, -14.775785446166992, -14.254849433898926, -13.73391342163086, -13.21297836303711, -12.692041397094727, -12.17110538482666, -11.650169372558594, -11.129233360290527, -10.608297348022461, -10.087361335754395, -9.566425323486328, -9.045490264892578, -8.524554252624512, -8.003618240356445, -7.482682228088379, -6.9617462158203125, -6.440810203552246, -5.91987419128418, -5.3989386558532715, -4.878002643585205, -4.357066631317139, -3.8361306190490723, -3.315194606781006, -2.7942588329315186, -2.273322820663452, -1.7523868083953857, -1.2314510345458984, -0.710515022277832, -0.18957901000976562, 0.331356942653656, 0.8522928953170776, 1.3732287883758545, 1.894164800643921, 2.4151008129119873, 2.9360365867614746, 3.456972599029541, 3.9779086112976074, 4.498844623565674, 5.01978063583374, 5.540716171264648, 6.061652183532715, 6.582588195800781, 7.103524208068848, 7.624460220336914, 8.14539623260498, 8.666332244873047, 9.187268257141113, 9.70820426940918, 10.229140281677246, 10.750076293945312, 11.271011352539062, 11.791948318481445, 12.312883377075195, 12.833819389343262, 13.354755401611328, 13.875691413879395, 14.396627426147461, 14.917563438415527, 15.438499450683594, 15.959434509277344, 16.480371475219727]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 5.0, 1.0, 3.0, 8.0, 3.0, 9.0, 6.0, 11.0, 10.0, 16.0, 24.0, 24.0, 33.0, 31.0, 50.0, 62.0, 144.0, 301.0, 681.0, 1870.0, 6532.0, 35182.0, 421020.0, 3093070.0, 579274.0, 44545.0, 7828.0, 2095.0, 725.0, 294.0, 143.0, 68.0, 56.0, 26.0, 22.0, 16.0, 19.0, 11.0, 15.0, 8.0, 13.0, 11.0, 7.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4375, -13.9649658203125, -13.492431640625, -13.0198974609375, -12.54736328125, -12.0748291015625, -11.602294921875, -11.1297607421875, -10.6572265625, -10.1846923828125, -9.712158203125, -9.2396240234375, -8.76708984375, -8.2945556640625, -7.822021484375, -7.3494873046875, -6.876953125, -6.4044189453125, -5.931884765625, -5.4593505859375, -4.98681640625, -4.5142822265625, -4.041748046875, -3.5692138671875, -3.0966796875, -2.6241455078125, -2.151611328125, -1.6790771484375, -1.20654296875, -0.7340087890625, -0.261474609375, 0.2110595703125, 0.68359375, 1.1561279296875, 1.628662109375, 2.1011962890625, 2.57373046875, 3.0462646484375, 3.518798828125, 3.9913330078125, 4.4638671875, 4.9364013671875, 5.408935546875, 5.8814697265625, 6.35400390625, 6.8265380859375, 7.299072265625, 7.7716064453125, 8.244140625, 8.7166748046875, 9.189208984375, 9.6617431640625, 10.13427734375, 10.6068115234375, 11.079345703125, 11.5518798828125, 12.0244140625, 12.4969482421875, 12.969482421875, 13.4420166015625, 13.91455078125, 14.3870849609375, 14.859619140625, 15.3321533203125, 15.8046875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 0.0, 7.0, 5.0, 6.0, 9.0, 11.0, 9.0, 13.0, 22.0, 24.0, 14.0, 25.0, 39.0, 38.0, 45.0, 48.0, 52.0, 52.0, 47.0, 52.0, 49.0, 61.0, 59.0, 41.0, 46.0, 40.0, 30.0, 19.0, 29.0, 22.0, 23.0, 16.0, 9.0, 10.0, 7.0, 5.0, 8.0, 2.0, 3.0, 5.0, 6.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7578125, -7.5338134765625, -7.309814453125, -7.0858154296875, -6.86181640625, -6.6378173828125, -6.413818359375, -6.1898193359375, -5.9658203125, -5.7418212890625, -5.517822265625, -5.2938232421875, -5.06982421875, -4.8458251953125, -4.621826171875, -4.3978271484375, -4.173828125, -3.9498291015625, -3.725830078125, -3.5018310546875, -3.27783203125, -3.0538330078125, -2.829833984375, -2.6058349609375, -2.3818359375, -2.1578369140625, -1.933837890625, -1.7098388671875, -1.48583984375, -1.2618408203125, -1.037841796875, -0.8138427734375, -0.58984375, -0.3658447265625, -0.141845703125, 0.0821533203125, 0.30615234375, 0.5301513671875, 0.754150390625, 0.9781494140625, 1.2021484375, 1.4261474609375, 1.650146484375, 1.8741455078125, 2.09814453125, 2.3221435546875, 2.546142578125, 2.7701416015625, 2.994140625, 3.2181396484375, 3.442138671875, 3.6661376953125, 3.89013671875, 4.1141357421875, 4.338134765625, 4.5621337890625, 4.7861328125, 5.0101318359375, 5.234130859375, 5.4581298828125, 5.68212890625, 5.9061279296875, 6.130126953125, 6.3541259765625, 6.578125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 5.0, 16.0, 22.0, 26.0, 63.0, 108.0, 153.0, 445.0, 1747.0, 34142.0, 4000105.0, 153264.0, 3177.0, 524.0, 219.0, 99.0, 54.0, 36.0, 21.0, 13.0, 9.0, 10.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.625, -39.649658203125, -38.67431640625, -37.698974609375, -36.7236328125, -35.748291015625, -34.77294921875, -33.797607421875, -32.822265625, -31.846923828125, -30.87158203125, -29.896240234375, -28.9208984375, -27.945556640625, -26.97021484375, -25.994873046875, -25.01953125, -24.044189453125, -23.06884765625, -22.093505859375, -21.1181640625, -20.142822265625, -19.16748046875, -18.192138671875, -17.216796875, -16.241455078125, -15.26611328125, -14.290771484375, -13.3154296875, -12.340087890625, -11.36474609375, -10.389404296875, -9.4140625, -8.438720703125, -7.46337890625, -6.488037109375, -5.5126953125, -4.537353515625, -3.56201171875, -2.586669921875, -1.611328125, -0.635986328125, 0.33935546875, 1.314697265625, 2.2900390625, 3.265380859375, 4.24072265625, 5.216064453125, 6.19140625, 7.166748046875, 8.14208984375, 9.117431640625, 10.0927734375, 11.068115234375, 12.04345703125, 13.018798828125, 13.994140625, 14.969482421875, 15.94482421875, 16.920166015625, 17.8955078125, 18.870849609375, 19.84619140625, 20.821533203125, 21.796875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 5.0, 5.0, 12.0, 6.0, 13.0, 23.0, 27.0, 35.0, 49.0, 46.0, 78.0, 124.0, 152.0, 222.0, 295.0, 456.0, 510.0, 495.0, 442.0, 305.0, 223.0, 125.0, 108.0, 74.0, 59.0, 40.0, 44.0, 25.0, 20.0, 21.0, 11.0, 4.0, 5.0, 7.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.111328125, -2.026458740234375, -1.94158935546875, -1.856719970703125, -1.7718505859375, -1.686981201171875, -1.60211181640625, -1.517242431640625, -1.432373046875, -1.347503662109375, -1.26263427734375, -1.177764892578125, -1.0928955078125, -1.008026123046875, -0.92315673828125, -0.838287353515625, -0.75341796875, -0.668548583984375, -0.58367919921875, -0.498809814453125, -0.4139404296875, -0.329071044921875, -0.24420166015625, -0.159332275390625, -0.074462890625, 0.010406494140625, 0.09527587890625, 0.180145263671875, 0.2650146484375, 0.349884033203125, 0.43475341796875, 0.519622802734375, 0.6044921875, 0.689361572265625, 0.77423095703125, 0.859100341796875, 0.9439697265625, 1.028839111328125, 1.11370849609375, 1.198577880859375, 1.283447265625, 1.368316650390625, 1.45318603515625, 1.538055419921875, 1.6229248046875, 1.707794189453125, 1.79266357421875, 1.877532958984375, 1.96240234375, 2.047271728515625, 2.13214111328125, 2.217010498046875, 2.3018798828125, 2.386749267578125, 2.47161865234375, 2.556488037109375, 2.641357421875, 2.726226806640625, 2.81109619140625, 2.895965576171875, 2.9808349609375, 3.065704345703125, 3.15057373046875, 3.235443115234375, 3.3203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 11.0, 10.0, 7.0, 14.0, 14.0, 23.0, 20.0, 32.0, 45.0, 51.0, 58.0, 97.0, 90.0, 66.0, 74.0, 76.0, 63.0, 57.0, 42.0, 33.0, 25.0, 33.0, 21.0, 8.0, 6.0, 7.0, 10.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.709470748901367, -11.387870788574219, -11.06627082824707, -10.744669914245605, -10.423069953918457, -10.101469993591309, -9.779869079589844, -9.458269119262695, -9.136669158935547, -8.815069198608398, -8.49346923828125, -8.171868324279785, -7.850268363952637, -7.528668403625488, -7.207067966461182, -6.885467529296875, -6.563867568969727, -6.242267608642578, -5.9206671714782715, -5.599066734313965, -5.277466773986816, -4.955866813659668, -4.634266376495361, -4.312665939331055, -3.9910659790039062, -3.6694657802581787, -3.347865581512451, -3.0262653827667236, -2.704665184020996, -2.3830649852752686, -2.061464786529541, -1.7398645877838135, -1.418264389038086, -1.0966641902923584, -0.7750639915466309, -0.4534637928009033, -0.13186359405517578, 0.18973660469055176, 0.5113368034362793, 0.8329370021820068, 1.1545372009277344, 1.476137399673462, 1.7977375984191895, 2.119337797164917, 2.4409379959106445, 2.762538194656372, 3.0841383934020996, 3.405738592147827, 3.7273387908935547, 4.048938751220703, 4.37053918838501, 4.692139625549316, 5.013739585876465, 5.335339546203613, 5.65693998336792, 5.978540420532227, 6.300140380859375, 6.621740341186523, 6.94334077835083, 7.264941215515137, 7.586541175842285, 7.908141136169434, 8.229742050170898, 8.551342010498047, 8.872941970825195]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 5.0, 3.0, 7.0, 5.0, 11.0, 5.0, 11.0, 10.0, 19.0, 24.0, 31.0, 21.0, 26.0, 38.0, 32.0, 43.0, 40.0, 38.0, 36.0, 45.0, 40.0, 39.0, 46.0, 41.0, 38.0, 37.0, 40.0, 33.0, 32.0, 35.0, 27.0, 23.0, 23.0, 18.0, 15.0, 13.0, 14.0, 6.0, 8.0, 8.0, 10.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.32787561416626, -7.113492012023926, -6.899107933044434, -6.6847243309021, -6.470340728759766, -6.255956649780273, -6.0415730476379395, -5.8271894454956055, -5.6128058433532715, -5.3984222412109375, -5.184038162231445, -4.969654560089111, -4.755270957946777, -4.540886878967285, -4.326503276824951, -4.112119674682617, -3.897735834121704, -3.683351993560791, -3.468968391418457, -3.254584550857544, -3.04020094871521, -2.825817108154297, -2.611433506011963, -2.39704966545105, -2.1826658248901367, -1.9682821035385132, -1.7538983821868896, -1.5395145416259766, -1.3251309394836426, -1.1107470989227295, -0.896363377571106, -0.6819796562194824, -0.46759605407714844, -0.2532123327255249, -0.03882858157157898, 0.17555516958236694, 0.3899388909339905, 0.6043226718902588, 0.8187063932418823, 1.0330901145935059, 1.2474738359451294, 1.461857557296753, 1.6762412786483765, 1.890625, 2.105008840560913, 2.319392681121826, 2.53377628326416, 2.748159885406494, 2.9625437259674072, 3.1769275665283203, 3.3913111686706543, 3.6056950092315674, 3.8200786113739014, 4.0344624519348145, 4.248846054077148, 4.463230133056641, 4.677613735198975, 4.891997337341309, 5.106381416320801, 5.320765018463135, 5.535148620605469, 5.749532699584961, 5.963916301727295, 6.178299903869629, 6.392683506011963]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 16.0, 11.0, 25.0, 29.0, 55.0, 91.0, 188.0, 371.0, 878.0, 2198.0, 6113.0, 19278.0, 69907.0, 317576.0, 471201.0, 116429.0, 29703.0, 9116.0, 3060.0, 1217.0, 491.0, 261.0, 132.0, 62.0, 46.0, 23.0, 21.0, 10.0, 7.0, 12.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.79296875, -3.675079345703125, -3.55718994140625, -3.439300537109375, -3.3214111328125, -3.203521728515625, -3.08563232421875, -2.967742919921875, -2.849853515625, -2.731964111328125, -2.61407470703125, -2.496185302734375, -2.3782958984375, -2.260406494140625, -2.14251708984375, -2.024627685546875, -1.90673828125, -1.788848876953125, -1.67095947265625, -1.553070068359375, -1.4351806640625, -1.317291259765625, -1.19940185546875, -1.081512451171875, -0.963623046875, -0.845733642578125, -0.72784423828125, -0.609954833984375, -0.4920654296875, -0.374176025390625, -0.25628662109375, -0.138397216796875, -0.0205078125, 0.097381591796875, 0.21527099609375, 0.333160400390625, 0.4510498046875, 0.568939208984375, 0.68682861328125, 0.804718017578125, 0.922607421875, 1.040496826171875, 1.15838623046875, 1.276275634765625, 1.3941650390625, 1.512054443359375, 1.62994384765625, 1.747833251953125, 1.86572265625, 1.983612060546875, 2.10150146484375, 2.219390869140625, 2.3372802734375, 2.455169677734375, 2.57305908203125, 2.690948486328125, 2.808837890625, 2.926727294921875, 3.04461669921875, 3.162506103515625, 3.2803955078125, 3.398284912109375, 3.51617431640625, 3.634063720703125, 3.751953125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 2.0, 5.0, 10.0, 10.0, 13.0, 22.0, 6.0, 22.0, 25.0, 30.0, 33.0, 31.0, 28.0, 45.0, 41.0, 46.0, 37.0, 46.0, 48.0, 39.0, 42.0, 46.0, 39.0, 42.0, 32.0, 39.0, 39.0, 23.0, 19.0, 22.0, 19.0, 18.0, 16.0, 14.0, 8.0, 6.0, 2.0, 6.0, 9.0, 3.0, 6.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.25390625, -4.12457275390625, -3.9952392578125, -3.86590576171875, -3.736572265625, -3.60723876953125, -3.4779052734375, -3.34857177734375, -3.21923828125, -3.08990478515625, -2.9605712890625, -2.83123779296875, -2.701904296875, -2.57257080078125, -2.4432373046875, -2.31390380859375, -2.1845703125, -2.05523681640625, -1.9259033203125, -1.79656982421875, -1.667236328125, -1.53790283203125, -1.4085693359375, -1.27923583984375, -1.14990234375, -1.02056884765625, -0.8912353515625, -0.76190185546875, -0.632568359375, -0.50323486328125, -0.3739013671875, -0.24456787109375, -0.115234375, 0.01409912109375, 0.1434326171875, 0.27276611328125, 0.402099609375, 0.53143310546875, 0.6607666015625, 0.79010009765625, 0.91943359375, 1.04876708984375, 1.1781005859375, 1.30743408203125, 1.436767578125, 1.56610107421875, 1.6954345703125, 1.82476806640625, 1.9541015625, 2.08343505859375, 2.2127685546875, 2.34210205078125, 2.471435546875, 2.60076904296875, 2.7301025390625, 2.85943603515625, 2.98876953125, 3.11810302734375, 3.2474365234375, 3.37677001953125, 3.506103515625, 3.63543701171875, 3.7647705078125, 3.89410400390625, 4.0234375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 6.0, 14.0, 12.0, 18.0, 31.0, 40.0, 68.0, 95.0, 151.0, 276.0, 499.0, 960.0, 2392.0, 6253.0, 20327.0, 75754.0, 343366.0, 449668.0, 107409.0, 27582.0, 8198.0, 2912.0, 1200.0, 555.0, 297.0, 175.0, 100.0, 47.0, 46.0, 39.0, 17.0, 18.0, 13.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.943359375, -2.84564208984375, -2.7479248046875, -2.65020751953125, -2.552490234375, -2.45477294921875, -2.3570556640625, -2.25933837890625, -2.16162109375, -2.06390380859375, -1.9661865234375, -1.86846923828125, -1.770751953125, -1.67303466796875, -1.5753173828125, -1.47760009765625, -1.3798828125, -1.28216552734375, -1.1844482421875, -1.08673095703125, -0.989013671875, -0.89129638671875, -0.7935791015625, -0.69586181640625, -0.59814453125, -0.50042724609375, -0.4027099609375, -0.30499267578125, -0.207275390625, -0.10955810546875, -0.0118408203125, 0.08587646484375, 0.18359375, 0.28131103515625, 0.3790283203125, 0.47674560546875, 0.574462890625, 0.67218017578125, 0.7698974609375, 0.86761474609375, 0.96533203125, 1.06304931640625, 1.1607666015625, 1.25848388671875, 1.356201171875, 1.45391845703125, 1.5516357421875, 1.64935302734375, 1.7470703125, 1.84478759765625, 1.9425048828125, 2.04022216796875, 2.137939453125, 2.23565673828125, 2.3333740234375, 2.43109130859375, 2.52880859375, 2.62652587890625, 2.7242431640625, 2.82196044921875, 2.919677734375, 3.01739501953125, 3.1151123046875, 3.21282958984375, 3.310546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 6.0, 7.0, 8.0, 10.0, 14.0, 14.0, 10.0, 9.0, 22.0, 21.0, 26.0, 29.0, 33.0, 30.0, 36.0, 38.0, 38.0, 42.0, 41.0, 43.0, 45.0, 42.0, 30.0, 51.0, 37.0, 41.0, 38.0, 23.0, 29.0, 20.0, 27.0, 18.0, 27.0, 15.0, 10.0, 15.0, 8.0, 6.0, 9.0, 7.0, 4.0, 3.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 3.0], "bins": [-8.28125, -8.0491943359375, -7.817138671875, -7.5850830078125, -7.35302734375, -7.1209716796875, -6.888916015625, -6.6568603515625, -6.4248046875, -6.1927490234375, -5.960693359375, -5.7286376953125, -5.49658203125, -5.2645263671875, -5.032470703125, -4.8004150390625, -4.568359375, -4.3363037109375, -4.104248046875, -3.8721923828125, -3.64013671875, -3.4080810546875, -3.176025390625, -2.9439697265625, -2.7119140625, -2.4798583984375, -2.247802734375, -2.0157470703125, -1.78369140625, -1.5516357421875, -1.319580078125, -1.0875244140625, -0.85546875, -0.6234130859375, -0.391357421875, -0.1593017578125, 0.07275390625, 0.3048095703125, 0.536865234375, 0.7689208984375, 1.0009765625, 1.2330322265625, 1.465087890625, 1.6971435546875, 1.92919921875, 2.1612548828125, 2.393310546875, 2.6253662109375, 2.857421875, 3.0894775390625, 3.321533203125, 3.5535888671875, 3.78564453125, 4.0177001953125, 4.249755859375, 4.4818115234375, 4.7138671875, 4.9459228515625, 5.177978515625, 5.4100341796875, 5.64208984375, 5.8741455078125, 6.106201171875, 6.3382568359375, 6.5703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 7.0, 14.0, 23.0, 25.0, 38.0, 53.0, 78.0, 111.0, 193.0, 302.0, 550.0, 993.0, 1811.0, 3693.0, 8037.0, 19232.0, 54531.0, 178331.0, 420668.0, 242247.0, 73145.0, 25079.0, 9929.0, 4435.0, 2212.0, 1154.0, 667.0, 366.0, 189.0, 157.0, 87.0, 63.0, 36.0, 29.0, 20.0, 16.0, 5.0, 5.0, 7.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7802734375, -0.7520294189453125, -0.723785400390625, -0.6955413818359375, -0.66729736328125, -0.6390533447265625, -0.610809326171875, -0.5825653076171875, -0.5543212890625, -0.5260772705078125, -0.497833251953125, -0.4695892333984375, -0.44134521484375, -0.4131011962890625, -0.384857177734375, -0.3566131591796875, -0.328369140625, -0.3001251220703125, -0.271881103515625, -0.2436370849609375, -0.21539306640625, -0.1871490478515625, -0.158905029296875, -0.1306610107421875, -0.1024169921875, -0.0741729736328125, -0.045928955078125, -0.0176849365234375, 0.01055908203125, 0.0388031005859375, 0.067047119140625, 0.0952911376953125, 0.12353515625, 0.1517791748046875, 0.180023193359375, 0.2082672119140625, 0.23651123046875, 0.2647552490234375, 0.292999267578125, 0.3212432861328125, 0.3494873046875, 0.3777313232421875, 0.405975341796875, 0.4342193603515625, 0.46246337890625, 0.4907073974609375, 0.518951416015625, 0.5471954345703125, 0.575439453125, 0.6036834716796875, 0.631927490234375, 0.6601715087890625, 0.68841552734375, 0.7166595458984375, 0.744903564453125, 0.7731475830078125, 0.8013916015625, 0.8296356201171875, 0.857879638671875, 0.8861236572265625, 0.91436767578125, 0.9426116943359375, 0.970855712890625, 0.9990997314453125, 1.02734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 1.0, 7.0, 6.0, 7.0, 7.0, 13.0, 13.0, 22.0, 30.0, 44.0, 45.0, 64.0, 107.0, 93.0, 108.0, 98.0, 80.0, 64.0, 50.0, 27.0, 27.0, 20.0, 15.0, 14.0, 12.0, 3.0, 7.0, 8.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006265640258789062, -0.0006082430481910706, -0.0005899220705032349, -0.0005716010928153992, -0.0005532801151275635, -0.0005349591374397278, -0.0005166381597518921, -0.0004983171820640564, -0.0004799962043762207, -0.000461675226688385, -0.0004433542490005493, -0.0004250332713127136, -0.00040671229362487793, -0.00038839131593704224, -0.00037007033824920654, -0.00035174936056137085, -0.00033342838287353516, -0.00031510740518569946, -0.00029678642749786377, -0.0002784654498100281, -0.0002601444721221924, -0.0002418234944343567, -0.000223502516746521, -0.0002051815390586853, -0.0001868605613708496, -0.00016853958368301392, -0.00015021860599517822, -0.00013189762830734253, -0.00011357665061950684, -9.525567293167114e-05, -7.693469524383545e-05, -5.8613717555999756e-05, -4.029273986816406e-05, -2.197176218032837e-05, -3.6507844924926758e-06, 1.4670193195343018e-05, 3.299117088317871e-05, 5.1312148571014404e-05, 6.96331262588501e-05, 8.795410394668579e-05, 0.00010627508163452148, 0.00012459605932235718, 0.00014291703701019287, 0.00016123801469802856, 0.00017955899238586426, 0.00019787997007369995, 0.00021620094776153564, 0.00023452192544937134, 0.00025284290313720703, 0.0002711638808250427, 0.0002894848585128784, 0.0003078058362007141, 0.0003261268138885498, 0.0003444477915763855, 0.0003627687692642212, 0.0003810897469520569, 0.0003994107246398926, 0.00041773170232772827, 0.00043605268001556396, 0.00045437365770339966, 0.00047269463539123535, 0.000491015613079071, 0.0005093365907669067, 0.0005276575684547424, 0.0005459785461425781]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 7.0, 9.0, 7.0, 11.0, 22.0, 28.0, 28.0, 41.0, 58.0, 142.0, 238.0, 400.0, 713.0, 1528.0, 3156.0, 7275.0, 17895.0, 52231.0, 188679.0, 458080.0, 222837.0, 60117.0, 20077.0, 8005.0, 3450.0, 1629.0, 811.0, 451.0, 239.0, 146.0, 79.0, 41.0, 41.0, 22.0, 17.0, 6.0, 12.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.93505859375, -0.9011306762695312, -0.8672027587890625, -0.8332748413085938, -0.799346923828125, -0.7654190063476562, -0.7314910888671875, -0.6975631713867188, -0.66363525390625, -0.6297073364257812, -0.5957794189453125, -0.5618515014648438, -0.527923583984375, -0.49399566650390625, -0.4600677490234375, -0.42613983154296875, -0.3922119140625, -0.35828399658203125, -0.3243560791015625, -0.29042816162109375, -0.256500244140625, -0.22257232666015625, -0.1886444091796875, -0.15471649169921875, -0.12078857421875, -0.08686065673828125, -0.0529327392578125, -0.01900482177734375, 0.014923095703125, 0.04885101318359375, 0.0827789306640625, 0.11670684814453125, 0.150634765625, 0.18456268310546875, 0.2184906005859375, 0.25241851806640625, 0.286346435546875, 0.32027435302734375, 0.3542022705078125, 0.38813018798828125, 0.42205810546875, 0.45598602294921875, 0.4899139404296875, 0.5238418579101562, 0.557769775390625, 0.5916976928710938, 0.6256256103515625, 0.6595535278320312, 0.6934814453125, 0.7274093627929688, 0.7613372802734375, 0.7952651977539062, 0.829193115234375, 0.8631210327148438, 0.8970489501953125, 0.9309768676757812, 0.96490478515625, 0.9988327026367188, 1.0327606201171875, 1.0666885375976562, 1.100616455078125, 1.1345443725585938, 1.1684722900390625, 1.2024002075195312, 1.236328125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 2.0, 3.0, 4.0, 8.0, 14.0, 11.0, 12.0, 18.0, 30.0, 34.0, 35.0, 48.0, 54.0, 51.0, 80.0, 83.0, 78.0, 81.0, 84.0, 49.0, 57.0, 35.0, 32.0, 16.0, 22.0, 14.0, 6.0, 9.0, 4.0, 4.0, 7.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.304931640625, -0.29500579833984375, -0.2850799560546875, -0.27515411376953125, -0.265228271484375, -0.25530242919921875, -0.2453765869140625, -0.23545074462890625, -0.22552490234375, -0.21559906005859375, -0.2056732177734375, -0.19574737548828125, -0.185821533203125, -0.17589569091796875, -0.1659698486328125, -0.15604400634765625, -0.1461181640625, -0.13619232177734375, -0.1262664794921875, -0.11634063720703125, -0.106414794921875, -0.09648895263671875, -0.0865631103515625, -0.07663726806640625, -0.06671142578125, -0.05678558349609375, -0.0468597412109375, -0.03693389892578125, -0.027008056640625, -0.01708221435546875, -0.0071563720703125, 0.00276947021484375, 0.0126953125, 0.02262115478515625, 0.0325469970703125, 0.04247283935546875, 0.052398681640625, 0.06232452392578125, 0.0722503662109375, 0.08217620849609375, 0.09210205078125, 0.10202789306640625, 0.1119537353515625, 0.12187957763671875, 0.131805419921875, 0.14173126220703125, 0.1516571044921875, 0.16158294677734375, 0.1715087890625, 0.18143463134765625, 0.1913604736328125, 0.20128631591796875, 0.211212158203125, 0.22113800048828125, 0.2310638427734375, 0.24098968505859375, 0.25091552734375, 0.26084136962890625, 0.2707672119140625, 0.28069305419921875, 0.290618896484375, 0.30054473876953125, 0.3104705810546875, 0.32039642333984375, 0.330322265625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 7.0, 9.0, 12.0, 9.0, 9.0, 22.0, 30.0, 30.0, 58.0, 74.0, 101.0, 108.0, 129.0, 80.0, 72.0, 78.0, 43.0, 42.0, 35.0, 17.0, 16.0, 6.0, 10.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.241601943969727, -7.002431392669678, -6.763261318206787, -6.524090766906738, -6.284920692443848, -6.045750141143799, -5.806580066680908, -5.567409515380859, -5.328239440917969, -5.08906888961792, -4.849898815155029, -4.6107282638549805, -4.37155818939209, -4.132387638092041, -3.8932175636291504, -3.6540470123291016, -3.414876699447632, -3.175706386566162, -2.9365360736846924, -2.6973657608032227, -2.458195447921753, -2.219025135040283, -1.979854702949524, -1.7406843900680542, -1.5015140771865845, -1.2623437643051147, -1.023173451423645, -0.7840030789375305, -0.5448327660560608, -0.3056623935699463, -0.06649208068847656, 0.17267823219299316, 0.4118485450744629, 0.6510188579559326, 0.8901891708374023, 1.129359483718872, 1.3685297966003418, 1.607700228691101, 1.8468705415725708, 2.08604097366333, 2.3252110481262207, 2.5643813610076904, 2.80355167388916, 3.04272198677063, 3.2818922996520996, 3.5210628509521484, 3.760232925415039, 3.999403476715088, 4.238574028015137, 4.4777445793151855, 4.716914653778076, 4.956085205078125, 5.195255279541016, 5.4344258308410645, 5.673595905303955, 5.912766456604004, 6.1519365310668945, 6.391107082366943, 6.630277156829834, 6.869447708129883, 7.108617782592773, 7.347788333892822, 7.586958408355713, 7.826128959655762, 8.065299034118652]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 7.0, 2.0, 3.0, 6.0, 8.0, 10.0, 12.0, 11.0, 14.0, 17.0, 26.0, 22.0, 24.0, 32.0, 44.0, 33.0, 47.0, 42.0, 41.0, 51.0, 42.0, 48.0, 43.0, 43.0, 39.0, 36.0, 34.0, 42.0, 40.0, 27.0, 29.0, 21.0, 19.0, 18.0, 12.0, 17.0, 12.0, 8.0, 6.0, 5.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-4.603539943695068, -4.472345352172852, -4.341151237487793, -4.209956645965576, -4.078762054443359, -3.9475677013397217, -3.816373348236084, -3.685178756713867, -3.5539844036102295, -3.422790050506592, -3.291595458984375, -3.1604011058807373, -3.0292067527770996, -2.898012161254883, -2.766817808151245, -2.6356234550476074, -2.5044288635253906, -2.373234510421753, -2.242039918899536, -2.1108455657958984, -1.9796510934829712, -1.848456621170044, -1.7172622680664062, -1.586067795753479, -1.4548733234405518, -1.3236788511276245, -1.1924843788146973, -1.0612900257110596, -0.9300955533981323, -0.7989010810852051, -0.6677066683769226, -0.5365122556686401, -0.405318021774292, -0.27412357926368713, -0.14292913675308228, -0.011734694242477417, 0.11945974826812744, 0.2506542205810547, 0.38184863328933716, 0.5130430459976196, 0.6442375183105469, 0.7754319906234741, 0.9066264033317566, 1.037820816040039, 1.1690152883529663, 1.3002097606658936, 1.4314041137695312, 1.5625985860824585, 1.6937930583953857, 1.824987530708313, 1.9561820030212402, 2.087376356124878, 2.2185707092285156, 2.3497653007507324, 2.48095965385437, 2.612154006958008, 2.7433485984802246, 2.8745429515838623, 3.005737543106079, 3.136931896209717, 3.2681264877319336, 3.3993208408355713, 3.530515193939209, 3.661709785461426, 3.7929041385650635]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 7.0, 11.0, 33.0, 51.0, 72.0, 138.0, 243.0, 542.0, 1120.0, 2528.0, 6383.0, 17727.0, 55720.0, 202793.0, 494351.0, 187837.0, 51737.0, 16514.0, 6122.0, 2451.0, 1070.0, 533.0, 238.0, 122.0, 75.0, 31.0, 33.0, 19.0, 9.0, 8.0, 1.0, 3.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.15625, -5.96063232421875, -5.7650146484375, -5.56939697265625, -5.373779296875, -5.17816162109375, -4.9825439453125, -4.78692626953125, -4.59130859375, -4.39569091796875, -4.2000732421875, -4.00445556640625, -3.808837890625, -3.61322021484375, -3.4176025390625, -3.22198486328125, -3.0263671875, -2.83074951171875, -2.6351318359375, -2.43951416015625, -2.243896484375, -2.04827880859375, -1.8526611328125, -1.65704345703125, -1.46142578125, -1.26580810546875, -1.0701904296875, -0.87457275390625, -0.678955078125, -0.48333740234375, -0.2877197265625, -0.09210205078125, 0.103515625, 0.29913330078125, 0.4947509765625, 0.69036865234375, 0.885986328125, 1.08160400390625, 1.2772216796875, 1.47283935546875, 1.66845703125, 1.86407470703125, 2.0596923828125, 2.25531005859375, 2.450927734375, 2.64654541015625, 2.8421630859375, 3.03778076171875, 3.2333984375, 3.42901611328125, 3.6246337890625, 3.82025146484375, 4.015869140625, 4.21148681640625, 4.4071044921875, 4.60272216796875, 4.79833984375, 4.99395751953125, 5.1895751953125, 5.38519287109375, 5.580810546875, 5.77642822265625, 5.9720458984375, 6.16766357421875, 6.36328125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 9.0, 12.0, 15.0, 11.0, 14.0, 14.0, 19.0, 25.0, 36.0, 44.0, 35.0, 46.0, 34.0, 47.0, 42.0, 57.0, 46.0, 50.0, 56.0, 47.0, 32.0, 42.0, 48.0, 38.0, 24.0, 23.0, 27.0, 20.0, 17.0, 19.0, 13.0, 5.0, 5.0, 5.0, 4.0, 8.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5625, -9.260986328125, -8.95947265625, -8.657958984375, -8.3564453125, -8.054931640625, -7.75341796875, -7.451904296875, -7.150390625, -6.848876953125, -6.54736328125, -6.245849609375, -5.9443359375, -5.642822265625, -5.34130859375, -5.039794921875, -4.73828125, -4.436767578125, -4.13525390625, -3.833740234375, -3.5322265625, -3.230712890625, -2.92919921875, -2.627685546875, -2.326171875, -2.024658203125, -1.72314453125, -1.421630859375, -1.1201171875, -0.818603515625, -0.51708984375, -0.215576171875, 0.0859375, 0.387451171875, 0.68896484375, 0.990478515625, 1.2919921875, 1.593505859375, 1.89501953125, 2.196533203125, 2.498046875, 2.799560546875, 3.10107421875, 3.402587890625, 3.7041015625, 4.005615234375, 4.30712890625, 4.608642578125, 4.91015625, 5.211669921875, 5.51318359375, 5.814697265625, 6.1162109375, 6.417724609375, 6.71923828125, 7.020751953125, 7.322265625, 7.623779296875, 7.92529296875, 8.226806640625, 8.5283203125, 8.829833984375, 9.13134765625, 9.432861328125, 9.734375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 6.0, 4.0, 6.0, 5.0, 11.0, 20.0, 17.0, 21.0, 27.0, 16.0, 27.0, 34.0, 36.0, 59.0, 77.0, 106.0, 335.0, 8689.0, 993840.0, 44085.0, 596.0, 140.0, 83.0, 50.0, 41.0, 28.0, 32.0, 25.0, 29.0, 28.0, 21.0, 15.0, 12.0, 7.0, 9.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-35.90625, -34.952392578125, -33.99853515625, -33.044677734375, -32.0908203125, -31.136962890625, -30.18310546875, -29.229248046875, -28.275390625, -27.321533203125, -26.36767578125, -25.413818359375, -24.4599609375, -23.506103515625, -22.55224609375, -21.598388671875, -20.64453125, -19.690673828125, -18.73681640625, -17.782958984375, -16.8291015625, -15.875244140625, -14.92138671875, -13.967529296875, -13.013671875, -12.059814453125, -11.10595703125, -10.152099609375, -9.1982421875, -8.244384765625, -7.29052734375, -6.336669921875, -5.3828125, -4.428955078125, -3.47509765625, -2.521240234375, -1.5673828125, -0.613525390625, 0.34033203125, 1.294189453125, 2.248046875, 3.201904296875, 4.15576171875, 5.109619140625, 6.0634765625, 7.017333984375, 7.97119140625, 8.925048828125, 9.87890625, 10.832763671875, 11.78662109375, 12.740478515625, 13.6943359375, 14.648193359375, 15.60205078125, 16.555908203125, 17.509765625, 18.463623046875, 19.41748046875, 20.371337890625, 21.3251953125, 22.279052734375, 23.23291015625, 24.186767578125, 25.140625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 9.0, 8.0, 3.0, 6.0, 11.0, 17.0, 14.0, 26.0, 16.0, 23.0, 26.0, 39.0, 38.0, 37.0, 38.0, 48.0, 47.0, 49.0, 38.0, 43.0, 45.0, 40.0, 51.0, 35.0, 26.0, 47.0, 40.0, 23.0, 17.0, 33.0, 19.0, 19.0, 17.0, 15.0, 7.0, 8.0, 6.0, 4.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0], "bins": [-11.5, -11.19610595703125, -10.8922119140625, -10.58831787109375, -10.284423828125, -9.98052978515625, -9.6766357421875, -9.37274169921875, -9.06884765625, -8.76495361328125, -8.4610595703125, -8.15716552734375, -7.853271484375, -7.54937744140625, -7.2454833984375, -6.94158935546875, -6.6376953125, -6.33380126953125, -6.0299072265625, -5.72601318359375, -5.422119140625, -5.11822509765625, -4.8143310546875, -4.51043701171875, -4.20654296875, -3.90264892578125, -3.5987548828125, -3.29486083984375, -2.990966796875, -2.68707275390625, -2.3831787109375, -2.07928466796875, -1.775390625, -1.47149658203125, -1.1676025390625, -0.86370849609375, -0.559814453125, -0.25592041015625, 0.0479736328125, 0.35186767578125, 0.65576171875, 0.95965576171875, 1.2635498046875, 1.56744384765625, 1.871337890625, 2.17523193359375, 2.4791259765625, 2.78302001953125, 3.0869140625, 3.39080810546875, 3.6947021484375, 3.99859619140625, 4.302490234375, 4.60638427734375, 4.9102783203125, 5.21417236328125, 5.51806640625, 5.82196044921875, 6.1258544921875, 6.42974853515625, 6.733642578125, 7.03753662109375, 7.3414306640625, 7.64532470703125, 7.94921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 10.0, 16.0, 21.0, 24.0, 37.0, 58.0, 119.0, 154.0, 272.0, 427.0, 744.0, 1422.0, 2943.0, 7316.0, 21109.0, 83156.0, 464339.0, 370494.0, 66097.0, 17693.0, 6317.0, 2733.0, 1318.0, 705.0, 374.0, 202.0, 131.0, 112.0, 65.0, 46.0, 26.0, 16.0, 15.0, 9.0, 7.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.037109375, -1.973297119140625, -1.90948486328125, -1.845672607421875, -1.7818603515625, -1.718048095703125, -1.65423583984375, -1.590423583984375, -1.526611328125, -1.462799072265625, -1.39898681640625, -1.335174560546875, -1.2713623046875, -1.207550048828125, -1.14373779296875, -1.079925537109375, -1.01611328125, -0.952301025390625, -0.88848876953125, -0.824676513671875, -0.7608642578125, -0.697052001953125, -0.63323974609375, -0.569427490234375, -0.505615234375, -0.441802978515625, -0.37799072265625, -0.314178466796875, -0.2503662109375, -0.186553955078125, -0.12274169921875, -0.058929443359375, 0.0048828125, 0.068695068359375, 0.13250732421875, 0.196319580078125, 0.2601318359375, 0.323944091796875, 0.38775634765625, 0.451568603515625, 0.515380859375, 0.579193115234375, 0.64300537109375, 0.706817626953125, 0.7706298828125, 0.834442138671875, 0.89825439453125, 0.962066650390625, 1.02587890625, 1.089691162109375, 1.15350341796875, 1.217315673828125, 1.2811279296875, 1.344940185546875, 1.40875244140625, 1.472564697265625, 1.536376953125, 1.600189208984375, 1.66400146484375, 1.727813720703125, 1.7916259765625, 1.855438232421875, 1.91925048828125, 1.983062744140625, 2.046875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 3.0, 6.0, 10.0, 7.0, 9.0, 10.0, 22.0, 15.0, 23.0, 26.0, 36.0, 51.0, 62.0, 77.0, 82.0, 99.0, 89.0, 77.0, 67.0, 43.0, 44.0, 30.0, 24.0, 12.0, 17.0, 14.0, 11.0, 6.0, 3.0, 4.0, 7.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00027942657470703125, -0.00027058646082878113, -0.000261746346950531, -0.0002529062330722809, -0.00024406611919403076, -0.00023522600531578064, -0.00022638589143753052, -0.0002175457775592804, -0.00020870566368103027, -0.00019986554980278015, -0.00019102543592453003, -0.0001821853220462799, -0.00017334520816802979, -0.00016450509428977966, -0.00015566498041152954, -0.00014682486653327942, -0.0001379847526550293, -0.00012914463877677917, -0.00012030452489852905, -0.00011146441102027893, -0.00010262429714202881, -9.378418326377869e-05, -8.494406938552856e-05, -7.610395550727844e-05, -6.726384162902832e-05, -5.84237277507782e-05, -4.9583613872528076e-05, -4.0743499994277954e-05, -3.190338611602783e-05, -2.306327223777771e-05, -1.4223158359527588e-05, -5.383044481277466e-06, 3.4570693969726562e-06, 1.2297183275222778e-05, 2.11372971534729e-05, 2.9977411031723022e-05, 3.8817524909973145e-05, 4.7657638788223267e-05, 5.649775266647339e-05, 6.533786654472351e-05, 7.417798042297363e-05, 8.301809430122375e-05, 9.185820817947388e-05, 0.000100698322057724, 0.00010953843593597412, 0.00011837854981422424, 0.00012721866369247437, 0.0001360587775707245, 0.0001448988914489746, 0.00015373900532722473, 0.00016257911920547485, 0.00017141923308372498, 0.0001802593469619751, 0.00018909946084022522, 0.00019793957471847534, 0.00020677968859672546, 0.00021561980247497559, 0.0002244599163532257, 0.00023330003023147583, 0.00024214014410972595, 0.0002509802579879761, 0.0002598203718662262, 0.0002686604857444763, 0.00027750059962272644, 0.00028634071350097656]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 12.0, 22.0, 13.0, 34.0, 41.0, 65.0, 116.0, 181.0, 287.0, 477.0, 851.0, 1555.0, 3483.0, 8932.0, 29723.0, 132804.0, 549191.0, 248407.0, 49566.0, 13455.0, 4659.0, 2071.0, 1020.0, 639.0, 339.0, 213.0, 136.0, 80.0, 56.0, 25.0, 33.0, 19.0, 14.0, 7.0, 7.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.07421875, -2.0107574462890625, -1.947296142578125, -1.8838348388671875, -1.82037353515625, -1.7569122314453125, -1.693450927734375, -1.6299896240234375, -1.5665283203125, -1.5030670166015625, -1.439605712890625, -1.3761444091796875, -1.31268310546875, -1.2492218017578125, -1.185760498046875, -1.1222991943359375, -1.058837890625, -0.9953765869140625, -0.931915283203125, -0.8684539794921875, -0.80499267578125, -0.7415313720703125, -0.678070068359375, -0.6146087646484375, -0.5511474609375, -0.4876861572265625, -0.424224853515625, -0.3607635498046875, -0.29730224609375, -0.2338409423828125, -0.170379638671875, -0.1069183349609375, -0.04345703125, 0.0200042724609375, 0.083465576171875, 0.1469268798828125, 0.21038818359375, 0.2738494873046875, 0.337310791015625, 0.4007720947265625, 0.4642333984375, 0.5276947021484375, 0.591156005859375, 0.6546173095703125, 0.71807861328125, 0.7815399169921875, 0.845001220703125, 0.9084625244140625, 0.971923828125, 1.0353851318359375, 1.098846435546875, 1.1623077392578125, 1.22576904296875, 1.2892303466796875, 1.352691650390625, 1.4161529541015625, 1.4796142578125, 1.5430755615234375, 1.606536865234375, 1.6699981689453125, 1.73345947265625, 1.7969207763671875, 1.860382080078125, 1.9238433837890625, 1.9873046875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 5.0, 5.0, 9.0, 7.0, 16.0, 16.0, 18.0, 34.0, 25.0, 55.0, 55.0, 70.0, 86.0, 93.0, 113.0, 77.0, 64.0, 58.0, 60.0, 26.0, 26.0, 18.0, 9.0, 12.0, 5.0, 3.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78955078125, -0.7613449096679688, -0.7331390380859375, -0.7049331665039062, -0.676727294921875, -0.6485214233398438, -0.6203155517578125, -0.5921096801757812, -0.56390380859375, -0.5356979370117188, -0.5074920654296875, -0.47928619384765625, -0.451080322265625, -0.42287445068359375, -0.3946685791015625, -0.36646270751953125, -0.3382568359375, -0.31005096435546875, -0.2818450927734375, -0.25363922119140625, -0.225433349609375, -0.19722747802734375, -0.1690216064453125, -0.14081573486328125, -0.11260986328125, -0.08440399169921875, -0.0561981201171875, -0.02799224853515625, 0.000213623046875, 0.02841949462890625, 0.0566253662109375, 0.08483123779296875, 0.113037109375, 0.14124298095703125, 0.1694488525390625, 0.19765472412109375, 0.225860595703125, 0.25406646728515625, 0.2822723388671875, 0.31047821044921875, 0.33868408203125, 0.36688995361328125, 0.3950958251953125, 0.42330169677734375, 0.451507568359375, 0.47971343994140625, 0.5079193115234375, 0.5361251831054688, 0.5643310546875, 0.5925369262695312, 0.6207427978515625, 0.6489486694335938, 0.677154541015625, 0.7053604125976562, 0.7335662841796875, 0.7617721557617188, 0.78997802734375, 0.8181838989257812, 0.8463897705078125, 0.8745956420898438, 0.902801513671875, 0.9310073852539062, 0.9592132568359375, 0.9874191284179688, 1.015625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 16.0, 23.0, 27.0, 65.0, 104.0, 143.0, 144.0, 150.0, 105.0, 69.0, 59.0, 33.0, 24.0, 17.0, 7.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.5211181640625, -27.821117401123047, -27.121116638183594, -26.42111587524414, -25.721115112304688, -25.021114349365234, -24.32111358642578, -23.621112823486328, -22.921112060546875, -22.221111297607422, -21.52111053466797, -20.821109771728516, -20.121109008789062, -19.42110824584961, -18.721107482910156, -18.021106719970703, -17.321104049682617, -16.621103286743164, -15.921102523803711, -15.221101760864258, -14.521100997924805, -13.821100234985352, -13.121098518371582, -12.421097755432129, -11.721096992492676, -11.021096229553223, -10.32109546661377, -9.62109375, -8.921092987060547, -8.221092224121094, -7.521091461181641, -6.8210906982421875, -6.121088027954102, -5.421087265014648, -4.721086502075195, -4.021085262298584, -3.321084499359131, -2.6210837364196777, -1.9210824966430664, -1.2210817337036133, -0.5210809707641602, 0.17891991138458252, 0.8789207935333252, 1.5789217948913574, 2.2789225578308105, 2.9789233207702637, 3.678924560546875, 4.378925323486328, 5.078926086425781, 5.778926849365234, 6.4789276123046875, 7.178928852081299, 7.878929615020752, 8.578929901123047, 9.278931617736816, 9.97893238067627, 10.678933143615723, 11.378933906555176, 12.078934669494629, 12.778936386108398, 13.478937149047852, 14.178937911987305, 14.878938674926758, 15.578939437866211, 16.278940200805664]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 9.0, 8.0, 4.0, 12.0, 9.0, 17.0, 21.0, 16.0, 21.0, 19.0, 29.0, 36.0, 45.0, 30.0, 38.0, 43.0, 42.0, 22.0, 47.0, 37.0, 33.0, 38.0, 41.0, 41.0, 36.0, 34.0, 41.0, 24.0, 25.0, 30.0, 20.0, 16.0, 21.0, 16.0, 14.0, 12.0, 13.0, 11.0, 7.0, 3.0, 10.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.488299369812012, -12.049542427062988, -11.610784530639648, -11.172027587890625, -10.733270645141602, -10.294513702392578, -9.855756759643555, -9.416998863220215, -8.978241920471191, -8.539484977722168, -8.100727081298828, -7.661970138549805, -7.223213195800781, -6.784456253051758, -6.345698833465576, -5.9069414138793945, -5.468184471130371, -5.029427528381348, -4.590670108795166, -4.151912689208984, -3.713155746459961, -3.2743985652923584, -2.835641384124756, -2.3968842029571533, -1.9581270217895508, -1.5193698406219482, -1.0806126594543457, -0.6418554782867432, -0.20309829711914062, 0.23565888404846191, 0.6744160652160645, 1.113173246383667, 1.5519304275512695, 1.990687608718872, 2.4294447898864746, 2.868201971054077, 3.3069591522216797, 3.7457163333892822, 4.184473514556885, 4.623230934143066, 5.06198787689209, 5.500744819641113, 5.939502239227295, 6.378259658813477, 6.8170166015625, 7.255773544311523, 7.694530963897705, 8.133288383483887, 8.57204532623291, 9.010802268981934, 9.449560165405273, 9.888317108154297, 10.32707405090332, 10.765830993652344, 11.204587936401367, 11.643345832824707, 12.08210277557373, 12.520859718322754, 12.959617614746094, 13.398374557495117, 13.83713150024414, 14.275888442993164, 14.714645385742188, 15.153403282165527, 15.59216022491455]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 3.0, 3.0, 4.0, 10.0, 13.0, 18.0, 23.0, 33.0, 39.0, 34.0, 71.0, 146.0, 205.0, 393.0, 835.0, 2197.0, 6584.0, 25941.0, 178527.0, 2166181.0, 1648031.0, 134782.0, 21160.0, 5543.0, 1887.0, 783.0, 336.0, 189.0, 88.0, 65.0, 40.0, 20.0, 20.0, 11.0, 19.0, 11.0, 6.0, 5.0, 3.0, 4.0, 2.0, 6.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.5390625, -12.1583251953125, -11.777587890625, -11.3968505859375, -11.01611328125, -10.6353759765625, -10.254638671875, -9.8739013671875, -9.4931640625, -9.1124267578125, -8.731689453125, -8.3509521484375, -7.97021484375, -7.5894775390625, -7.208740234375, -6.8280029296875, -6.447265625, -6.0665283203125, -5.685791015625, -5.3050537109375, -4.92431640625, -4.5435791015625, -4.162841796875, -3.7821044921875, -3.4013671875, -3.0206298828125, -2.639892578125, -2.2591552734375, -1.87841796875, -1.4976806640625, -1.116943359375, -0.7362060546875, -0.35546875, 0.0252685546875, 0.406005859375, 0.7867431640625, 1.16748046875, 1.5482177734375, 1.928955078125, 2.3096923828125, 2.6904296875, 3.0711669921875, 3.451904296875, 3.8326416015625, 4.21337890625, 4.5941162109375, 4.974853515625, 5.3555908203125, 5.736328125, 6.1170654296875, 6.497802734375, 6.8785400390625, 7.25927734375, 7.6400146484375, 8.020751953125, 8.4014892578125, 8.7822265625, 9.1629638671875, 9.543701171875, 9.9244384765625, 10.30517578125, 10.6859130859375, 11.066650390625, 11.4473876953125, 11.828125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 6.0, 6.0, 12.0, 14.0, 14.0, 35.0, 30.0, 34.0, 42.0, 57.0, 51.0, 57.0, 57.0, 52.0, 61.0, 58.0, 59.0, 77.0, 40.0, 52.0, 38.0, 29.0, 24.0, 21.0, 19.0, 12.0, 16.0, 8.0, 6.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.96875, -7.72125244140625, -7.4737548828125, -7.22625732421875, -6.978759765625, -6.73126220703125, -6.4837646484375, -6.23626708984375, -5.98876953125, -5.74127197265625, -5.4937744140625, -5.24627685546875, -4.998779296875, -4.75128173828125, -4.5037841796875, -4.25628662109375, -4.0087890625, -3.76129150390625, -3.5137939453125, -3.26629638671875, -3.018798828125, -2.77130126953125, -2.5238037109375, -2.27630615234375, -2.02880859375, -1.78131103515625, -1.5338134765625, -1.28631591796875, -1.038818359375, -0.79132080078125, -0.5438232421875, -0.29632568359375, -0.048828125, 0.19866943359375, 0.4461669921875, 0.69366455078125, 0.941162109375, 1.18865966796875, 1.4361572265625, 1.68365478515625, 1.93115234375, 2.17864990234375, 2.4261474609375, 2.67364501953125, 2.921142578125, 3.16864013671875, 3.4161376953125, 3.66363525390625, 3.9111328125, 4.15863037109375, 4.4061279296875, 4.65362548828125, 4.901123046875, 5.14862060546875, 5.3961181640625, 5.64361572265625, 5.89111328125, 6.13861083984375, 6.3861083984375, 6.63360595703125, 6.881103515625, 7.12860107421875, 7.3760986328125, 7.62359619140625, 7.87109375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 8.0, 8.0, 16.0, 17.0, 21.0, 34.0, 49.0, 64.0, 104.0, 184.0, 427.0, 2815.0, 230958.0, 3942229.0, 15776.0, 912.0, 233.0, 160.0, 86.0, 51.0, 39.0, 34.0, 11.0, 7.0, 17.0, 7.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-39.0, -38.031005859375, -37.06201171875, -36.093017578125, -35.1240234375, -34.155029296875, -33.18603515625, -32.217041015625, -31.248046875, -30.279052734375, -29.31005859375, -28.341064453125, -27.3720703125, -26.403076171875, -25.43408203125, -24.465087890625, -23.49609375, -22.527099609375, -21.55810546875, -20.589111328125, -19.6201171875, -18.651123046875, -17.68212890625, -16.713134765625, -15.744140625, -14.775146484375, -13.80615234375, -12.837158203125, -11.8681640625, -10.899169921875, -9.93017578125, -8.961181640625, -7.9921875, -7.023193359375, -6.05419921875, -5.085205078125, -4.1162109375, -3.147216796875, -2.17822265625, -1.209228515625, -0.240234375, 0.728759765625, 1.69775390625, 2.666748046875, 3.6357421875, 4.604736328125, 5.57373046875, 6.542724609375, 7.51171875, 8.480712890625, 9.44970703125, 10.418701171875, 11.3876953125, 12.356689453125, 13.32568359375, 14.294677734375, 15.263671875, 16.232666015625, 17.20166015625, 18.170654296875, 19.1396484375, 20.108642578125, 21.07763671875, 22.046630859375, 23.015625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 7.0, 12.0, 16.0, 29.0, 25.0, 33.0, 38.0, 46.0, 47.0, 62.0, 85.0, 120.0, 172.0, 231.0, 317.0, 415.0, 463.0, 418.0, 397.0, 251.0, 212.0, 155.0, 118.0, 87.0, 71.0, 50.0, 33.0, 39.0, 26.0, 27.0, 14.0, 12.0, 6.0, 10.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-2.05078125, -1.9882659912109375, -1.925750732421875, -1.8632354736328125, -1.80072021484375, -1.7382049560546875, -1.675689697265625, -1.6131744384765625, -1.5506591796875, -1.4881439208984375, -1.425628662109375, -1.3631134033203125, -1.30059814453125, -1.2380828857421875, -1.175567626953125, -1.1130523681640625, -1.050537109375, -0.9880218505859375, -0.925506591796875, -0.8629913330078125, -0.80047607421875, -0.7379608154296875, -0.675445556640625, -0.6129302978515625, -0.5504150390625, -0.4878997802734375, -0.425384521484375, -0.3628692626953125, -0.30035400390625, -0.2378387451171875, -0.175323486328125, -0.1128082275390625, -0.05029296875, 0.0122222900390625, 0.074737548828125, 0.1372528076171875, 0.19976806640625, 0.2622833251953125, 0.324798583984375, 0.3873138427734375, 0.4498291015625, 0.5123443603515625, 0.574859619140625, 0.6373748779296875, 0.69989013671875, 0.7624053955078125, 0.824920654296875, 0.8874359130859375, 0.949951171875, 1.0124664306640625, 1.074981689453125, 1.1374969482421875, 1.20001220703125, 1.2625274658203125, 1.325042724609375, 1.3875579833984375, 1.4500732421875, 1.5125885009765625, 1.575103759765625, 1.6376190185546875, 1.70013427734375, 1.7626495361328125, 1.825164794921875, 1.8876800537109375, 1.9501953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 4.0, 11.0, 11.0, 15.0, 13.0, 23.0, 37.0, 45.0, 69.0, 80.0, 97.0, 114.0, 101.0, 99.0, 89.0, 57.0, 42.0, 33.0, 25.0, 13.0, 7.0, 5.0, 10.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.368906021118164, -15.976555824279785, -15.584205627441406, -15.191855430603027, -14.799505233764648, -14.407155990600586, -14.01480484008789, -13.622455596923828, -13.23010540008545, -12.83775520324707, -12.445405006408691, -12.053054809570312, -11.660704612731934, -11.268354415893555, -10.876005172729492, -10.483654975891113, -10.091304779052734, -9.698954582214355, -9.306604385375977, -8.914254188537598, -8.521903991699219, -8.129554748535156, -7.737204074859619, -7.344854354858398, -6.952503204345703, -6.560153007507324, -6.167802810668945, -5.775452613830566, -5.383102893829346, -4.990752696990967, -4.598402500152588, -4.206052780151367, -3.8137025833129883, -3.4213523864746094, -3.0290024280548096, -2.6366522312164307, -2.244302272796631, -1.851952075958252, -1.459601879119873, -1.0672519207000732, -0.6749017238616943, -0.2825516164302826, 0.10979849100112915, 0.5021486282348633, 0.8944987058639526, 1.286848783493042, 1.679198980331421, 2.0715489387512207, 2.4638991355895996, 2.8562493324279785, 3.2485992908477783, 3.6409494876861572, 4.033299446105957, 4.425649642944336, 4.817999839782715, 5.210350036621094, 5.602700233459473, 5.995050430297852, 6.3874006271362305, 6.779750823974609, 7.17210054397583, 7.564450740814209, 7.956800937652588, 8.349150657653809, 8.741500854492188]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 5.0, 10.0, 8.0, 7.0, 18.0, 14.0, 19.0, 19.0, 22.0, 25.0, 39.0, 31.0, 38.0, 45.0, 38.0, 32.0, 40.0, 47.0, 38.0, 38.0, 43.0, 37.0, 45.0, 34.0, 45.0, 32.0, 27.0, 28.0, 24.0, 20.0, 18.0, 28.0, 13.0, 13.0, 9.0, 7.0, 8.0, 7.0, 8.0, 8.0, 1.0, 2.0, 2.0, 1.0, 6.0], "bins": [-7.3510541915893555, -7.15897798538208, -6.966901779174805, -6.774825096130371, -6.582748889923096, -6.39067268371582, -6.198596000671387, -6.006519794464111, -5.814443588256836, -5.6223673820495605, -5.430291175842285, -5.238214492797852, -5.046138286590576, -4.854062080383301, -4.661985397338867, -4.469909191131592, -4.277832984924316, -4.085756778717041, -3.8936803340911865, -3.701603889465332, -3.5095276832580566, -3.3174514770507812, -3.1253750324249268, -2.9332985877990723, -2.741222381591797, -2.5491461753845215, -2.357069730758667, -2.1649932861328125, -1.972917079925537, -1.7808407545089722, -1.5887644290924072, -1.3966881036758423, -1.2046122550964355, -1.0125359296798706, -0.8204596042633057, -0.6283832788467407, -0.4363069534301758, -0.24423062801361084, -0.0521543025970459, 0.13992202281951904, 0.331998348236084, 0.5240746736526489, 0.7161509990692139, 0.9082273244857788, 1.1003036499023438, 1.2923799753189087, 1.4844563007354736, 1.6765326261520386, 1.8686089515686035, 2.060685157775879, 2.2527616024017334, 2.444838047027588, 2.6369142532348633, 2.8289904594421387, 3.021066904067993, 3.2131433486938477, 3.405219554901123, 3.5972957611083984, 3.789372205734253, 3.9814486503601074, 4.173524856567383, 4.365601062774658, 4.557677268981934, 4.749753952026367, 4.941830158233643]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 9.0, 21.0, 24.0, 39.0, 78.0, 165.0, 327.0, 682.0, 1842.0, 4568.0, 12540.0, 38050.0, 130650.0, 400425.0, 321045.0, 94052.0, 28268.0, 9550.0, 3636.0, 1386.0, 625.0, 261.0, 124.0, 77.0, 39.0, 19.0, 18.0, 10.0, 5.0, 2.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.369140625, -2.2991943359375, -2.229248046875, -2.1593017578125, -2.08935546875, -2.0194091796875, -1.949462890625, -1.8795166015625, -1.8095703125, -1.7396240234375, -1.669677734375, -1.5997314453125, -1.52978515625, -1.4598388671875, -1.389892578125, -1.3199462890625, -1.25, -1.1800537109375, -1.110107421875, -1.0401611328125, -0.97021484375, -0.9002685546875, -0.830322265625, -0.7603759765625, -0.6904296875, -0.6204833984375, -0.550537109375, -0.4805908203125, -0.41064453125, -0.3406982421875, -0.270751953125, -0.2008056640625, -0.130859375, -0.0609130859375, 0.009033203125, 0.0789794921875, 0.14892578125, 0.2188720703125, 0.288818359375, 0.3587646484375, 0.4287109375, 0.4986572265625, 0.568603515625, 0.6385498046875, 0.70849609375, 0.7784423828125, 0.848388671875, 0.9183349609375, 0.98828125, 1.0582275390625, 1.128173828125, 1.1981201171875, 1.26806640625, 1.3380126953125, 1.407958984375, 1.4779052734375, 1.5478515625, 1.6177978515625, 1.687744140625, 1.7576904296875, 1.82763671875, 1.8975830078125, 1.967529296875, 2.0374755859375, 2.107421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 6.0, 5.0, 6.0, 7.0, 15.0, 19.0, 21.0, 27.0, 27.0, 37.0, 33.0, 35.0, 40.0, 54.0, 46.0, 59.0, 55.0, 51.0, 48.0, 46.0, 47.0, 46.0, 34.0, 44.0, 39.0, 28.0, 21.0, 24.0, 20.0, 18.0, 12.0, 10.0, 3.0, 2.0, 2.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-5.6796875, -5.5341796875, -5.388671875, -5.2431640625, -5.09765625, -4.9521484375, -4.806640625, -4.6611328125, -4.515625, -4.3701171875, -4.224609375, -4.0791015625, -3.93359375, -3.7880859375, -3.642578125, -3.4970703125, -3.3515625, -3.2060546875, -3.060546875, -2.9150390625, -2.76953125, -2.6240234375, -2.478515625, -2.3330078125, -2.1875, -2.0419921875, -1.896484375, -1.7509765625, -1.60546875, -1.4599609375, -1.314453125, -1.1689453125, -1.0234375, -0.8779296875, -0.732421875, -0.5869140625, -0.44140625, -0.2958984375, -0.150390625, -0.0048828125, 0.140625, 0.2861328125, 0.431640625, 0.5771484375, 0.72265625, 0.8681640625, 1.013671875, 1.1591796875, 1.3046875, 1.4501953125, 1.595703125, 1.7412109375, 1.88671875, 2.0322265625, 2.177734375, 2.3232421875, 2.46875, 2.6142578125, 2.759765625, 2.9052734375, 3.05078125, 3.1962890625, 3.341796875, 3.4873046875, 3.6328125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 4.0, 9.0, 6.0, 13.0, 20.0, 30.0, 40.0, 41.0, 62.0, 77.0, 104.0, 157.0, 218.0, 427.0, 731.0, 1204.0, 2645.0, 5430.0, 13012.0, 34349.0, 96169.0, 264402.0, 363290.0, 169132.0, 58762.0, 21526.0, 8538.0, 3786.0, 1780.0, 972.0, 563.0, 347.0, 210.0, 120.0, 98.0, 50.0, 55.0, 39.0, 31.0, 29.0, 23.0, 12.0, 8.0, 7.0, 3.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.66015625, -1.6102447509765625, -1.560333251953125, -1.5104217529296875, -1.46051025390625, -1.4105987548828125, -1.360687255859375, -1.3107757568359375, -1.2608642578125, -1.2109527587890625, -1.161041259765625, -1.1111297607421875, -1.06121826171875, -1.0113067626953125, -0.961395263671875, -0.9114837646484375, -0.861572265625, -0.8116607666015625, -0.761749267578125, -0.7118377685546875, -0.66192626953125, -0.6120147705078125, -0.562103271484375, -0.5121917724609375, -0.4622802734375, -0.4123687744140625, -0.362457275390625, -0.3125457763671875, -0.26263427734375, -0.2127227783203125, -0.162811279296875, -0.1128997802734375, -0.06298828125, -0.0130767822265625, 0.036834716796875, 0.0867462158203125, 0.13665771484375, 0.1865692138671875, 0.236480712890625, 0.2863922119140625, 0.3363037109375, 0.3862152099609375, 0.436126708984375, 0.4860382080078125, 0.53594970703125, 0.5858612060546875, 0.635772705078125, 0.6856842041015625, 0.735595703125, 0.7855072021484375, 0.835418701171875, 0.8853302001953125, 0.93524169921875, 0.9851531982421875, 1.035064697265625, 1.0849761962890625, 1.1348876953125, 1.1847991943359375, 1.234710693359375, 1.2846221923828125, 1.33453369140625, 1.3844451904296875, 1.434356689453125, 1.4842681884765625, 1.5341796875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 3.0, 5.0, 4.0, 4.0, 7.0, 3.0, 7.0, 6.0, 8.0, 14.0, 12.0, 19.0, 22.0, 24.0, 17.0, 22.0, 21.0, 27.0, 31.0, 38.0, 27.0, 42.0, 39.0, 27.0, 47.0, 38.0, 37.0, 40.0, 43.0, 40.0, 39.0, 28.0, 37.0, 35.0, 21.0, 25.0, 21.0, 16.0, 19.0, 16.0, 8.0, 18.0, 10.0, 10.0, 9.0, 5.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.18359375, -6.965576171875, -6.74755859375, -6.529541015625, -6.3115234375, -6.093505859375, -5.87548828125, -5.657470703125, -5.439453125, -5.221435546875, -5.00341796875, -4.785400390625, -4.5673828125, -4.349365234375, -4.13134765625, -3.913330078125, -3.6953125, -3.477294921875, -3.25927734375, -3.041259765625, -2.8232421875, -2.605224609375, -2.38720703125, -2.169189453125, -1.951171875, -1.733154296875, -1.51513671875, -1.297119140625, -1.0791015625, -0.861083984375, -0.64306640625, -0.425048828125, -0.20703125, 0.010986328125, 0.22900390625, 0.447021484375, 0.6650390625, 0.883056640625, 1.10107421875, 1.319091796875, 1.537109375, 1.755126953125, 1.97314453125, 2.191162109375, 2.4091796875, 2.627197265625, 2.84521484375, 3.063232421875, 3.28125, 3.499267578125, 3.71728515625, 3.935302734375, 4.1533203125, 4.371337890625, 4.58935546875, 4.807373046875, 5.025390625, 5.243408203125, 5.46142578125, 5.679443359375, 5.8974609375, 6.115478515625, 6.33349609375, 6.551513671875, 6.76953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 6.0, 6.0, 11.0, 17.0, 11.0, 21.0, 37.0, 61.0, 74.0, 140.0, 278.0, 512.0, 950.0, 2151.0, 4960.0, 12662.0, 38245.0, 133584.0, 389767.0, 322702.0, 96808.0, 28509.0, 9629.0, 3936.0, 1663.0, 788.0, 450.0, 250.0, 119.0, 77.0, 48.0, 26.0, 19.0, 15.0, 8.0, 8.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6845703125, -0.6600112915039062, -0.6354522705078125, -0.6108932495117188, -0.586334228515625, -0.5617752075195312, -0.5372161865234375, -0.5126571655273438, -0.48809814453125, -0.46353912353515625, -0.4389801025390625, -0.41442108154296875, -0.389862060546875, -0.36530303955078125, -0.3407440185546875, -0.31618499755859375, -0.2916259765625, -0.26706695556640625, -0.2425079345703125, -0.21794891357421875, -0.193389892578125, -0.16883087158203125, -0.1442718505859375, -0.11971282958984375, -0.09515380859375, -0.07059478759765625, -0.0460357666015625, -0.02147674560546875, 0.003082275390625, 0.02764129638671875, 0.0522003173828125, 0.07675933837890625, 0.101318359375, 0.12587738037109375, 0.1504364013671875, 0.17499542236328125, 0.199554443359375, 0.22411346435546875, 0.2486724853515625, 0.27323150634765625, 0.29779052734375, 0.32234954833984375, 0.3469085693359375, 0.37146759033203125, 0.396026611328125, 0.42058563232421875, 0.4451446533203125, 0.46970367431640625, 0.4942626953125, 0.5188217163085938, 0.5433807373046875, 0.5679397583007812, 0.592498779296875, 0.6170578002929688, 0.6416168212890625, 0.6661758422851562, 0.69073486328125, 0.7152938842773438, 0.7398529052734375, 0.7644119262695312, 0.788970947265625, 0.8135299682617188, 0.8380889892578125, 0.8626480102539062, 0.88720703125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 13.0, 14.0, 16.0, 20.0, 37.0, 37.0, 47.0, 56.0, 73.0, 89.0, 93.0, 90.0, 91.0, 71.0, 52.0, 40.0, 36.0, 25.0, 28.0, 18.0, 11.0, 3.0, 6.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00043773651123046875, -0.0004244595766067505, -0.0004111826419830322, -0.00039790570735931396, -0.0003846287727355957, -0.00037135183811187744, -0.0003580749034881592, -0.0003447979688644409, -0.00033152103424072266, -0.0003182440996170044, -0.00030496716499328613, -0.00029169023036956787, -0.0002784132957458496, -0.00026513636112213135, -0.0002518594264984131, -0.00023858249187469482, -0.00022530555725097656, -0.0002120286226272583, -0.00019875168800354004, -0.00018547475337982178, -0.00017219781875610352, -0.00015892088413238525, -0.000145643949508667, -0.00013236701488494873, -0.00011909008026123047, -0.00010581314563751221, -9.253621101379395e-05, -7.925927639007568e-05, -6.598234176635742e-05, -5.270540714263916e-05, -3.94284725189209e-05, -2.6151537895202637e-05, -1.2874603271484375e-05, 4.023313522338867e-07, 1.3679265975952148e-05, 2.695620059967041e-05, 4.023313522338867e-05, 5.3510069847106934e-05, 6.67870044708252e-05, 8.006393909454346e-05, 9.334087371826172e-05, 0.00010661780834197998, 0.00011989474296569824, 0.0001331716775894165, 0.00014644861221313477, 0.00015972554683685303, 0.0001730024814605713, 0.00018627941608428955, 0.0001995563507080078, 0.00021283328533172607, 0.00022611021995544434, 0.0002393871545791626, 0.00025266408920288086, 0.0002659410238265991, 0.0002792179584503174, 0.00029249489307403564, 0.0003057718276977539, 0.00031904876232147217, 0.00033232569694519043, 0.0003456026315689087, 0.00035887956619262695, 0.0003721565008163452, 0.0003854334354400635, 0.00039871037006378174, 0.0004119873046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 1.0, 4.0, 11.0, 8.0, 12.0, 15.0, 21.0, 36.0, 67.0, 107.0, 186.0, 416.0, 932.0, 2776.0, 9518.0, 41025.0, 211727.0, 532606.0, 197585.0, 38191.0, 8924.0, 2684.0, 898.0, 370.0, 162.0, 99.0, 61.0, 27.0, 33.0, 15.0, 13.0, 9.0, 5.0, 2.0, 2.0, 3.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.06640625, -1.0345535278320312, -1.0027008056640625, -0.9708480834960938, -0.938995361328125, -0.9071426391601562, -0.8752899169921875, -0.8434371948242188, -0.81158447265625, -0.7797317504882812, -0.7478790283203125, -0.7160263061523438, -0.684173583984375, -0.6523208618164062, -0.6204681396484375, -0.5886154174804688, -0.5567626953125, -0.5249099731445312, -0.4930572509765625, -0.46120452880859375, -0.429351806640625, -0.39749908447265625, -0.3656463623046875, -0.33379364013671875, -0.30194091796875, -0.27008819580078125, -0.2382354736328125, -0.20638275146484375, -0.174530029296875, -0.14267730712890625, -0.1108245849609375, -0.07897186279296875, -0.047119140625, -0.01526641845703125, 0.0165863037109375, 0.04843902587890625, 0.080291748046875, 0.11214447021484375, 0.1439971923828125, 0.17584991455078125, 0.20770263671875, 0.23955535888671875, 0.2714080810546875, 0.30326080322265625, 0.335113525390625, 0.36696624755859375, 0.3988189697265625, 0.43067169189453125, 0.4625244140625, 0.49437713623046875, 0.5262298583984375, 0.5580825805664062, 0.589935302734375, 0.6217880249023438, 0.6536407470703125, 0.6854934692382812, 0.71734619140625, 0.7491989135742188, 0.7810516357421875, 0.8129043579101562, 0.844757080078125, 0.8766098022460938, 0.9084625244140625, 0.9403152465820312, 0.97216796875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 4.0, 6.0, 9.0, 12.0, 19.0, 12.0, 14.0, 29.0, 31.0, 40.0, 47.0, 49.0, 49.0, 67.0, 56.0, 74.0, 65.0, 69.0, 57.0, 38.0, 45.0, 39.0, 26.0, 34.0, 29.0, 19.0, 12.0, 13.0, 12.0, 9.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.167724609375, -0.1619281768798828, -0.15613174438476562, -0.15033531188964844, -0.14453887939453125, -0.13874244689941406, -0.13294601440429688, -0.1271495819091797, -0.1213531494140625, -0.11555671691894531, -0.10976028442382812, -0.10396385192871094, -0.09816741943359375, -0.09237098693847656, -0.08657455444335938, -0.08077812194824219, -0.074981689453125, -0.06918525695800781, -0.06338882446289062, -0.05759239196777344, -0.05179595947265625, -0.04599952697753906, -0.040203094482421875, -0.03440666198730469, -0.0286102294921875, -0.022813796997070312, -0.017017364501953125, -0.011220932006835938, -0.00542449951171875, 0.0003719329833984375, 0.006168365478515625, 0.011964797973632812, 0.01776123046875, 0.023557662963867188, 0.029354095458984375, 0.03515052795410156, 0.04094696044921875, 0.04674339294433594, 0.052539825439453125, 0.05833625793457031, 0.0641326904296875, 0.06992912292480469, 0.07572555541992188, 0.08152198791503906, 0.08731842041015625, 0.09311485290527344, 0.09891128540039062, 0.10470771789550781, 0.110504150390625, 0.11630058288574219, 0.12209701538085938, 0.12789344787597656, 0.13368988037109375, 0.13948631286621094, 0.14528274536132812, 0.1510791778564453, 0.1568756103515625, 0.1626720428466797, 0.16846847534179688, 0.17426490783691406, 0.18006134033203125, 0.18585777282714844, 0.19165420532226562, 0.1974506378173828, 0.2032470703125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 15.0, 16.0, 21.0, 29.0, 48.0, 64.0, 118.0, 115.0, 130.0, 131.0, 97.0, 77.0, 42.0, 30.0, 23.0, 13.0, 10.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.168880462646484, -11.88785171508789, -11.60682201385498, -11.325793266296387, -11.044764518737793, -10.7637357711792, -10.482706069946289, -10.201677322387695, -9.920648574829102, -9.639619827270508, -9.358590126037598, -9.077561378479004, -8.79653263092041, -8.515503883361816, -8.234474182128906, -7.9534454345703125, -7.6724162101745605, -7.391386985778809, -7.110358238220215, -6.829329013824463, -6.548300266265869, -6.267271041870117, -5.986242294311523, -5.7052130699157715, -5.4241838455200195, -5.143154621124268, -4.862125873565674, -4.581096649169922, -4.300067901611328, -4.019038677215576, -3.7380096912384033, -3.4569807052612305, -3.175952434539795, -2.894923448562622, -2.613894462585449, -2.3328652381896973, -2.0518364906311035, -1.7708073854446411, -1.4897782802581787, -1.2087492942810059, -0.927720308303833, -0.6466913223266602, -0.36566227674484253, -0.0846332311630249, 0.19639575481414795, 0.4774247407913208, 0.7584538459777832, 1.039482831954956, 1.320511817932129, 1.6015408039093018, 1.8825697898864746, 2.1635990142822266, 2.4446277618408203, 2.7256569862365723, 3.006685972213745, 3.287714958190918, 3.568743944168091, 3.8497729301452637, 4.130802154541016, 4.411830902099609, 4.692860126495361, 4.973888874053955, 5.254918098449707, 5.535946846008301, 5.816976070404053]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 6.0, 3.0, 13.0, 9.0, 11.0, 19.0, 11.0, 22.0, 28.0, 40.0, 33.0, 40.0, 45.0, 43.0, 50.0, 66.0, 60.0, 41.0, 55.0, 51.0, 53.0, 50.0, 38.0, 28.0, 27.0, 29.0, 25.0, 24.0, 15.0, 15.0, 18.0, 10.0, 6.0, 1.0, 5.0, 7.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0], "bins": [-5.663597106933594, -5.51999568939209, -5.376394271850586, -5.232792854309082, -5.089191436767578, -4.945590019226074, -4.80198860168457, -4.658387184143066, -4.5147857666015625, -4.371184349060059, -4.227582931518555, -4.083981513977051, -3.940380096435547, -3.796778678894043, -3.653177499771118, -3.5095760822296143, -3.3659749031066895, -3.2223734855651855, -3.0787720680236816, -2.9351706504821777, -2.791569232940674, -2.64796781539917, -2.504366636276245, -2.360765218734741, -2.2171638011932373, -2.0735623836517334, -1.9299609661102295, -1.7863596677780151, -1.6427582502365112, -1.4991568326950073, -1.355555534362793, -1.211954116821289, -1.068352460861206, -0.9247510433197021, -0.781149685382843, -0.6375483274459839, -0.49394690990448, -0.3503454923629761, -0.20674413442611694, -0.06314277648925781, 0.0804586410522461, 0.2240600287914276, 0.36766141653060913, 0.5112627744674683, 0.6548641920089722, 0.7984656095504761, 0.9420669674873352, 1.0856683254241943, 1.2292697429656982, 1.3728711605072021, 1.516472578048706, 1.6600738763809204, 1.8036752939224243, 1.9472767114639282, 2.0908780097961426, 2.2344794273376465, 2.3780808448791504, 2.5216822624206543, 2.665283679962158, 2.808885097503662, 2.952486515045166, 3.09608793258667, 3.2396891117095947, 3.3832905292510986, 3.5268919467926025]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 4.0, 6.0, 3.0, 7.0, 3.0, 6.0, 16.0, 14.0, 18.0, 38.0, 99.0, 381.0, 4179.0, 154196.0, 869833.0, 18359.0, 1065.0, 150.0, 48.0, 31.0, 15.0, 16.0, 13.0, 13.0, 7.0, 5.0, 5.0, 8.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-24.953125, -24.178955078125, -23.40478515625, -22.630615234375, -21.8564453125, -21.082275390625, -20.30810546875, -19.533935546875, -18.759765625, -17.985595703125, -17.21142578125, -16.437255859375, -15.6630859375, -14.888916015625, -14.11474609375, -13.340576171875, -12.56640625, -11.792236328125, -11.01806640625, -10.243896484375, -9.4697265625, -8.695556640625, -7.92138671875, -7.147216796875, -6.373046875, -5.598876953125, -4.82470703125, -4.050537109375, -3.2763671875, -2.502197265625, -1.72802734375, -0.953857421875, -0.1796875, 0.594482421875, 1.36865234375, 2.142822265625, 2.9169921875, 3.691162109375, 4.46533203125, 5.239501953125, 6.013671875, 6.787841796875, 7.56201171875, 8.336181640625, 9.1103515625, 9.884521484375, 10.65869140625, 11.432861328125, 12.20703125, 12.981201171875, 13.75537109375, 14.529541015625, 15.3037109375, 16.077880859375, 16.85205078125, 17.626220703125, 18.400390625, 19.174560546875, 19.94873046875, 20.722900390625, 21.4970703125, 22.271240234375, 23.04541015625, 23.819580078125, 24.59375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 6.0, 10.0, 5.0, 8.0, 17.0, 12.0, 26.0, 29.0, 40.0, 39.0, 60.0, 54.0, 55.0, 54.0, 62.0, 68.0, 63.0, 60.0, 75.0, 44.0, 45.0, 26.0, 24.0, 24.0, 21.0, 20.0, 8.0, 13.0, 8.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.265625, -12.9073486328125, -12.549072265625, -12.1907958984375, -11.83251953125, -11.4742431640625, -11.115966796875, -10.7576904296875, -10.3994140625, -10.0411376953125, -9.682861328125, -9.3245849609375, -8.96630859375, -8.6080322265625, -8.249755859375, -7.8914794921875, -7.533203125, -7.1749267578125, -6.816650390625, -6.4583740234375, -6.10009765625, -5.7418212890625, -5.383544921875, -5.0252685546875, -4.6669921875, -4.3087158203125, -3.950439453125, -3.5921630859375, -3.23388671875, -2.8756103515625, -2.517333984375, -2.1590576171875, -1.80078125, -1.4425048828125, -1.084228515625, -0.7259521484375, -0.36767578125, -0.0093994140625, 0.348876953125, 0.7071533203125, 1.0654296875, 1.4237060546875, 1.781982421875, 2.1402587890625, 2.49853515625, 2.8568115234375, 3.215087890625, 3.5733642578125, 3.931640625, 4.2899169921875, 4.648193359375, 5.0064697265625, 5.36474609375, 5.7230224609375, 6.081298828125, 6.4395751953125, 6.7978515625, 7.1561279296875, 7.514404296875, 7.8726806640625, 8.23095703125, 8.5892333984375, 8.947509765625, 9.3057861328125, 9.6640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 9.0, 8.0, 9.0, 9.0, 11.0, 23.0, 19.0, 24.0, 21.0, 33.0, 49.0, 53.0, 71.0, 94.0, 90.0, 170.0, 351.0, 1162.0, 5287.0, 38359.0, 469654.0, 485025.0, 40333.0, 5443.0, 1155.0, 357.0, 193.0, 104.0, 77.0, 64.0, 62.0, 32.0, 32.0, 31.0, 30.0, 22.0, 19.0, 12.0, 13.0, 7.0, 11.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.46875, -9.142333984375, -8.81591796875, -8.489501953125, -8.1630859375, -7.836669921875, -7.51025390625, -7.183837890625, -6.857421875, -6.531005859375, -6.20458984375, -5.878173828125, -5.5517578125, -5.225341796875, -4.89892578125, -4.572509765625, -4.24609375, -3.919677734375, -3.59326171875, -3.266845703125, -2.9404296875, -2.614013671875, -2.28759765625, -1.961181640625, -1.634765625, -1.308349609375, -0.98193359375, -0.655517578125, -0.3291015625, -0.002685546875, 0.32373046875, 0.650146484375, 0.9765625, 1.302978515625, 1.62939453125, 1.955810546875, 2.2822265625, 2.608642578125, 2.93505859375, 3.261474609375, 3.587890625, 3.914306640625, 4.24072265625, 4.567138671875, 4.8935546875, 5.219970703125, 5.54638671875, 5.872802734375, 6.19921875, 6.525634765625, 6.85205078125, 7.178466796875, 7.5048828125, 7.831298828125, 8.15771484375, 8.484130859375, 8.810546875, 9.136962890625, 9.46337890625, 9.789794921875, 10.1162109375, 10.442626953125, 10.76904296875, 11.095458984375, 11.421875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 7.0, 6.0, 9.0, 7.0, 12.0, 18.0, 16.0, 18.0, 16.0, 22.0, 29.0, 40.0, 29.0, 30.0, 32.0, 47.0, 49.0, 40.0, 40.0, 53.0, 33.0, 33.0, 43.0, 37.0, 37.0, 38.0, 33.0, 28.0, 27.0, 29.0, 25.0, 22.0, 9.0, 16.0, 16.0, 8.0, 8.0, 2.0, 6.0, 4.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.49609375, -7.23748779296875, -6.9788818359375, -6.72027587890625, -6.461669921875, -6.20306396484375, -5.9444580078125, -5.68585205078125, -5.42724609375, -5.16864013671875, -4.9100341796875, -4.65142822265625, -4.392822265625, -4.13421630859375, -3.8756103515625, -3.61700439453125, -3.3583984375, -3.09979248046875, -2.8411865234375, -2.58258056640625, -2.323974609375, -2.06536865234375, -1.8067626953125, -1.54815673828125, -1.28955078125, -1.03094482421875, -0.7723388671875, -0.51373291015625, -0.255126953125, 0.00347900390625, 0.2620849609375, 0.52069091796875, 0.779296875, 1.03790283203125, 1.2965087890625, 1.55511474609375, 1.813720703125, 2.07232666015625, 2.3309326171875, 2.58953857421875, 2.84814453125, 3.10675048828125, 3.3653564453125, 3.62396240234375, 3.882568359375, 4.14117431640625, 4.3997802734375, 4.65838623046875, 4.9169921875, 5.17559814453125, 5.4342041015625, 5.69281005859375, 5.951416015625, 6.21002197265625, 6.4686279296875, 6.72723388671875, 6.98583984375, 7.24444580078125, 7.5030517578125, 7.76165771484375, 8.020263671875, 8.27886962890625, 8.5374755859375, 8.79608154296875, 9.0546875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 11.0, 11.0, 21.0, 24.0, 45.0, 68.0, 120.0, 187.0, 301.0, 482.0, 754.0, 1236.0, 2307.0, 4379.0, 9358.0, 23629.0, 73469.0, 281727.0, 448789.0, 135429.0, 39007.0, 13757.0, 6100.0, 3098.0, 1694.0, 1042.0, 550.0, 356.0, 216.0, 124.0, 99.0, 53.0, 40.0, 17.0, 14.0, 5.0, 12.0, 7.0, 7.0, 4.0, 1.0, 5.0, 2.0, 2.0], "bins": [-1.7939453125, -1.7470245361328125, -1.700103759765625, -1.6531829833984375, -1.60626220703125, -1.5593414306640625, -1.512420654296875, -1.4654998779296875, -1.4185791015625, -1.3716583251953125, -1.324737548828125, -1.2778167724609375, -1.23089599609375, -1.1839752197265625, -1.137054443359375, -1.0901336669921875, -1.043212890625, -0.9962921142578125, -0.949371337890625, -0.9024505615234375, -0.85552978515625, -0.8086090087890625, -0.761688232421875, -0.7147674560546875, -0.6678466796875, -0.6209259033203125, -0.574005126953125, -0.5270843505859375, -0.48016357421875, -0.4332427978515625, -0.386322021484375, -0.3394012451171875, -0.29248046875, -0.2455596923828125, -0.198638916015625, -0.1517181396484375, -0.10479736328125, -0.0578765869140625, -0.010955810546875, 0.0359649658203125, 0.0828857421875, 0.1298065185546875, 0.176727294921875, 0.2236480712890625, 0.27056884765625, 0.3174896240234375, 0.364410400390625, 0.4113311767578125, 0.458251953125, 0.5051727294921875, 0.552093505859375, 0.5990142822265625, 0.64593505859375, 0.6928558349609375, 0.739776611328125, 0.7866973876953125, 0.8336181640625, 0.8805389404296875, 0.927459716796875, 0.9743804931640625, 1.02130126953125, 1.0682220458984375, 1.115142822265625, 1.1620635986328125, 1.208984375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 5.0, 2.0, 4.0, 7.0, 19.0, 9.0, 11.0, 19.0, 31.0, 30.0, 37.0, 50.0, 68.0, 88.0, 99.0, 99.0, 71.0, 68.0, 52.0, 50.0, 34.0, 41.0, 18.0, 17.0, 13.0, 9.0, 9.0, 6.0, 4.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002574920654296875, -0.00024863332509994507, -0.00023977458477020264, -0.0002309158444404602, -0.00022205710411071777, -0.00021319836378097534, -0.0002043396234512329, -0.00019548088312149048, -0.00018662214279174805, -0.00017776340246200562, -0.00016890466213226318, -0.00016004592180252075, -0.00015118718147277832, -0.0001423284411430359, -0.00013346970081329346, -0.00012461096048355103, -0.0001157522201538086, -0.00010689347982406616, -9.803473949432373e-05, -8.91759991645813e-05, -8.031725883483887e-05, -7.145851850509644e-05, -6.2599778175354e-05, -5.374103784561157e-05, -4.488229751586914e-05, -3.602355718612671e-05, -2.7164816856384277e-05, -1.8306076526641846e-05, -9.447336196899414e-06, -5.885958671569824e-07, 8.27014446258545e-06, 1.712888479232788e-05, 2.5987625122070312e-05, 3.4846365451812744e-05, 4.3705105781555176e-05, 5.256384611129761e-05, 6.142258644104004e-05, 7.028132677078247e-05, 7.91400671005249e-05, 8.799880743026733e-05, 9.685754776000977e-05, 0.0001057162880897522, 0.00011457502841949463, 0.00012343376874923706, 0.0001322925090789795, 0.00014115124940872192, 0.00015000998973846436, 0.0001588687300682068, 0.00016772747039794922, 0.00017658621072769165, 0.00018544495105743408, 0.00019430369138717651, 0.00020316243171691895, 0.00021202117204666138, 0.0002208799123764038, 0.00022973865270614624, 0.00023859739303588867, 0.0002474561333656311, 0.00025631487369537354, 0.00026517361402511597, 0.0002740323543548584, 0.00028289109468460083, 0.00029174983501434326, 0.0003006085753440857, 0.0003094673156738281]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 12.0, 24.0, 36.0, 56.0, 63.0, 83.0, 160.0, 239.0, 434.0, 723.0, 1203.0, 2112.0, 4169.0, 9372.0, 23708.0, 70800.0, 247017.0, 448499.0, 159901.0, 48303.0, 16925.0, 7003.0, 3372.0, 1730.0, 1006.0, 593.0, 344.0, 239.0, 141.0, 88.0, 50.0, 33.0, 35.0, 22.0, 15.0, 6.0, 5.0, 7.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5283203125, -1.4824676513671875, -1.436614990234375, -1.3907623291015625, -1.34490966796875, -1.2990570068359375, -1.253204345703125, -1.2073516845703125, -1.1614990234375, -1.1156463623046875, -1.069793701171875, -1.0239410400390625, -0.97808837890625, -0.9322357177734375, -0.886383056640625, -0.8405303955078125, -0.794677734375, -0.7488250732421875, -0.702972412109375, -0.6571197509765625, -0.61126708984375, -0.5654144287109375, -0.519561767578125, -0.4737091064453125, -0.4278564453125, -0.3820037841796875, -0.336151123046875, -0.2902984619140625, -0.24444580078125, -0.1985931396484375, -0.152740478515625, -0.1068878173828125, -0.06103515625, -0.0151824951171875, 0.030670166015625, 0.0765228271484375, 0.12237548828125, 0.1682281494140625, 0.214080810546875, 0.2599334716796875, 0.3057861328125, 0.3516387939453125, 0.397491455078125, 0.4433441162109375, 0.48919677734375, 0.5350494384765625, 0.580902099609375, 0.6267547607421875, 0.672607421875, 0.7184600830078125, 0.764312744140625, 0.8101654052734375, 0.85601806640625, 0.9018707275390625, 0.947723388671875, 0.9935760498046875, 1.0394287109375, 1.0852813720703125, 1.131134033203125, 1.1769866943359375, 1.22283935546875, 1.2686920166015625, 1.314544677734375, 1.3603973388671875, 1.40625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 10.0, 19.0, 22.0, 31.0, 29.0, 32.0, 33.0, 63.0, 68.0, 98.0, 90.0, 89.0, 55.0, 68.0, 44.0, 39.0, 37.0, 43.0, 25.0, 20.0, 10.0, 14.0, 7.0, 12.0, 4.0, 5.0, 10.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7158203125, -0.6911697387695312, -0.6665191650390625, -0.6418685913085938, -0.617218017578125, -0.5925674438476562, -0.5679168701171875, -0.5432662963867188, -0.51861572265625, -0.49396514892578125, -0.4693145751953125, -0.44466400146484375, -0.420013427734375, -0.39536285400390625, -0.3707122802734375, -0.34606170654296875, -0.3214111328125, -0.29676055908203125, -0.2721099853515625, -0.24745941162109375, -0.222808837890625, -0.19815826416015625, -0.1735076904296875, -0.14885711669921875, -0.12420654296875, -0.09955596923828125, -0.0749053955078125, -0.05025482177734375, -0.025604248046875, -0.00095367431640625, 0.0236968994140625, 0.04834747314453125, 0.072998046875, 0.09764862060546875, 0.1222991943359375, 0.14694976806640625, 0.171600341796875, 0.19625091552734375, 0.2209014892578125, 0.24555206298828125, 0.27020263671875, 0.29485321044921875, 0.3195037841796875, 0.34415435791015625, 0.368804931640625, 0.39345550537109375, 0.4181060791015625, 0.44275665283203125, 0.4674072265625, 0.49205780029296875, 0.5167083740234375, 0.5413589477539062, 0.566009521484375, 0.5906600952148438, 0.6153106689453125, 0.6399612426757812, 0.66461181640625, 0.6892623901367188, 0.7139129638671875, 0.7385635375976562, 0.763214111328125, 0.7878646850585938, 0.8125152587890625, 0.8371658325195312, 0.86181640625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 2.0, 6.0, 37.0, 87.0, 200.0, 315.0, 207.0, 94.0, 39.0, 16.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.23944091796875, -62.94206619262695, -61.644691467285156, -60.347312927246094, -59.0499382019043, -57.7525634765625, -56.4551887512207, -55.157814025878906, -53.860435485839844, -52.56306076049805, -51.26568603515625, -49.96830749511719, -48.67093276977539, -47.373558044433594, -46.0761833190918, -44.77880859375, -43.48143005371094, -42.18405532836914, -40.886680603027344, -39.58930206298828, -38.291927337646484, -36.99455261230469, -35.69717788696289, -34.399803161621094, -33.1024284362793, -31.8050537109375, -30.50767707824707, -29.210302352905273, -27.912925720214844, -26.615550994873047, -25.31817626953125, -24.02079963684082, -22.723421096801758, -21.42604637145996, -20.12866973876953, -18.831295013427734, -17.533918380737305, -16.236543655395508, -14.939167976379395, -13.641792297363281, -12.344416618347168, -11.047040939331055, -9.749665260314941, -8.452289581298828, -7.154914379119873, -5.85753870010376, -4.560163497924805, -3.2627878189086914, -1.9654121398925781, -0.6680365800857544, 0.6293389797210693, 1.9267144203186035, 3.224090099334717, 4.52146577835083, 5.818840980529785, 7.116216659545898, 8.413592338562012, 9.710968017578125, 11.008343696594238, 12.305719375610352, 13.603094100952148, 14.900470733642578, 16.197845458984375, 17.495220184326172, 18.7925968170166]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 6.0, 7.0, 7.0, 8.0, 14.0, 19.0, 24.0, 23.0, 24.0, 25.0, 29.0, 24.0, 32.0, 31.0, 33.0, 38.0, 34.0, 40.0, 43.0, 45.0, 38.0, 41.0, 40.0, 24.0, 39.0, 43.0, 28.0, 28.0, 26.0, 25.0, 26.0, 17.0, 14.0, 19.0, 16.0, 15.0, 11.0, 8.0, 11.0, 3.0, 8.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-16.046903610229492, -15.610644340515137, -15.174386024475098, -14.738126754760742, -14.301868438720703, -13.865609169006348, -13.429349899291992, -12.993091583251953, -12.556832313537598, -12.120573043823242, -11.684314727783203, -11.248055458068848, -10.811796188354492, -10.375537872314453, -9.939278602600098, -9.503019332885742, -9.066761016845703, -8.630501747131348, -8.194243431091309, -7.757984161376953, -7.321725368499756, -6.885466575622559, -6.449207305908203, -6.012948513031006, -5.576689720153809, -5.140430927276611, -4.704172134399414, -4.267912864685059, -3.8316540718078613, -3.395395278930664, -2.9591362476348877, -2.5228772163391113, -2.0866193771362305, -1.6503604650497437, -1.2141015529632568, -0.77784264087677, -0.3415837287902832, 0.09467506408691406, 0.5309340953826904, 0.9671931266784668, 1.403451919555664, 1.8397108316421509, 2.2759697437286377, 2.712228775024414, 3.1484875679016113, 3.5847463607788086, 4.021005630493164, 4.457264423370361, 4.893523216247559, 5.329782009124756, 5.766040802001953, 6.202300071716309, 6.638558864593506, 7.074817657470703, 7.511076927185059, 7.947335720062256, 8.383594512939453, 8.819853782653809, 9.256112098693848, 9.692371368408203, 10.128629684448242, 10.564888954162598, 11.001148223876953, 11.437406539916992, 11.873665809631348]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 8.0, 11.0, 10.0, 14.0, 28.0, 31.0, 42.0, 68.0, 119.0, 179.0, 240.0, 412.0, 725.0, 1277.0, 2301.0, 4354.0, 9307.0, 22847.0, 68041.0, 263591.0, 1132734.0, 1939147.0, 552281.0, 128896.0, 38551.0, 15015.0, 6672.0, 3266.0, 1741.0, 925.0, 552.0, 320.0, 191.0, 115.0, 66.0, 68.0, 39.0, 30.0, 18.0, 12.0, 13.0, 5.0, 6.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.609375, -5.4239501953125, -5.238525390625, -5.0531005859375, -4.86767578125, -4.6822509765625, -4.496826171875, -4.3114013671875, -4.1259765625, -3.9405517578125, -3.755126953125, -3.5697021484375, -3.38427734375, -3.1988525390625, -3.013427734375, -2.8280029296875, -2.642578125, -2.4571533203125, -2.271728515625, -2.0863037109375, -1.90087890625, -1.7154541015625, -1.530029296875, -1.3446044921875, -1.1591796875, -0.9737548828125, -0.788330078125, -0.6029052734375, -0.41748046875, -0.2320556640625, -0.046630859375, 0.1387939453125, 0.32421875, 0.5096435546875, 0.695068359375, 0.8804931640625, 1.06591796875, 1.2513427734375, 1.436767578125, 1.6221923828125, 1.8076171875, 1.9930419921875, 2.178466796875, 2.3638916015625, 2.54931640625, 2.7347412109375, 2.920166015625, 3.1055908203125, 3.291015625, 3.4764404296875, 3.661865234375, 3.8472900390625, 4.03271484375, 4.2181396484375, 4.403564453125, 4.5889892578125, 4.7744140625, 4.9598388671875, 5.145263671875, 5.3306884765625, 5.51611328125, 5.7015380859375, 5.886962890625, 6.0723876953125, 6.2578125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 15.0, 18.0, 16.0, 23.0, 18.0, 27.0, 27.0, 31.0, 47.0, 53.0, 55.0, 53.0, 57.0, 59.0, 60.0, 59.0, 47.0, 44.0, 51.0, 43.0, 33.0, 32.0, 22.0, 20.0, 19.0, 16.0, 15.0, 5.0, 8.0, 5.0, 7.0, 6.0, 3.0, 0.0, 3.0, 0.0, 3.0], "bins": [-8.90625, -8.68853759765625, -8.4708251953125, -8.25311279296875, -8.035400390625, -7.81768798828125, -7.5999755859375, -7.38226318359375, -7.16455078125, -6.94683837890625, -6.7291259765625, -6.51141357421875, -6.293701171875, -6.07598876953125, -5.8582763671875, -5.64056396484375, -5.4228515625, -5.20513916015625, -4.9874267578125, -4.76971435546875, -4.552001953125, -4.33428955078125, -4.1165771484375, -3.89886474609375, -3.68115234375, -3.46343994140625, -3.2457275390625, -3.02801513671875, -2.810302734375, -2.59259033203125, -2.3748779296875, -2.15716552734375, -1.939453125, -1.72174072265625, -1.5040283203125, -1.28631591796875, -1.068603515625, -0.85089111328125, -0.6331787109375, -0.41546630859375, -0.19775390625, 0.01995849609375, 0.2376708984375, 0.45538330078125, 0.673095703125, 0.89080810546875, 1.1085205078125, 1.32623291015625, 1.5439453125, 1.76165771484375, 1.9793701171875, 2.19708251953125, 2.414794921875, 2.63250732421875, 2.8502197265625, 3.06793212890625, 3.28564453125, 3.50335693359375, 3.7210693359375, 3.93878173828125, 4.156494140625, 4.37420654296875, 4.5919189453125, 4.80963134765625, 5.02734375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 9.0, 13.0, 20.0, 20.0, 25.0, 40.0, 54.0, 85.0, 179.0, 335.0, 1036.0, 5158.0, 75462.0, 3844458.0, 254797.0, 10106.0, 1569.0, 405.0, 171.0, 113.0, 55.0, 37.0, 27.0, 25.0, 19.0, 13.0, 10.0, 10.0, 5.0, 2.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.8125, -18.25341796875, -17.6943359375, -17.13525390625, -16.576171875, -16.01708984375, -15.4580078125, -14.89892578125, -14.33984375, -13.78076171875, -13.2216796875, -12.66259765625, -12.103515625, -11.54443359375, -10.9853515625, -10.42626953125, -9.8671875, -9.30810546875, -8.7490234375, -8.18994140625, -7.630859375, -7.07177734375, -6.5126953125, -5.95361328125, -5.39453125, -4.83544921875, -4.2763671875, -3.71728515625, -3.158203125, -2.59912109375, -2.0400390625, -1.48095703125, -0.921875, -0.36279296875, 0.1962890625, 0.75537109375, 1.314453125, 1.87353515625, 2.4326171875, 2.99169921875, 3.55078125, 4.10986328125, 4.6689453125, 5.22802734375, 5.787109375, 6.34619140625, 6.9052734375, 7.46435546875, 8.0234375, 8.58251953125, 9.1416015625, 9.70068359375, 10.259765625, 10.81884765625, 11.3779296875, 11.93701171875, 12.49609375, 13.05517578125, 13.6142578125, 14.17333984375, 14.732421875, 15.29150390625, 15.8505859375, 16.40966796875, 16.96875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 9.0, 11.0, 8.0, 9.0, 10.0, 22.0, 29.0, 41.0, 72.0, 76.0, 105.0, 171.0, 259.0, 402.0, 605.0, 629.0, 488.0, 384.0, 232.0, 141.0, 115.0, 61.0, 67.0, 36.0, 21.0, 21.0, 16.0, 15.0, 4.0, 5.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.296875, -2.218597412109375, -2.14031982421875, -2.062042236328125, -1.9837646484375, -1.905487060546875, -1.82720947265625, -1.748931884765625, -1.670654296875, -1.592376708984375, -1.51409912109375, -1.435821533203125, -1.3575439453125, -1.279266357421875, -1.20098876953125, -1.122711181640625, -1.04443359375, -0.966156005859375, -0.88787841796875, -0.809600830078125, -0.7313232421875, -0.653045654296875, -0.57476806640625, -0.496490478515625, -0.418212890625, -0.339935302734375, -0.26165771484375, -0.183380126953125, -0.1051025390625, -0.026824951171875, 0.05145263671875, 0.129730224609375, 0.2080078125, 0.286285400390625, 0.36456298828125, 0.442840576171875, 0.5211181640625, 0.599395751953125, 0.67767333984375, 0.755950927734375, 0.834228515625, 0.912506103515625, 0.99078369140625, 1.069061279296875, 1.1473388671875, 1.225616455078125, 1.30389404296875, 1.382171630859375, 1.46044921875, 1.538726806640625, 1.61700439453125, 1.695281982421875, 1.7735595703125, 1.851837158203125, 1.93011474609375, 2.008392333984375, 2.086669921875, 2.164947509765625, 2.24322509765625, 2.321502685546875, 2.3997802734375, 2.478057861328125, 2.55633544921875, 2.634613037109375, 2.712890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 13.0, 19.0, 23.0, 48.0, 98.0, 118.0, 156.0, 175.0, 136.0, 78.0, 48.0, 44.0, 18.0, 14.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.710124969482422, -22.156557083129883, -21.602989196777344, -21.049423217773438, -20.4958553314209, -19.94228744506836, -19.38871955871582, -18.83515167236328, -18.281583786010742, -17.728015899658203, -17.174448013305664, -16.620880126953125, -16.06731414794922, -15.51374626159668, -14.96017837524414, -14.406610488891602, -13.853043556213379, -13.29947566986084, -12.745908737182617, -12.192340850830078, -11.638772964477539, -11.085205078125, -10.531638145446777, -9.978070259094238, -9.424503326416016, -8.870935440063477, -8.317368507385254, -7.763800621032715, -7.210232734680176, -6.656665325164795, -6.103097915649414, -5.549530029296875, -4.9959611892700195, -4.442393779754639, -3.8888258934020996, -3.3352584838867188, -2.781690835952759, -2.228123188018799, -1.674555778503418, -1.120988130569458, -0.567420482635498, -0.013852894306182861, 0.5397146940231323, 1.0932822227478027, 1.6468498706817627, 2.2004175186157227, 2.7539849281311035, 3.3075525760650635, 3.8611202239990234, 4.414687633514404, 4.968255519866943, 5.521822929382324, 6.075390815734863, 6.628958225250244, 7.182525634765625, 7.736093521118164, 8.289661407470703, 8.843229293823242, 9.396796226501465, 9.950364112854004, 10.503931999206543, 11.057498931884766, 11.611066818237305, 12.164634704589844, 12.718201637268066]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 11.0, 7.0, 10.0, 18.0, 10.0, 22.0, 21.0, 32.0, 25.0, 29.0, 34.0, 37.0, 34.0, 37.0, 54.0, 39.0, 58.0, 40.0, 53.0, 49.0, 49.0, 46.0, 31.0, 41.0, 34.0, 29.0, 25.0, 25.0, 26.0, 20.0, 10.0, 9.0, 11.0, 5.0, 7.0, 3.0, 3.0, 3.0, 2.0, 5.0], "bins": [-8.39116096496582, -8.183818817138672, -7.976476669311523, -7.769134521484375, -7.561792373657227, -7.354450225830078, -7.14710807800293, -6.939765930175781, -6.732423782348633, -6.525081634521484, -6.317739486694336, -6.1103973388671875, -5.903055191040039, -5.695713043212891, -5.488370895385742, -5.281028747558594, -5.073686599731445, -4.866344451904297, -4.659002304077148, -4.45166015625, -4.244318008422852, -4.036975860595703, -3.8296337127685547, -3.6222915649414062, -3.414949893951416, -3.2076077461242676, -3.000265598297119, -2.7929234504699707, -2.5855813026428223, -2.378239154815674, -2.1708970069885254, -1.9635549783706665, -1.7562127113342285, -1.54887056350708, -1.3415284156799316, -1.1341862678527832, -0.9268441796302795, -0.7195020914077759, -0.5121599435806274, -0.304817795753479, -0.09747564792633057, 0.10986648499965668, 0.3172086179256439, 0.52455073595047, 0.7318928837776184, 0.9392349720001221, 1.1465771198272705, 1.353919267654419, 1.5612614154815674, 1.7686035633087158, 1.9759457111358643, 2.1832878589630127, 2.390630006790161, 2.5979719161987305, 2.805314064025879, 3.0126562118530273, 3.219998359680176, 3.427340507507324, 3.6346826553344727, 3.842024803161621, 4.0493669509887695, 4.256709098815918, 4.464051246643066, 4.671393394470215, 4.878735542297363]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 6.0, 12.0, 16.0, 27.0, 70.0, 120.0, 268.0, 631.0, 1416.0, 3518.0, 9724.0, 31700.0, 238587.0, 661449.0, 74188.0, 16861.0, 5967.0, 2246.0, 935.0, 424.0, 192.0, 78.0, 51.0, 26.0, 15.0, 9.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.2265625, -4.124114990234375, -4.02166748046875, -3.919219970703125, -3.8167724609375, -3.714324951171875, -3.61187744140625, -3.509429931640625, -3.406982421875, -3.304534912109375, -3.20208740234375, -3.099639892578125, -2.9971923828125, -2.894744873046875, -2.79229736328125, -2.689849853515625, -2.58740234375, -2.484954833984375, -2.38250732421875, -2.280059814453125, -2.1776123046875, -2.075164794921875, -1.97271728515625, -1.870269775390625, -1.767822265625, -1.665374755859375, -1.56292724609375, -1.460479736328125, -1.3580322265625, -1.255584716796875, -1.15313720703125, -1.050689697265625, -0.9482421875, -0.845794677734375, -0.74334716796875, -0.640899658203125, -0.5384521484375, -0.436004638671875, -0.33355712890625, -0.231109619140625, -0.128662109375, -0.026214599609375, 0.07623291015625, 0.178680419921875, 0.2811279296875, 0.383575439453125, 0.48602294921875, 0.588470458984375, 0.69091796875, 0.793365478515625, 0.89581298828125, 0.998260498046875, 1.1007080078125, 1.203155517578125, 1.30560302734375, 1.408050537109375, 1.510498046875, 1.612945556640625, 1.71539306640625, 1.817840576171875, 1.9202880859375, 2.022735595703125, 2.12518310546875, 2.227630615234375, 2.330078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 7.0, 8.0, 10.0, 8.0, 16.0, 12.0, 24.0, 27.0, 18.0, 25.0, 31.0, 26.0, 36.0, 33.0, 37.0, 42.0, 60.0, 56.0, 49.0, 41.0, 41.0, 51.0, 40.0, 33.0, 34.0, 39.0, 28.0, 20.0, 21.0, 26.0, 22.0, 22.0, 9.0, 7.0, 12.0, 7.0, 4.0, 2.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.953125, -3.8270263671875, -3.700927734375, -3.5748291015625, -3.44873046875, -3.3226318359375, -3.196533203125, -3.0704345703125, -2.9443359375, -2.8182373046875, -2.692138671875, -2.5660400390625, -2.43994140625, -2.3138427734375, -2.187744140625, -2.0616455078125, -1.935546875, -1.8094482421875, -1.683349609375, -1.5572509765625, -1.43115234375, -1.3050537109375, -1.178955078125, -1.0528564453125, -0.9267578125, -0.8006591796875, -0.674560546875, -0.5484619140625, -0.42236328125, -0.2962646484375, -0.170166015625, -0.0440673828125, 0.08203125, 0.2081298828125, 0.334228515625, 0.4603271484375, 0.58642578125, 0.7125244140625, 0.838623046875, 0.9647216796875, 1.0908203125, 1.2169189453125, 1.343017578125, 1.4691162109375, 1.59521484375, 1.7213134765625, 1.847412109375, 1.9735107421875, 2.099609375, 2.2257080078125, 2.351806640625, 2.4779052734375, 2.60400390625, 2.7301025390625, 2.856201171875, 2.9822998046875, 3.1083984375, 3.2344970703125, 3.360595703125, 3.4866943359375, 3.61279296875, 3.7388916015625, 3.864990234375, 3.9910888671875, 4.1171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 5.0, 1.0, 7.0, 6.0, 16.0, 12.0, 21.0, 26.0, 52.0, 101.0, 187.0, 406.0, 851.0, 2209.0, 6370.0, 22701.0, 178567.0, 719944.0, 93049.0, 16065.0, 4844.0, 1757.0, 673.0, 306.0, 148.0, 74.0, 45.0, 33.0, 21.0, 15.0, 13.0, 10.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.80859375, -2.71612548828125, -2.6236572265625, -2.53118896484375, -2.438720703125, -2.34625244140625, -2.2537841796875, -2.16131591796875, -2.06884765625, -1.97637939453125, -1.8839111328125, -1.79144287109375, -1.698974609375, -1.60650634765625, -1.5140380859375, -1.42156982421875, -1.3291015625, -1.23663330078125, -1.1441650390625, -1.05169677734375, -0.959228515625, -0.86676025390625, -0.7742919921875, -0.68182373046875, -0.58935546875, -0.49688720703125, -0.4044189453125, -0.31195068359375, -0.219482421875, -0.12701416015625, -0.0345458984375, 0.05792236328125, 0.150390625, 0.24285888671875, 0.3353271484375, 0.42779541015625, 0.520263671875, 0.61273193359375, 0.7052001953125, 0.79766845703125, 0.89013671875, 0.98260498046875, 1.0750732421875, 1.16754150390625, 1.260009765625, 1.35247802734375, 1.4449462890625, 1.53741455078125, 1.6298828125, 1.72235107421875, 1.8148193359375, 1.90728759765625, 1.999755859375, 2.09222412109375, 2.1846923828125, 2.27716064453125, 2.36962890625, 2.46209716796875, 2.5545654296875, 2.64703369140625, 2.739501953125, 2.83197021484375, 2.9244384765625, 3.01690673828125, 3.109375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 7.0, 5.0, 14.0, 8.0, 15.0, 15.0, 14.0, 22.0, 19.0, 27.0, 30.0, 23.0, 37.0, 35.0, 37.0, 38.0, 50.0, 44.0, 38.0, 33.0, 36.0, 48.0, 40.0, 40.0, 36.0, 38.0, 30.0, 30.0, 29.0, 21.0, 16.0, 21.0, 20.0, 16.0, 12.0, 9.0, 9.0, 8.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.45703125, -7.20977783203125, -6.9625244140625, -6.71527099609375, -6.468017578125, -6.22076416015625, -5.9735107421875, -5.72625732421875, -5.47900390625, -5.23175048828125, -4.9844970703125, -4.73724365234375, -4.489990234375, -4.24273681640625, -3.9954833984375, -3.74822998046875, -3.5009765625, -3.25372314453125, -3.0064697265625, -2.75921630859375, -2.511962890625, -2.26470947265625, -2.0174560546875, -1.77020263671875, -1.52294921875, -1.27569580078125, -1.0284423828125, -0.78118896484375, -0.533935546875, -0.28668212890625, -0.0394287109375, 0.20782470703125, 0.455078125, 0.70233154296875, 0.9495849609375, 1.19683837890625, 1.444091796875, 1.69134521484375, 1.9385986328125, 2.18585205078125, 2.43310546875, 2.68035888671875, 2.9276123046875, 3.17486572265625, 3.422119140625, 3.66937255859375, 3.9166259765625, 4.16387939453125, 4.4111328125, 4.65838623046875, 4.9056396484375, 5.15289306640625, 5.400146484375, 5.64739990234375, 5.8946533203125, 6.14190673828125, 6.38916015625, 6.63641357421875, 6.8836669921875, 7.13092041015625, 7.378173828125, 7.62542724609375, 7.8726806640625, 8.11993408203125, 8.3671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 11.0, 3.0, 8.0, 9.0, 21.0, 41.0, 38.0, 60.0, 90.0, 134.0, 238.0, 377.0, 650.0, 1079.0, 2010.0, 4249.0, 10031.0, 31303.0, 153679.0, 568365.0, 213426.0, 40628.0, 11930.0, 4906.0, 2299.0, 1238.0, 662.0, 419.0, 221.0, 138.0, 92.0, 70.0, 45.0, 29.0, 7.0, 18.0, 9.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.83251953125, -0.8053054809570312, -0.7780914306640625, -0.7508773803710938, -0.723663330078125, -0.6964492797851562, -0.6692352294921875, -0.6420211791992188, -0.61480712890625, -0.5875930786132812, -0.5603790283203125, -0.5331649780273438, -0.505950927734375, -0.47873687744140625, -0.4515228271484375, -0.42430877685546875, -0.3970947265625, -0.36988067626953125, -0.3426666259765625, -0.31545257568359375, -0.288238525390625, -0.26102447509765625, -0.2338104248046875, -0.20659637451171875, -0.17938232421875, -0.15216827392578125, -0.1249542236328125, -0.09774017333984375, -0.070526123046875, -0.04331207275390625, -0.0160980224609375, 0.01111602783203125, 0.038330078125, 0.06554412841796875, 0.0927581787109375, 0.11997222900390625, 0.147186279296875, 0.17440032958984375, 0.2016143798828125, 0.22882843017578125, 0.25604248046875, 0.28325653076171875, 0.3104705810546875, 0.33768463134765625, 0.364898681640625, 0.39211273193359375, 0.4193267822265625, 0.44654083251953125, 0.4737548828125, 0.5009689331054688, 0.5281829833984375, 0.5553970336914062, 0.582611083984375, 0.6098251342773438, 0.6370391845703125, 0.6642532348632812, 0.69146728515625, 0.7186813354492188, 0.7458953857421875, 0.7731094360351562, 0.800323486328125, 0.8275375366210938, 0.8547515869140625, 0.8819656372070312, 0.9091796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 7.0, 13.0, 21.0, 22.0, 44.0, 100.0, 161.0, 183.0, 172.0, 116.0, 67.0, 39.0, 16.0, 13.0, 10.0, 7.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006513595581054688, -0.0006301179528236389, -0.0006088763475418091, -0.0005876347422599792, -0.0005663931369781494, -0.0005451515316963196, -0.0005239099264144897, -0.0005026683211326599, -0.0004814267158508301, -0.00046018511056900024, -0.0004389435052871704, -0.0004177019000053406, -0.00039646029472351074, -0.0003752186894416809, -0.0003539770841598511, -0.00033273547887802124, -0.0003114938735961914, -0.00029025226831436157, -0.00026901066303253174, -0.0002477690577507019, -0.00022652745246887207, -0.00020528584718704224, -0.0001840442419052124, -0.00016280263662338257, -0.00014156103134155273, -0.0001203194260597229, -9.907782077789307e-05, -7.783621549606323e-05, -5.65946102142334e-05, -3.5353004932403564e-05, -1.411139965057373e-05, 7.1302056312561035e-06, 2.8371810913085938e-05, 4.961341619491577e-05, 7.08550214767456e-05, 9.209662675857544e-05, 0.00011333823204040527, 0.0001345798373222351, 0.00015582144260406494, 0.00017706304788589478, 0.0001983046531677246, 0.00021954625844955444, 0.00024078786373138428, 0.0002620294690132141, 0.00028327107429504395, 0.0003045126795768738, 0.0003257542848587036, 0.00034699589014053345, 0.0003682374954223633, 0.0003894791007041931, 0.00041072070598602295, 0.0004319623112678528, 0.0004532039165496826, 0.00047444552183151245, 0.0004956871271133423, 0.0005169287323951721, 0.000538170337677002, 0.0005594119429588318, 0.0005806535482406616, 0.0006018951535224915, 0.0006231367588043213, 0.0006443783640861511, 0.000665619969367981, 0.0006868615746498108, 0.0007081031799316406]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 7.0, 10.0, 18.0, 28.0, 46.0, 63.0, 115.0, 207.0, 423.0, 905.0, 1995.0, 4756.0, 13539.0, 50160.0, 276600.0, 539225.0, 120320.0, 26277.0, 7974.0, 3055.0, 1407.0, 631.0, 345.0, 169.0, 99.0, 56.0, 33.0, 22.0, 13.0, 12.0, 7.0, 4.0, 6.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.052734375, -1.0252227783203125, -0.997711181640625, -0.9701995849609375, -0.94268798828125, -0.9151763916015625, -0.887664794921875, -0.8601531982421875, -0.8326416015625, -0.8051300048828125, -0.777618408203125, -0.7501068115234375, -0.72259521484375, -0.6950836181640625, -0.667572021484375, -0.6400604248046875, -0.612548828125, -0.5850372314453125, -0.557525634765625, -0.5300140380859375, -0.50250244140625, -0.4749908447265625, -0.447479248046875, -0.4199676513671875, -0.3924560546875, -0.3649444580078125, -0.337432861328125, -0.3099212646484375, -0.28240966796875, -0.2548980712890625, -0.227386474609375, -0.1998748779296875, -0.17236328125, -0.1448516845703125, -0.117340087890625, -0.0898284912109375, -0.06231689453125, -0.0348052978515625, -0.007293701171875, 0.0202178955078125, 0.0477294921875, 0.0752410888671875, 0.102752685546875, 0.1302642822265625, 0.15777587890625, 0.1852874755859375, 0.212799072265625, 0.2403106689453125, 0.267822265625, 0.2953338623046875, 0.322845458984375, 0.3503570556640625, 0.37786865234375, 0.4053802490234375, 0.432891845703125, 0.4604034423828125, 0.4879150390625, 0.5154266357421875, 0.542938232421875, 0.5704498291015625, 0.59796142578125, 0.6254730224609375, 0.652984619140625, 0.6804962158203125, 0.7080078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 10.0, 7.0, 16.0, 19.0, 19.0, 27.0, 47.0, 50.0, 65.0, 86.0, 111.0, 91.0, 84.0, 78.0, 66.0, 44.0, 39.0, 27.0, 27.0, 19.0, 12.0, 12.0, 7.0, 6.0, 4.0, 8.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1790771484375, -0.17230796813964844, -0.16553878784179688, -0.1587696075439453, -0.15200042724609375, -0.1452312469482422, -0.13846206665039062, -0.13169288635253906, -0.1249237060546875, -0.11815452575683594, -0.11138534545898438, -0.10461616516113281, -0.09784698486328125, -0.09107780456542969, -0.08430862426757812, -0.07753944396972656, -0.070770263671875, -0.06400108337402344, -0.057231903076171875, -0.05046272277832031, -0.04369354248046875, -0.03692436218261719, -0.030155181884765625, -0.023386001586914062, -0.0166168212890625, -0.009847640991210938, -0.003078460693359375, 0.0036907196044921875, 0.01045989990234375, 0.017229080200195312, 0.023998260498046875, 0.030767440795898438, 0.03753662109375, 0.04430580139160156, 0.051074981689453125, 0.05784416198730469, 0.06461334228515625, 0.07138252258300781, 0.07815170288085938, 0.08492088317871094, 0.0916900634765625, 0.09845924377441406, 0.10522842407226562, 0.11199760437011719, 0.11876678466796875, 0.1255359649658203, 0.13230514526367188, 0.13907432556152344, 0.145843505859375, 0.15261268615722656, 0.15938186645507812, 0.1661510467529297, 0.17292022705078125, 0.1796894073486328, 0.18645858764648438, 0.19322776794433594, 0.1999969482421875, 0.20676612854003906, 0.21353530883789062, 0.2203044891357422, 0.22707366943359375, 0.2338428497314453, 0.24061203002929688, 0.24738121032714844, 0.254150390625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 14.0, 27.0, 48.0, 90.0, 168.0, 173.0, 188.0, 117.0, 69.0, 51.0, 20.0, 9.0, 8.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.88035774230957, -15.490616798400879, -15.100874900817871, -14.71113395690918, -14.321393013000488, -13.931652069091797, -13.541910171508789, -13.152169227600098, -12.762428283691406, -12.372687339782715, -11.982945442199707, -11.593204498291016, -11.203463554382324, -10.813722610473633, -10.423980712890625, -10.034239768981934, -9.644497871398926, -9.254756927490234, -8.865015029907227, -8.475274085998535, -8.085533142089844, -7.695791721343994, -7.3060503005981445, -6.916309356689453, -6.5265679359436035, -6.136826515197754, -5.7470855712890625, -5.357344150543213, -4.967602729797363, -4.577861785888672, -4.188120365142822, -3.7983791828155518, -3.4086389541625977, -3.018897771835327, -2.6291565895080566, -2.239415168762207, -1.8496739864349365, -1.459932804107666, -1.0701913833618164, -0.6804502010345459, -0.2907090187072754, 0.09903222322463989, 0.4887734651565552, 0.8785147666931152, 1.2682559490203857, 1.6579971313476562, 2.047738552093506, 2.4374797344207764, 2.827220916748047, 3.2169620990753174, 3.606703281402588, 3.9964447021484375, 4.386185646057129, 4.7759270668029785, 5.165668487548828, 5.5554094314575195, 5.945150852203369, 6.334892272949219, 6.72463321685791, 7.11437463760376, 7.504116058349609, 7.893857002258301, 8.283597946166992, 8.67333984375, 9.063080787658691]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 7.0, 13.0, 5.0, 13.0, 18.0, 19.0, 28.0, 33.0, 33.0, 40.0, 38.0, 45.0, 53.0, 59.0, 55.0, 66.0, 55.0, 57.0, 57.0, 52.0, 46.0, 35.0, 41.0, 26.0, 39.0, 16.0, 13.0, 13.0, 8.0, 10.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.13356876373291, -5.974535942077637, -5.815502643585205, -5.656469821929932, -5.4974365234375, -5.338403701782227, -5.179370403289795, -5.0203375816345215, -4.86130428314209, -4.702271461486816, -4.543238162994385, -4.384205341339111, -4.22517204284668, -4.066139221191406, -3.9071061611175537, -3.748073101043701, -3.5890402793884277, -3.430007219314575, -3.2709741592407227, -3.11194109916687, -2.9529080390930176, -2.793875217437744, -2.6348421573638916, -2.475809097290039, -2.3167760372161865, -2.157742977142334, -1.9987099170684814, -1.8396769762039185, -1.680643916130066, -1.5216108560562134, -1.3625779151916504, -1.2035448551177979, -1.0445117950439453, -0.8854787349700928, -0.726445734500885, -0.5674127340316772, -0.4083796739578247, -0.24934661388397217, -0.0903136134147644, 0.06871938705444336, 0.2277524471282959, 0.38678547739982605, 0.5458185076713562, 0.704851508140564, 0.8638845682144165, 1.022917628288269, 1.181950569152832, 1.3409836292266846, 1.500016689300537, 1.6590497493743896, 1.8180828094482422, 1.9771157503128052, 2.1361489295959473, 2.2951817512512207, 2.4542148113250732, 2.613247871398926, 2.7722809314727783, 2.931313991546631, 3.0903470516204834, 3.249380111694336, 3.4084129333496094, 3.567446231842041, 3.7264790534973145, 3.885512113571167, 4.0445451736450195]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 4.0, 6.0, 4.0, 5.0, 6.0, 5.0, 15.0, 12.0, 18.0, 23.0, 26.0, 54.0, 59.0, 165.0, 561.0, 2447.0, 18566.0, 276175.0, 698858.0, 45072.0, 5071.0, 864.0, 270.0, 80.0, 52.0, 33.0, 25.0, 16.0, 15.0, 10.0, 8.0, 7.0, 7.0, 6.0, 3.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.125, -10.7564697265625, -10.387939453125, -10.0194091796875, -9.65087890625, -9.2823486328125, -8.913818359375, -8.5452880859375, -8.1767578125, -7.8082275390625, -7.439697265625, -7.0711669921875, -6.70263671875, -6.3341064453125, -5.965576171875, -5.5970458984375, -5.228515625, -4.8599853515625, -4.491455078125, -4.1229248046875, -3.75439453125, -3.3858642578125, -3.017333984375, -2.6488037109375, -2.2802734375, -1.9117431640625, -1.543212890625, -1.1746826171875, -0.80615234375, -0.4376220703125, -0.069091796875, 0.2994384765625, 0.66796875, 1.0364990234375, 1.405029296875, 1.7735595703125, 2.14208984375, 2.5106201171875, 2.879150390625, 3.2476806640625, 3.6162109375, 3.9847412109375, 4.353271484375, 4.7218017578125, 5.09033203125, 5.4588623046875, 5.827392578125, 6.1959228515625, 6.564453125, 6.9329833984375, 7.301513671875, 7.6700439453125, 8.03857421875, 8.4071044921875, 8.775634765625, 9.1441650390625, 9.5126953125, 9.8812255859375, 10.249755859375, 10.6182861328125, 10.98681640625, 11.3553466796875, 11.723876953125, 12.0924072265625, 12.4609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 13.0, 9.0, 11.0, 16.0, 19.0, 20.0, 27.0, 33.0, 26.0, 47.0, 41.0, 38.0, 38.0, 57.0, 52.0, 61.0, 46.0, 64.0, 46.0, 52.0, 42.0, 37.0, 37.0, 36.0, 24.0, 22.0, 24.0, 15.0, 11.0, 14.0, 7.0, 3.0, 5.0, 1.0, 4.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.359375, -11.042236328125, -10.72509765625, -10.407958984375, -10.0908203125, -9.773681640625, -9.45654296875, -9.139404296875, -8.822265625, -8.505126953125, -8.18798828125, -7.870849609375, -7.5537109375, -7.236572265625, -6.91943359375, -6.602294921875, -6.28515625, -5.968017578125, -5.65087890625, -5.333740234375, -5.0166015625, -4.699462890625, -4.38232421875, -4.065185546875, -3.748046875, -3.430908203125, -3.11376953125, -2.796630859375, -2.4794921875, -2.162353515625, -1.84521484375, -1.528076171875, -1.2109375, -0.893798828125, -0.57666015625, -0.259521484375, 0.0576171875, 0.374755859375, 0.69189453125, 1.009033203125, 1.326171875, 1.643310546875, 1.96044921875, 2.277587890625, 2.5947265625, 2.911865234375, 3.22900390625, 3.546142578125, 3.86328125, 4.180419921875, 4.49755859375, 4.814697265625, 5.1318359375, 5.448974609375, 5.76611328125, 6.083251953125, 6.400390625, 6.717529296875, 7.03466796875, 7.351806640625, 7.6689453125, 7.986083984375, 8.30322265625, 8.620361328125, 8.9375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 8.0, 10.0, 7.0, 9.0, 28.0, 25.0, 50.0, 61.0, 96.0, 127.0, 203.0, 420.0, 851.0, 1842.0, 5714.0, 23064.0, 139789.0, 636903.0, 198527.0, 30024.0, 6746.0, 2111.0, 892.0, 427.0, 207.0, 139.0, 96.0, 49.0, 43.0, 22.0, 24.0, 15.0, 9.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.17578125, -4.9881591796875, -4.800537109375, -4.6129150390625, -4.42529296875, -4.2376708984375, -4.050048828125, -3.8624267578125, -3.6748046875, -3.4871826171875, -3.299560546875, -3.1119384765625, -2.92431640625, -2.7366943359375, -2.549072265625, -2.3614501953125, -2.173828125, -1.9862060546875, -1.798583984375, -1.6109619140625, -1.42333984375, -1.2357177734375, -1.048095703125, -0.8604736328125, -0.6728515625, -0.4852294921875, -0.297607421875, -0.1099853515625, 0.07763671875, 0.2652587890625, 0.452880859375, 0.6405029296875, 0.828125, 1.0157470703125, 1.203369140625, 1.3909912109375, 1.57861328125, 1.7662353515625, 1.953857421875, 2.1414794921875, 2.3291015625, 2.5167236328125, 2.704345703125, 2.8919677734375, 3.07958984375, 3.2672119140625, 3.454833984375, 3.6424560546875, 3.830078125, 4.0177001953125, 4.205322265625, 4.3929443359375, 4.58056640625, 4.7681884765625, 4.955810546875, 5.1434326171875, 5.3310546875, 5.5186767578125, 5.706298828125, 5.8939208984375, 6.08154296875, 6.2691650390625, 6.456787109375, 6.6444091796875, 6.83203125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 8.0, 5.0, 4.0, 12.0, 17.0, 14.0, 14.0, 28.0, 24.0, 19.0, 27.0, 34.0, 36.0, 35.0, 39.0, 34.0, 30.0, 42.0, 42.0, 41.0, 47.0, 38.0, 50.0, 38.0, 37.0, 46.0, 31.0, 30.0, 21.0, 25.0, 18.0, 20.0, 20.0, 15.0, 11.0, 10.0, 9.0, 7.0, 8.0, 2.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.7578125, -11.435546875, -11.11328125, -10.791015625, -10.46875, -10.146484375, -9.82421875, -9.501953125, -9.1796875, -8.857421875, -8.53515625, -8.212890625, -7.890625, -7.568359375, -7.24609375, -6.923828125, -6.6015625, -6.279296875, -5.95703125, -5.634765625, -5.3125, -4.990234375, -4.66796875, -4.345703125, -4.0234375, -3.701171875, -3.37890625, -3.056640625, -2.734375, -2.412109375, -2.08984375, -1.767578125, -1.4453125, -1.123046875, -0.80078125, -0.478515625, -0.15625, 0.166015625, 0.48828125, 0.810546875, 1.1328125, 1.455078125, 1.77734375, 2.099609375, 2.421875, 2.744140625, 3.06640625, 3.388671875, 3.7109375, 4.033203125, 4.35546875, 4.677734375, 5.0, 5.322265625, 5.64453125, 5.966796875, 6.2890625, 6.611328125, 6.93359375, 7.255859375, 7.578125, 7.900390625, 8.22265625, 8.544921875, 8.8671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 7.0, 14.0, 16.0, 20.0, 32.0, 59.0, 80.0, 126.0, 231.0, 484.0, 1009.0, 2480.0, 6450.0, 22603.0, 105747.0, 547424.0, 288169.0, 53130.0, 12785.0, 4304.0, 1676.0, 800.0, 405.0, 208.0, 120.0, 62.0, 47.0, 23.0, 12.0, 11.0, 5.0, 6.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.0435791015625, -1.989501953125, -1.9354248046875, -1.88134765625, -1.8272705078125, -1.773193359375, -1.7191162109375, -1.6650390625, -1.6109619140625, -1.556884765625, -1.5028076171875, -1.44873046875, -1.3946533203125, -1.340576171875, -1.2864990234375, -1.232421875, -1.1783447265625, -1.124267578125, -1.0701904296875, -1.01611328125, -0.9620361328125, -0.907958984375, -0.8538818359375, -0.7998046875, -0.7457275390625, -0.691650390625, -0.6375732421875, -0.58349609375, -0.5294189453125, -0.475341796875, -0.4212646484375, -0.3671875, -0.3131103515625, -0.259033203125, -0.2049560546875, -0.15087890625, -0.0968017578125, -0.042724609375, 0.0113525390625, 0.0654296875, 0.1195068359375, 0.173583984375, 0.2276611328125, 0.28173828125, 0.3358154296875, 0.389892578125, 0.4439697265625, 0.498046875, 0.5521240234375, 0.606201171875, 0.6602783203125, 0.71435546875, 0.7684326171875, 0.822509765625, 0.8765869140625, 0.9306640625, 0.9847412109375, 1.038818359375, 1.0928955078125, 1.14697265625, 1.2010498046875, 1.255126953125, 1.3092041015625, 1.36328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 6.0, 2.0, 4.0, 5.0, 5.0, 9.0, 9.0, 5.0, 15.0, 12.0, 16.0, 25.0, 27.0, 42.0, 33.0, 45.0, 59.0, 60.0, 76.0, 104.0, 88.0, 61.0, 56.0, 43.0, 36.0, 23.0, 30.0, 24.0, 15.0, 18.0, 9.0, 7.0, 8.0, 4.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001875162124633789, -0.00018114037811756134, -0.00017476454377174377, -0.0001683887094259262, -0.00016201287508010864, -0.00015563704073429108, -0.0001492612063884735, -0.00014288537204265594, -0.00013650953769683838, -0.0001301337033510208, -0.00012375786900520325, -0.00011738203465938568, -0.00011100620031356812, -0.00010463036596775055, -9.825453162193298e-05, -9.187869727611542e-05, -8.550286293029785e-05, -7.912702858448029e-05, -7.275119423866272e-05, -6.637535989284515e-05, -5.999952554702759e-05, -5.362369120121002e-05, -4.7247856855392456e-05, -4.087202250957489e-05, -3.4496188163757324e-05, -2.8120353817939758e-05, -2.1744519472122192e-05, -1.5368685126304626e-05, -8.99285078048706e-06, -2.6170164346694946e-06, 3.7588179111480713e-06, 1.0134652256965637e-05, 1.6510486602783203e-05, 2.288632094860077e-05, 2.9262155294418335e-05, 3.56379896402359e-05, 4.201382398605347e-05, 4.838965833187103e-05, 5.47654926776886e-05, 6.114132702350616e-05, 6.751716136932373e-05, 7.38929957151413e-05, 8.026883006095886e-05, 8.664466440677643e-05, 9.3020498752594e-05, 9.939633309841156e-05, 0.00010577216744422913, 0.00011214800179004669, 0.00011852383613586426, 0.00012489967048168182, 0.0001312755048274994, 0.00013765133917331696, 0.00014402717351913452, 0.0001504030078649521, 0.00015677884221076965, 0.00016315467655658722, 0.00016953051090240479, 0.00017590634524822235, 0.00018228217959403992, 0.00018865801393985748, 0.00019503384828567505, 0.00020140968263149261, 0.00020778551697731018, 0.00021416135132312775, 0.0002205371856689453]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 8.0, 7.0, 22.0, 21.0, 45.0, 67.0, 131.0, 227.0, 466.0, 1109.0, 3098.0, 11253.0, 55121.0, 354412.0, 519641.0, 80920.0, 15324.0, 4131.0, 1402.0, 519.0, 264.0, 139.0, 87.0, 44.0, 25.0, 15.0, 14.0, 9.0, 9.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7724609375, -1.7115631103515625, -1.650665283203125, -1.5897674560546875, -1.52886962890625, -1.4679718017578125, -1.407073974609375, -1.3461761474609375, -1.2852783203125, -1.2243804931640625, -1.163482666015625, -1.1025848388671875, -1.04168701171875, -0.9807891845703125, -0.919891357421875, -0.8589935302734375, -0.798095703125, -0.7371978759765625, -0.676300048828125, -0.6154022216796875, -0.55450439453125, -0.4936065673828125, -0.432708740234375, -0.3718109130859375, -0.3109130859375, -0.2500152587890625, -0.189117431640625, -0.1282196044921875, -0.06732177734375, -0.0064239501953125, 0.054473876953125, 0.1153717041015625, 0.17626953125, 0.2371673583984375, 0.298065185546875, 0.3589630126953125, 0.41986083984375, 0.4807586669921875, 0.541656494140625, 0.6025543212890625, 0.6634521484375, 0.7243499755859375, 0.785247802734375, 0.8461456298828125, 0.90704345703125, 0.9679412841796875, 1.028839111328125, 1.0897369384765625, 1.150634765625, 1.2115325927734375, 1.272430419921875, 1.3333282470703125, 1.39422607421875, 1.4551239013671875, 1.516021728515625, 1.5769195556640625, 1.6378173828125, 1.6987152099609375, 1.759613037109375, 1.8205108642578125, 1.88140869140625, 1.9423065185546875, 2.003204345703125, 2.0641021728515625, 2.125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 4.0, 10.0, 5.0, 5.0, 6.0, 16.0, 14.0, 26.0, 19.0, 29.0, 39.0, 34.0, 53.0, 69.0, 72.0, 81.0, 94.0, 79.0, 69.0, 49.0, 52.0, 35.0, 27.0, 16.0, 17.0, 14.0, 12.0, 10.0, 13.0, 6.0, 4.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.84423828125, -0.8185577392578125, -0.792877197265625, -0.7671966552734375, -0.74151611328125, -0.7158355712890625, -0.690155029296875, -0.6644744873046875, -0.6387939453125, -0.6131134033203125, -0.587432861328125, -0.5617523193359375, -0.53607177734375, -0.5103912353515625, -0.484710693359375, -0.4590301513671875, -0.433349609375, -0.4076690673828125, -0.381988525390625, -0.3563079833984375, -0.33062744140625, -0.3049468994140625, -0.279266357421875, -0.2535858154296875, -0.2279052734375, -0.2022247314453125, -0.176544189453125, -0.1508636474609375, -0.12518310546875, -0.0995025634765625, -0.073822021484375, -0.0481414794921875, -0.0224609375, 0.0032196044921875, 0.028900146484375, 0.0545806884765625, 0.08026123046875, 0.1059417724609375, 0.131622314453125, 0.1573028564453125, 0.1829833984375, 0.2086639404296875, 0.234344482421875, 0.2600250244140625, 0.28570556640625, 0.3113861083984375, 0.337066650390625, 0.3627471923828125, 0.388427734375, 0.4141082763671875, 0.439788818359375, 0.4654693603515625, 0.49114990234375, 0.5168304443359375, 0.542510986328125, 0.5681915283203125, 0.5938720703125, 0.6195526123046875, 0.645233154296875, 0.6709136962890625, 0.69659423828125, 0.7222747802734375, 0.747955322265625, 0.7736358642578125, 0.79931640625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 15.0, 64.0, 219.0, 381.0, 229.0, 75.0, 14.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.112619400024414, -27.448816299438477, -25.78501319885254, -24.121212005615234, -22.457408905029297, -20.79360580444336, -19.129802703857422, -17.465999603271484, -15.802197456359863, -14.138394355773926, -12.474592208862305, -10.810789108276367, -9.14698600769043, -7.483183860778809, -5.819380760192871, -4.15557861328125, -2.4917755126953125, -0.8279727697372437, 0.8358299732208252, 2.4996328353881836, 4.163435459136963, 5.827238082885742, 7.49104118347168, 9.1548433303833, 10.818646430969238, 12.482449531555176, 14.146251678466797, 15.810054779052734, 17.473857879638672, 19.13766098022461, 20.801464080810547, 22.46526527404785, 24.129070281982422, 25.79287338256836, 27.456676483154297, 29.120479583740234, 30.78428077697754, 32.448081970214844, 34.11188507080078, 35.77568817138672, 37.439491271972656, 39.103294372558594, 40.76709747314453, 42.43090057373047, 44.094703674316406, 45.758506774902344, 47.42230987548828, 49.08610916137695, 50.749916076660156, 52.413719177246094, 54.07752227783203, 55.74132537841797, 57.405128479003906, 59.068931579589844, 60.73273468017578, 62.39653396606445, 64.06033325195312, 65.72413635253906, 67.387939453125, 69.05174255371094, 70.71554565429688, 72.37934875488281, 74.04315185546875, 75.70695495605469, 77.37075805664062]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 4.0, 3.0, 3.0, 7.0, 10.0, 18.0, 19.0, 16.0, 16.0, 17.0, 14.0, 20.0, 34.0, 26.0, 29.0, 47.0, 35.0, 45.0, 25.0, 36.0, 37.0, 38.0, 41.0, 47.0, 42.0, 46.0, 41.0, 34.0, 38.0, 29.0, 32.0, 20.0, 20.0, 22.0, 15.0, 15.0, 13.0, 4.0, 10.0, 7.0, 8.0, 6.0, 3.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-18.047809600830078, -17.506608963012695, -16.965408325195312, -16.424209594726562, -15.88300895690918, -15.341808319091797, -14.80060863494873, -14.259408950805664, -13.718208312988281, -13.177007675170898, -12.635807991027832, -12.094608306884766, -11.553407669067383, -11.01220703125, -10.471007347106934, -9.929807662963867, -9.388607025146484, -8.847406387329102, -8.306206703186035, -7.7650065422058105, -7.223806381225586, -6.682606220245361, -6.141406059265137, -5.600205898284912, -5.0590057373046875, -4.517805576324463, -3.9766054153442383, -3.4354052543640137, -2.894205093383789, -2.3530049324035645, -1.8118047714233398, -1.2706046104431152, -0.7294025421142578, -0.1882023811340332, 0.3529977798461914, 0.894197940826416, 1.4353981018066406, 1.9765982627868652, 2.51779842376709, 3.0589985847473145, 3.600198745727539, 4.141398906707764, 4.682599067687988, 5.223799228668213, 5.7649993896484375, 6.306199550628662, 6.847399711608887, 7.388599872589111, 7.929800033569336, 8.471000671386719, 9.012200355529785, 9.553400039672852, 10.094600677490234, 10.635801315307617, 11.177000999450684, 11.71820068359375, 12.259401321411133, 12.800601959228516, 13.341801643371582, 13.883001327514648, 14.424201965332031, 14.965402603149414, 15.50660228729248, 16.047801971435547, 16.58900260925293]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 8.0, 3.0, 10.0, 8.0, 10.0, 17.0, 22.0, 44.0, 44.0, 66.0, 103.0, 109.0, 171.0, 280.0, 446.0, 675.0, 1095.0, 1780.0, 3463.0, 6642.0, 14641.0, 39450.0, 137604.0, 618186.0, 2092646.0, 974312.0, 211431.0, 54216.0, 18738.0, 8149.0, 4190.0, 2263.0, 1255.0, 755.0, 486.0, 327.0, 197.0, 137.0, 82.0, 74.0, 43.0, 25.0, 28.0, 10.0, 17.0, 6.0, 7.0, 9.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.81640625, -5.64349365234375, -5.4705810546875, -5.29766845703125, -5.124755859375, -4.95184326171875, -4.7789306640625, -4.60601806640625, -4.43310546875, -4.26019287109375, -4.0872802734375, -3.91436767578125, -3.741455078125, -3.56854248046875, -3.3956298828125, -3.22271728515625, -3.0498046875, -2.87689208984375, -2.7039794921875, -2.53106689453125, -2.358154296875, -2.18524169921875, -2.0123291015625, -1.83941650390625, -1.66650390625, -1.49359130859375, -1.3206787109375, -1.14776611328125, -0.974853515625, -0.80194091796875, -0.6290283203125, -0.45611572265625, -0.283203125, -0.11029052734375, 0.0626220703125, 0.23553466796875, 0.408447265625, 0.58135986328125, 0.7542724609375, 0.92718505859375, 1.10009765625, 1.27301025390625, 1.4459228515625, 1.61883544921875, 1.791748046875, 1.96466064453125, 2.1375732421875, 2.31048583984375, 2.4833984375, 2.65631103515625, 2.8292236328125, 3.00213623046875, 3.175048828125, 3.34796142578125, 3.5208740234375, 3.69378662109375, 3.86669921875, 4.03961181640625, 4.2125244140625, 4.38543701171875, 4.558349609375, 4.73126220703125, 4.9041748046875, 5.07708740234375, 5.25]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 9.0, 6.0, 10.0, 18.0, 21.0, 34.0, 44.0, 38.0, 41.0, 45.0, 47.0, 63.0, 62.0, 76.0, 78.0, 87.0, 60.0, 61.0, 43.0, 30.0, 30.0, 22.0, 19.0, 17.0, 15.0, 8.0, 5.0, 7.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.4765625, -10.2303466796875, -9.984130859375, -9.7379150390625, -9.49169921875, -9.2454833984375, -8.999267578125, -8.7530517578125, -8.5068359375, -8.2606201171875, -8.014404296875, -7.7681884765625, -7.52197265625, -7.2757568359375, -7.029541015625, -6.7833251953125, -6.537109375, -6.2908935546875, -6.044677734375, -5.7984619140625, -5.55224609375, -5.3060302734375, -5.059814453125, -4.8135986328125, -4.5673828125, -4.3211669921875, -4.074951171875, -3.8287353515625, -3.58251953125, -3.3363037109375, -3.090087890625, -2.8438720703125, -2.59765625, -2.3514404296875, -2.105224609375, -1.8590087890625, -1.61279296875, -1.3665771484375, -1.120361328125, -0.8741455078125, -0.6279296875, -0.3817138671875, -0.135498046875, 0.1107177734375, 0.35693359375, 0.6031494140625, 0.849365234375, 1.0955810546875, 1.341796875, 1.5880126953125, 1.834228515625, 2.0804443359375, 2.32666015625, 2.5728759765625, 2.819091796875, 3.0653076171875, 3.3115234375, 3.5577392578125, 3.803955078125, 4.0501708984375, 4.29638671875, 4.5426025390625, 4.788818359375, 5.0350341796875, 5.28125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 0.0, 1.0, 3.0, 8.0, 3.0, 7.0, 14.0, 12.0, 11.0, 29.0, 39.0, 44.0, 76.0, 146.0, 191.0, 369.0, 701.0, 1518.0, 3988.0, 12990.0, 58849.0, 572899.0, 3226856.0, 264678.0, 36644.0, 8766.0, 2892.0, 1192.0, 558.0, 313.0, 166.0, 93.0, 63.0, 53.0, 28.0, 23.0, 13.0, 6.0, 14.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-8.6640625, -8.41192626953125, -8.1597900390625, -7.90765380859375, -7.655517578125, -7.40338134765625, -7.1512451171875, -6.89910888671875, -6.64697265625, -6.39483642578125, -6.1427001953125, -5.89056396484375, -5.638427734375, -5.38629150390625, -5.1341552734375, -4.88201904296875, -4.6298828125, -4.37774658203125, -4.1256103515625, -3.87347412109375, -3.621337890625, -3.36920166015625, -3.1170654296875, -2.86492919921875, -2.61279296875, -2.36065673828125, -2.1085205078125, -1.85638427734375, -1.604248046875, -1.35211181640625, -1.0999755859375, -0.84783935546875, -0.595703125, -0.34356689453125, -0.0914306640625, 0.16070556640625, 0.412841796875, 0.66497802734375, 0.9171142578125, 1.16925048828125, 1.42138671875, 1.67352294921875, 1.9256591796875, 2.17779541015625, 2.429931640625, 2.68206787109375, 2.9342041015625, 3.18634033203125, 3.4384765625, 3.69061279296875, 3.9427490234375, 4.19488525390625, 4.447021484375, 4.69915771484375, 4.9512939453125, 5.20343017578125, 5.45556640625, 5.70770263671875, 5.9598388671875, 6.21197509765625, 6.464111328125, 6.71624755859375, 6.9683837890625, 7.22052001953125, 7.47265625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 10.0, 6.0, 10.0, 11.0, 13.0, 13.0, 26.0, 38.0, 38.0, 55.0, 79.0, 146.0, 189.0, 262.0, 386.0, 561.0, 637.0, 459.0, 352.0, 239.0, 134.0, 102.0, 68.0, 62.0, 47.0, 31.0, 25.0, 20.0, 9.0, 7.0, 9.0, 2.0, 11.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.751953125, -1.685455322265625, -1.61895751953125, -1.552459716796875, -1.4859619140625, -1.419464111328125, -1.35296630859375, -1.286468505859375, -1.219970703125, -1.153472900390625, -1.08697509765625, -1.020477294921875, -0.9539794921875, -0.887481689453125, -0.82098388671875, -0.754486083984375, -0.68798828125, -0.621490478515625, -0.55499267578125, -0.488494873046875, -0.4219970703125, -0.355499267578125, -0.28900146484375, -0.222503662109375, -0.156005859375, -0.089508056640625, -0.02301025390625, 0.043487548828125, 0.1099853515625, 0.176483154296875, 0.24298095703125, 0.309478759765625, 0.3759765625, 0.442474365234375, 0.50897216796875, 0.575469970703125, 0.6419677734375, 0.708465576171875, 0.77496337890625, 0.841461181640625, 0.907958984375, 0.974456787109375, 1.04095458984375, 1.107452392578125, 1.1739501953125, 1.240447998046875, 1.30694580078125, 1.373443603515625, 1.43994140625, 1.506439208984375, 1.57293701171875, 1.639434814453125, 1.7059326171875, 1.772430419921875, 1.83892822265625, 1.905426025390625, 1.971923828125, 2.038421630859375, 2.10491943359375, 2.171417236328125, 2.2379150390625, 2.304412841796875, 2.37091064453125, 2.437408447265625, 2.50390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 5.0, 9.0, 16.0, 16.0, 29.0, 32.0, 45.0, 61.0, 114.0, 99.0, 116.0, 95.0, 99.0, 68.0, 56.0, 36.0, 19.0, 22.0, 20.0, 14.0, 6.0, 5.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.985001564025879, -13.64832878112793, -13.31165599822998, -12.974983215332031, -12.638311386108398, -12.30163860321045, -11.9649658203125, -11.62829303741455, -11.291620254516602, -10.954947471618652, -10.618274688720703, -10.28160285949707, -9.944930076599121, -9.608257293701172, -9.271584510803223, -8.934911727905273, -8.59823989868164, -8.261567115783691, -7.9248948097229, -7.588222026824951, -7.25154972076416, -6.914876937866211, -6.578204154968262, -6.2415313720703125, -5.9048590660095215, -5.568186283111572, -5.231513977050781, -4.894841194152832, -4.558168411254883, -4.221496105194092, -3.8848233222961426, -3.5481507778167725, -3.2114782333374023, -2.8748056888580322, -2.538133144378662, -2.201460361480713, -1.8647878170013428, -1.5281152725219727, -1.1914424896240234, -0.8547699451446533, -0.5180974006652832, -0.1814247965812683, 0.15524780750274658, 0.49192047119140625, 0.8285930156707764, 1.1652655601501465, 1.5019383430480957, 1.8386108875274658, 2.175283432006836, 2.511955976486206, 2.848628520965576, 3.1853013038635254, 3.5219738483428955, 3.8586463928222656, 4.195319175720215, 4.531991958618164, 4.868664264678955, 5.205337047576904, 5.542009353637695, 5.8786821365356445, 6.215354919433594, 6.552027225494385, 6.888700008392334, 7.225372314453125, 7.562045097351074]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 8.0, 7.0, 6.0, 18.0, 18.0, 26.0, 17.0, 18.0, 27.0, 29.0, 33.0, 36.0, 46.0, 40.0, 42.0, 36.0, 46.0, 31.0, 49.0, 36.0, 32.0, 37.0, 34.0, 37.0, 32.0, 29.0, 22.0, 35.0, 30.0, 19.0, 19.0, 16.0, 14.0, 7.0, 11.0, 9.0, 11.0, 6.0, 5.0, 2.0, 3.0, 2.0, 4.0, 4.0], "bins": [-6.488039970397949, -6.322866916656494, -6.157694339752197, -5.992521286010742, -5.827348709106445, -5.66217565536499, -5.497002601623535, -5.331830024719238, -5.166656970977783, -5.001483917236328, -4.836311340332031, -4.671138286590576, -4.505965709686279, -4.340792655944824, -4.175620079040527, -4.010447025299072, -3.8452742099761963, -3.6801013946533203, -3.5149285793304443, -3.3497557640075684, -3.1845827102661133, -3.0194098949432373, -2.8542370796203613, -2.6890640258789062, -2.5238914489746094, -2.3587186336517334, -2.1935458183288574, -2.0283727645874023, -1.8631999492645264, -1.6980271339416504, -1.5328543186187744, -1.3676813840866089, -1.2025084495544434, -1.0373356342315674, -0.8721626996994019, -0.7069898843765259, -0.5418170094490051, -0.3766441345214844, -0.2114713191986084, -0.04629838466644287, 0.1188744306564331, 0.28404730558395386, 0.4492201507091522, 0.6143929958343506, 0.7795658707618713, 0.9447387456893921, 1.109911561012268, 1.2750844955444336, 1.4402573108673096, 1.6054301261901855, 1.770603060722351, 1.935775876045227, 2.1009488105773926, 2.2661216259002686, 2.4312944412231445, 2.5964674949645996, 2.7616400718688965, 2.9268128871917725, 3.0919857025146484, 3.2571587562561035, 3.4223315715789795, 3.5875043869018555, 3.7526772022247314, 3.9178500175476074, 4.0830230712890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 14.0, 9.0, 19.0, 27.0, 37.0, 50.0, 77.0, 121.0, 175.0, 300.0, 507.0, 824.0, 1583.0, 2845.0, 5513.0, 11243.0, 24065.0, 54810.0, 123629.0, 235932.0, 272076.0, 169971.0, 78764.0, 34404.0, 15496.0, 7456.0, 3781.0, 2004.0, 1097.0, 657.0, 384.0, 246.0, 138.0, 105.0, 66.0, 39.0, 34.0, 22.0, 13.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.67431640625, -0.6512374877929688, -0.6281585693359375, -0.6050796508789062, -0.582000732421875, -0.5589218139648438, -0.5358428955078125, -0.5127639770507812, -0.48968505859375, -0.46660614013671875, -0.4435272216796875, -0.42044830322265625, -0.397369384765625, -0.37429046630859375, -0.3512115478515625, -0.32813262939453125, -0.3050537109375, -0.28197479248046875, -0.2588958740234375, -0.23581695556640625, -0.212738037109375, -0.18965911865234375, -0.1665802001953125, -0.14350128173828125, -0.12042236328125, -0.09734344482421875, -0.0742645263671875, -0.05118560791015625, -0.028106689453125, -0.00502777099609375, 0.0180511474609375, 0.04113006591796875, 0.064208984375, 0.08728790283203125, 0.1103668212890625, 0.13344573974609375, 0.156524658203125, 0.17960357666015625, 0.2026824951171875, 0.22576141357421875, 0.24884033203125, 0.27191925048828125, 0.2949981689453125, 0.31807708740234375, 0.341156005859375, 0.36423492431640625, 0.3873138427734375, 0.41039276123046875, 0.4334716796875, 0.45655059814453125, 0.4796295166015625, 0.5027084350585938, 0.525787353515625, 0.5488662719726562, 0.5719451904296875, 0.5950241088867188, 0.61810302734375, 0.6411819458007812, 0.6642608642578125, 0.6873397827148438, 0.710418701171875, 0.7334976196289062, 0.7565765380859375, 0.7796554565429688, 0.802734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 8.0, 11.0, 22.0, 14.0, 22.0, 21.0, 34.0, 32.0, 35.0, 46.0, 38.0, 37.0, 52.0, 54.0, 60.0, 65.0, 34.0, 36.0, 40.0, 49.0, 41.0, 40.0, 33.0, 28.0, 25.0, 22.0, 21.0, 16.0, 8.0, 14.0, 10.0, 9.0, 5.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-4.91015625, -4.785400390625, -4.66064453125, -4.535888671875, -4.4111328125, -4.286376953125, -4.16162109375, -4.036865234375, -3.912109375, -3.787353515625, -3.66259765625, -3.537841796875, -3.4130859375, -3.288330078125, -3.16357421875, -3.038818359375, -2.9140625, -2.789306640625, -2.66455078125, -2.539794921875, -2.4150390625, -2.290283203125, -2.16552734375, -2.040771484375, -1.916015625, -1.791259765625, -1.66650390625, -1.541748046875, -1.4169921875, -1.292236328125, -1.16748046875, -1.042724609375, -0.91796875, -0.793212890625, -0.66845703125, -0.543701171875, -0.4189453125, -0.294189453125, -0.16943359375, -0.044677734375, 0.080078125, 0.204833984375, 0.32958984375, 0.454345703125, 0.5791015625, 0.703857421875, 0.82861328125, 0.953369140625, 1.078125, 1.202880859375, 1.32763671875, 1.452392578125, 1.5771484375, 1.701904296875, 1.82666015625, 1.951416015625, 2.076171875, 2.200927734375, 2.32568359375, 2.450439453125, 2.5751953125, 2.699951171875, 2.82470703125, 2.949462890625, 3.07421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 8.0, 12.0, 9.0, 22.0, 21.0, 43.0, 64.0, 102.0, 163.0, 310.0, 555.0, 1123.0, 2911.0, 8454.0, 31948.0, 145385.0, 455000.0, 305079.0, 71856.0, 16691.0, 5044.0, 1854.0, 840.0, 445.0, 237.0, 133.0, 90.0, 58.0, 32.0, 23.0, 16.0, 9.0, 6.0, 4.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2060546875, -1.1680908203125, -1.130126953125, -1.0921630859375, -1.05419921875, -1.0162353515625, -0.978271484375, -0.9403076171875, -0.90234375, -0.8643798828125, -0.826416015625, -0.7884521484375, -0.75048828125, -0.7125244140625, -0.674560546875, -0.6365966796875, -0.5986328125, -0.5606689453125, -0.522705078125, -0.4847412109375, -0.44677734375, -0.4088134765625, -0.370849609375, -0.3328857421875, -0.294921875, -0.2569580078125, -0.218994140625, -0.1810302734375, -0.14306640625, -0.1051025390625, -0.067138671875, -0.0291748046875, 0.0087890625, 0.0467529296875, 0.084716796875, 0.1226806640625, 0.16064453125, 0.1986083984375, 0.236572265625, 0.2745361328125, 0.3125, 0.3504638671875, 0.388427734375, 0.4263916015625, 0.46435546875, 0.5023193359375, 0.540283203125, 0.5782470703125, 0.6162109375, 0.6541748046875, 0.692138671875, 0.7301025390625, 0.76806640625, 0.8060302734375, 0.843994140625, 0.8819580078125, 0.919921875, 0.9578857421875, 0.995849609375, 1.0338134765625, 1.07177734375, 1.1097412109375, 1.147705078125, 1.1856689453125, 1.2236328125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 5.0, 9.0, 8.0, 5.0, 16.0, 20.0, 16.0, 28.0, 25.0, 46.0, 45.0, 52.0, 53.0, 51.0, 68.0, 36.0, 51.0, 52.0, 58.0, 56.0, 47.0, 54.0, 31.0, 30.0, 20.0, 23.0, 13.0, 21.0, 15.0, 12.0, 3.0, 9.0, 5.0, 3.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-10.2578125, -9.982666015625, -9.70751953125, -9.432373046875, -9.1572265625, -8.882080078125, -8.60693359375, -8.331787109375, -8.056640625, -7.781494140625, -7.50634765625, -7.231201171875, -6.9560546875, -6.680908203125, -6.40576171875, -6.130615234375, -5.85546875, -5.580322265625, -5.30517578125, -5.030029296875, -4.7548828125, -4.479736328125, -4.20458984375, -3.929443359375, -3.654296875, -3.379150390625, -3.10400390625, -2.828857421875, -2.5537109375, -2.278564453125, -2.00341796875, -1.728271484375, -1.453125, -1.177978515625, -0.90283203125, -0.627685546875, -0.3525390625, -0.077392578125, 0.19775390625, 0.472900390625, 0.748046875, 1.023193359375, 1.29833984375, 1.573486328125, 1.8486328125, 2.123779296875, 2.39892578125, 2.674072265625, 2.94921875, 3.224365234375, 3.49951171875, 3.774658203125, 4.0498046875, 4.324951171875, 4.60009765625, 4.875244140625, 5.150390625, 5.425537109375, 5.70068359375, 5.975830078125, 6.2509765625, 6.526123046875, 6.80126953125, 7.076416015625, 7.3515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 11.0, 16.0, 22.0, 37.0, 61.0, 131.0, 253.0, 486.0, 1096.0, 2804.0, 9125.0, 39693.0, 261361.0, 588574.0, 115048.0, 20927.0, 5521.0, 1844.0, 727.0, 364.0, 187.0, 110.0, 62.0, 29.0, 23.0, 8.0, 9.0, 6.0, 2.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8056640625, -0.781463623046875, -0.75726318359375, -0.733062744140625, -0.7088623046875, -0.684661865234375, -0.66046142578125, -0.636260986328125, -0.612060546875, -0.587860107421875, -0.56365966796875, -0.539459228515625, -0.5152587890625, -0.491058349609375, -0.46685791015625, -0.442657470703125, -0.41845703125, -0.394256591796875, -0.37005615234375, -0.345855712890625, -0.3216552734375, -0.297454833984375, -0.27325439453125, -0.249053955078125, -0.224853515625, -0.200653076171875, -0.17645263671875, -0.152252197265625, -0.1280517578125, -0.103851318359375, -0.07965087890625, -0.055450439453125, -0.03125, -0.007049560546875, 0.01715087890625, 0.041351318359375, 0.0655517578125, 0.089752197265625, 0.11395263671875, 0.138153076171875, 0.162353515625, 0.186553955078125, 0.21075439453125, 0.234954833984375, 0.2591552734375, 0.283355712890625, 0.30755615234375, 0.331756591796875, 0.35595703125, 0.380157470703125, 0.40435791015625, 0.428558349609375, 0.4527587890625, 0.476959228515625, 0.50115966796875, 0.525360107421875, 0.549560546875, 0.573760986328125, 0.59796142578125, 0.622161865234375, 0.6463623046875, 0.670562744140625, 0.69476318359375, 0.718963623046875, 0.7431640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 5.0, 13.0, 16.0, 15.0, 25.0, 28.0, 39.0, 37.0, 55.0, 90.0, 87.0, 94.0, 93.0, 98.0, 61.0, 47.0, 40.0, 39.0, 33.0, 20.0, 17.0, 11.0, 7.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002295970916748047, -0.00022165104746818542, -0.00021370500326156616, -0.0002057589590549469, -0.00019781291484832764, -0.00018986687064170837, -0.0001819208264350891, -0.00017397478222846985, -0.00016602873802185059, -0.00015808269381523132, -0.00015013664960861206, -0.0001421906054019928, -0.00013424456119537354, -0.00012629851698875427, -0.00011835247278213501, -0.00011040642857551575, -0.00010246038436889648, -9.451434016227722e-05, -8.656829595565796e-05, -7.86222517490387e-05, -7.067620754241943e-05, -6.273016333580017e-05, -5.478411912918091e-05, -4.6838074922561646e-05, -3.889203071594238e-05, -3.094598650932312e-05, -2.2999942302703857e-05, -1.5053898096084595e-05, -7.107853889465332e-06, 8.381903171539307e-07, 8.784234523773193e-06, 1.6730278730392456e-05, 2.467632293701172e-05, 3.262236714363098e-05, 4.0568411350250244e-05, 4.851445555686951e-05, 5.646049976348877e-05, 6.440654397010803e-05, 7.23525881767273e-05, 8.029863238334656e-05, 8.824467658996582e-05, 9.619072079658508e-05, 0.00010413676500320435, 0.00011208280920982361, 0.00012002885341644287, 0.00012797489762306213, 0.0001359209418296814, 0.00014386698603630066, 0.00015181303024291992, 0.00015975907444953918, 0.00016770511865615845, 0.0001756511628627777, 0.00018359720706939697, 0.00019154325127601624, 0.0001994892954826355, 0.00020743533968925476, 0.00021538138389587402, 0.00022332742810249329, 0.00023127347230911255, 0.0002392195165157318, 0.0002471655607223511, 0.00025511160492897034, 0.0002630576491355896, 0.00027100369334220886, 0.0002789497375488281]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 0.0, 5.0, 4.0, 3.0, 6.0, 10.0, 7.0, 11.0, 21.0, 25.0, 30.0, 63.0, 99.0, 188.0, 355.0, 743.0, 1719.0, 4083.0, 10899.0, 31934.0, 107682.0, 338358.0, 371137.0, 124535.0, 36438.0, 12044.0, 4546.0, 1838.0, 815.0, 349.0, 218.0, 139.0, 71.0, 52.0, 33.0, 15.0, 15.0, 24.0, 10.0, 7.0, 8.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54736328125, -0.5312919616699219, -0.5152206420898438, -0.4991493225097656, -0.4830780029296875, -0.4670066833496094, -0.45093536376953125, -0.4348640441894531, -0.418792724609375, -0.4027214050292969, -0.38665008544921875, -0.3705787658691406, -0.3545074462890625, -0.3384361267089844, -0.32236480712890625, -0.3062934875488281, -0.29022216796875, -0.2741508483886719, -0.25807952880859375, -0.24200820922851562, -0.2259368896484375, -0.20986557006835938, -0.19379425048828125, -0.17772293090820312, -0.161651611328125, -0.14558029174804688, -0.12950897216796875, -0.11343765258789062, -0.0973663330078125, -0.08129501342773438, -0.06522369384765625, -0.049152374267578125, -0.0330810546875, -0.017009735107421875, -0.00093841552734375, 0.015132904052734375, 0.0312042236328125, 0.047275543212890625, 0.06334686279296875, 0.07941818237304688, 0.095489501953125, 0.11156082153320312, 0.12763214111328125, 0.14370346069335938, 0.1597747802734375, 0.17584609985351562, 0.19191741943359375, 0.20798873901367188, 0.22406005859375, 0.24013137817382812, 0.25620269775390625, 0.2722740173339844, 0.2883453369140625, 0.3044166564941406, 0.32048797607421875, 0.3365592956542969, 0.352630615234375, 0.3687019348144531, 0.38477325439453125, 0.4008445739746094, 0.4169158935546875, 0.4329872131347656, 0.44905853271484375, 0.4651298522949219, 0.481201171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 4.0, 8.0, 4.0, 8.0, 5.0, 11.0, 13.0, 20.0, 22.0, 21.0, 28.0, 38.0, 58.0, 59.0, 70.0, 75.0, 83.0, 64.0, 70.0, 58.0, 55.0, 39.0, 42.0, 31.0, 25.0, 17.0, 13.0, 11.0, 4.0, 10.0, 9.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.120361328125, -0.1161956787109375, -0.112030029296875, -0.1078643798828125, -0.10369873046875, -0.0995330810546875, -0.095367431640625, -0.0912017822265625, -0.0870361328125, -0.0828704833984375, -0.078704833984375, -0.0745391845703125, -0.07037353515625, -0.0662078857421875, -0.062042236328125, -0.0578765869140625, -0.0537109375, -0.0495452880859375, -0.045379638671875, -0.0412139892578125, -0.03704833984375, -0.0328826904296875, -0.028717041015625, -0.0245513916015625, -0.0203857421875, -0.0162200927734375, -0.012054443359375, -0.0078887939453125, -0.00372314453125, 0.0004425048828125, 0.004608154296875, 0.0087738037109375, 0.012939453125, 0.0171051025390625, 0.021270751953125, 0.0254364013671875, 0.02960205078125, 0.0337677001953125, 0.037933349609375, 0.0420989990234375, 0.0462646484375, 0.0504302978515625, 0.054595947265625, 0.0587615966796875, 0.06292724609375, 0.0670928955078125, 0.071258544921875, 0.0754241943359375, 0.07958984375, 0.0837554931640625, 0.087921142578125, 0.0920867919921875, 0.09625244140625, 0.1004180908203125, 0.104583740234375, 0.1087493896484375, 0.1129150390625, 0.1170806884765625, 0.121246337890625, 0.1254119873046875, 0.12957763671875, 0.1337432861328125, 0.137908935546875, 0.1420745849609375, 0.146240234375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 11.0, 13.0, 30.0, 31.0, 55.0, 92.0, 139.0, 141.0, 133.0, 123.0, 75.0, 49.0, 31.0, 21.0, 18.0, 10.0, 6.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.231117248535156, -10.96853256225586, -10.705948829650879, -10.443364143371582, -10.180780410766602, -9.918195724487305, -9.655611038208008, -9.393027305603027, -9.13044261932373, -8.867857933044434, -8.605274200439453, -8.342689514160156, -8.08010482788086, -7.817521095275879, -7.554936408996582, -7.292352199554443, -7.029767990112305, -6.767183780670166, -6.504599571228027, -6.2420148849487305, -5.979430675506592, -5.716846466064453, -5.454261779785156, -5.191677570343018, -4.929093360900879, -4.66650915145874, -4.403924942016602, -4.141340255737305, -3.878756046295166, -3.6161718368530273, -3.3535873889923096, -3.091002941131592, -2.8284177780151367, -2.565833568572998, -2.3032491207122803, -2.0406646728515625, -1.7780804634094238, -1.5154961347579956, -1.2529118061065674, -0.9903274774551392, -0.7277431488037109, -0.4651588201522827, -0.2025744915008545, 0.06000983715057373, 0.32259416580200195, 0.5851784944534302, 0.8477628231048584, 1.1103471517562866, 1.3729314804077148, 1.635515809059143, 1.8981001377105713, 2.160684585571289, 2.4232687950134277, 2.6858530044555664, 2.948437452316284, 3.211021900177002, 3.4736061096191406, 3.7361903190612793, 3.998774766921997, 4.261359214782715, 4.5239434242248535, 4.786527633666992, 5.049112319946289, 5.311696529388428, 5.574280738830566]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 13.0, 10.0, 11.0, 28.0, 19.0, 30.0, 23.0, 30.0, 45.0, 52.0, 43.0, 53.0, 52.0, 43.0, 55.0, 54.0, 45.0, 53.0, 35.0, 42.0, 42.0, 29.0, 36.0, 32.0, 28.0, 16.0, 19.0, 9.0, 9.0, 8.0, 10.0, 4.0, 3.0, 4.0, 6.0, 2.0, 0.0, 3.0], "bins": [-5.188355445861816, -5.061628341674805, -4.934901237487793, -4.8081746101379395, -4.681447505950928, -4.554720401763916, -4.4279937744140625, -4.301266670227051, -4.174539566040039, -4.047812461853027, -3.9210855960845947, -3.794358730316162, -3.6676316261291504, -3.5409045219421387, -3.414177656173706, -3.2874507904052734, -3.1607236862182617, -3.03399658203125, -2.9072697162628174, -2.7805428504943848, -2.653815746307373, -2.5270886421203613, -2.4003617763519287, -2.273634910583496, -2.1469078063964844, -2.0201807022094727, -1.89345383644104, -1.7667268514633179, -1.6399998664855957, -1.5132728815078735, -1.3865458965301514, -1.2598189115524292, -1.1330924034118652, -1.006365418434143, -0.8796384334564209, -0.7529114484786987, -0.6261844635009766, -0.4994574785232544, -0.3727304935455322, -0.24600350856781006, -0.11927652359008789, 0.007450461387634277, 0.13417744636535645, 0.2609044313430786, 0.3876314163208008, 0.514358401298523, 0.6410853862762451, 0.7678123712539673, 0.8945393562316895, 1.0212663412094116, 1.1479933261871338, 1.274720311164856, 1.4014472961425781, 1.5281742811203003, 1.6549012660980225, 1.7816282510757446, 1.9083552360534668, 2.0350823402404785, 2.161809206008911, 2.2885360717773438, 2.4152631759643555, 2.541990280151367, 2.6687171459198, 2.7954440116882324, 2.922171115875244]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 10.0, 4.0, 7.0, 13.0, 21.0, 31.0, 40.0, 52.0, 88.0, 153.0, 233.0, 397.0, 641.0, 1140.0, 2104.0, 4004.0, 8516.0, 18387.0, 45812.0, 127559.0, 389527.0, 292726.0, 93697.0, 34466.0, 14737.0, 6699.0, 3398.0, 1628.0, 978.0, 561.0, 330.0, 196.0, 124.0, 85.0, 69.0, 38.0, 31.0, 14.0, 11.0, 8.0, 3.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4765625, -3.3560791015625, -3.235595703125, -3.1151123046875, -2.99462890625, -2.8741455078125, -2.753662109375, -2.6331787109375, -2.5126953125, -2.3922119140625, -2.271728515625, -2.1512451171875, -2.03076171875, -1.9102783203125, -1.789794921875, -1.6693115234375, -1.548828125, -1.4283447265625, -1.307861328125, -1.1873779296875, -1.06689453125, -0.9464111328125, -0.825927734375, -0.7054443359375, -0.5849609375, -0.4644775390625, -0.343994140625, -0.2235107421875, -0.10302734375, 0.0174560546875, 0.137939453125, 0.2584228515625, 0.37890625, 0.4993896484375, 0.619873046875, 0.7403564453125, 0.86083984375, 0.9813232421875, 1.101806640625, 1.2222900390625, 1.3427734375, 1.4632568359375, 1.583740234375, 1.7042236328125, 1.82470703125, 1.9451904296875, 2.065673828125, 2.1861572265625, 2.306640625, 2.4271240234375, 2.547607421875, 2.6680908203125, 2.78857421875, 2.9090576171875, 3.029541015625, 3.1500244140625, 3.2705078125, 3.3909912109375, 3.511474609375, 3.6319580078125, 3.75244140625, 3.8729248046875, 3.993408203125, 4.1138916015625, 4.234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 5.0, 5.0, 5.0, 8.0, 17.0, 13.0, 15.0, 23.0, 45.0, 30.0, 39.0, 50.0, 51.0, 49.0, 61.0, 55.0, 50.0, 49.0, 53.0, 42.0, 44.0, 49.0, 32.0, 35.0, 31.0, 21.0, 25.0, 23.0, 11.0, 11.0, 8.0, 10.0, 7.0, 6.0, 8.0, 5.0, 3.0, 1.0, 5.0], "bins": [-12.2421875, -11.947265625, -11.65234375, -11.357421875, -11.0625, -10.767578125, -10.47265625, -10.177734375, -9.8828125, -9.587890625, -9.29296875, -8.998046875, -8.703125, -8.408203125, -8.11328125, -7.818359375, -7.5234375, -7.228515625, -6.93359375, -6.638671875, -6.34375, -6.048828125, -5.75390625, -5.458984375, -5.1640625, -4.869140625, -4.57421875, -4.279296875, -3.984375, -3.689453125, -3.39453125, -3.099609375, -2.8046875, -2.509765625, -2.21484375, -1.919921875, -1.625, -1.330078125, -1.03515625, -0.740234375, -0.4453125, -0.150390625, 0.14453125, 0.439453125, 0.734375, 1.029296875, 1.32421875, 1.619140625, 1.9140625, 2.208984375, 2.50390625, 2.798828125, 3.09375, 3.388671875, 3.68359375, 3.978515625, 4.2734375, 4.568359375, 4.86328125, 5.158203125, 5.453125, 5.748046875, 6.04296875, 6.337890625, 6.6328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 5.0, 9.0, 13.0, 23.0, 30.0, 42.0, 52.0, 92.0, 142.0, 240.0, 451.0, 1176.0, 4144.0, 21735.0, 189563.0, 717456.0, 95747.0, 13022.0, 2787.0, 873.0, 365.0, 203.0, 137.0, 62.0, 54.0, 41.0, 27.0, 16.0, 13.0, 7.0, 6.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9609375, -5.750732421875, -5.54052734375, -5.330322265625, -5.1201171875, -4.909912109375, -4.69970703125, -4.489501953125, -4.279296875, -4.069091796875, -3.85888671875, -3.648681640625, -3.4384765625, -3.228271484375, -3.01806640625, -2.807861328125, -2.59765625, -2.387451171875, -2.17724609375, -1.967041015625, -1.7568359375, -1.546630859375, -1.33642578125, -1.126220703125, -0.916015625, -0.705810546875, -0.49560546875, -0.285400390625, -0.0751953125, 0.135009765625, 0.34521484375, 0.555419921875, 0.765625, 0.975830078125, 1.18603515625, 1.396240234375, 1.6064453125, 1.816650390625, 2.02685546875, 2.237060546875, 2.447265625, 2.657470703125, 2.86767578125, 3.077880859375, 3.2880859375, 3.498291015625, 3.70849609375, 3.918701171875, 4.12890625, 4.339111328125, 4.54931640625, 4.759521484375, 4.9697265625, 5.179931640625, 5.39013671875, 5.600341796875, 5.810546875, 6.020751953125, 6.23095703125, 6.441162109375, 6.6513671875, 6.861572265625, 7.07177734375, 7.281982421875, 7.4921875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 11.0, 9.0, 10.0, 5.0, 12.0, 21.0, 20.0, 24.0, 38.0, 33.0, 47.0, 48.0, 38.0, 49.0, 56.0, 51.0, 58.0, 49.0, 51.0, 51.0, 45.0, 53.0, 33.0, 39.0, 27.0, 24.0, 23.0, 24.0, 12.0, 11.0, 8.0, 8.0, 4.0, 5.0, 6.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.53125, -9.16064453125, -8.7900390625, -8.41943359375, -8.048828125, -7.67822265625, -7.3076171875, -6.93701171875, -6.56640625, -6.19580078125, -5.8251953125, -5.45458984375, -5.083984375, -4.71337890625, -4.3427734375, -3.97216796875, -3.6015625, -3.23095703125, -2.8603515625, -2.48974609375, -2.119140625, -1.74853515625, -1.3779296875, -1.00732421875, -0.63671875, -0.26611328125, 0.1044921875, 0.47509765625, 0.845703125, 1.21630859375, 1.5869140625, 1.95751953125, 2.328125, 2.69873046875, 3.0693359375, 3.43994140625, 3.810546875, 4.18115234375, 4.5517578125, 4.92236328125, 5.29296875, 5.66357421875, 6.0341796875, 6.40478515625, 6.775390625, 7.14599609375, 7.5166015625, 7.88720703125, 8.2578125, 8.62841796875, 8.9990234375, 9.36962890625, 9.740234375, 10.11083984375, 10.4814453125, 10.85205078125, 11.22265625, 11.59326171875, 11.9638671875, 12.33447265625, 12.705078125, 13.07568359375, 13.4462890625, 13.81689453125, 14.1875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 2.0, 10.0, 12.0, 9.0, 12.0, 20.0, 13.0, 26.0, 34.0, 53.0, 69.0, 125.0, 233.0, 409.0, 1085.0, 2841.0, 9473.0, 44507.0, 313512.0, 571419.0, 82478.0, 15155.0, 4204.0, 1463.0, 606.0, 325.0, 158.0, 106.0, 57.0, 30.0, 26.0, 16.0, 16.0, 10.0, 6.0, 6.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.818359375, -1.7600250244140625, -1.701690673828125, -1.6433563232421875, -1.58502197265625, -1.5266876220703125, -1.468353271484375, -1.4100189208984375, -1.3516845703125, -1.2933502197265625, -1.235015869140625, -1.1766815185546875, -1.11834716796875, -1.0600128173828125, -1.001678466796875, -0.9433441162109375, -0.885009765625, -0.8266754150390625, -0.768341064453125, -0.7100067138671875, -0.65167236328125, -0.5933380126953125, -0.535003662109375, -0.4766693115234375, -0.4183349609375, -0.3600006103515625, -0.301666259765625, -0.2433319091796875, -0.18499755859375, -0.1266632080078125, -0.068328857421875, -0.0099945068359375, 0.04833984375, 0.1066741943359375, 0.165008544921875, 0.2233428955078125, 0.28167724609375, 0.3400115966796875, 0.398345947265625, 0.4566802978515625, 0.5150146484375, 0.5733489990234375, 0.631683349609375, 0.6900177001953125, 0.74835205078125, 0.8066864013671875, 0.865020751953125, 0.9233551025390625, 0.981689453125, 1.0400238037109375, 1.098358154296875, 1.1566925048828125, 1.21502685546875, 1.2733612060546875, 1.331695556640625, 1.3900299072265625, 1.4483642578125, 1.5066986083984375, 1.565032958984375, 1.6233673095703125, 1.68170166015625, 1.7400360107421875, 1.798370361328125, 1.8567047119140625, 1.9150390625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 8.0, 10.0, 8.0, 13.0, 23.0, 31.0, 36.0, 46.0, 68.0, 90.0, 89.0, 107.0, 106.0, 95.0, 66.0, 51.0, 33.0, 25.0, 23.0, 15.0, 10.0, 12.0, 8.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003077983856201172, -0.00029908493161201477, -0.00029037147760391235, -0.00028165802359580994, -0.0002729445695877075, -0.0002642311155796051, -0.0002555176615715027, -0.00024680420756340027, -0.00023809075355529785, -0.00022937729954719543, -0.00022066384553909302, -0.0002119503915309906, -0.00020323693752288818, -0.00019452348351478577, -0.00018581002950668335, -0.00017709657549858093, -0.00016838312149047852, -0.0001596696674823761, -0.00015095621347427368, -0.00014224275946617126, -0.00013352930545806885, -0.00012481585144996643, -0.00011610239744186401, -0.0001073889434337616, -9.867548942565918e-05, -8.996203541755676e-05, -8.124858140945435e-05, -7.253512740135193e-05, -6.382167339324951e-05, -5.5108219385147095e-05, -4.639476537704468e-05, -3.768131136894226e-05, -2.8967857360839844e-05, -2.0254403352737427e-05, -1.154094934463501e-05, -2.8274953365325928e-06, 5.885958671569824e-06, 1.4599412679672241e-05, 2.3312866687774658e-05, 3.2026320695877075e-05, 4.073977470397949e-05, 4.945322871208191e-05, 5.8166682720184326e-05, 6.688013672828674e-05, 7.559359073638916e-05, 8.430704474449158e-05, 9.3020498752594e-05, 0.00010173395276069641, 0.00011044740676879883, 0.00011916086077690125, 0.00012787431478500366, 0.00013658776879310608, 0.0001453012228012085, 0.0001540146768093109, 0.00016272813081741333, 0.00017144158482551575, 0.00018015503883361816, 0.00018886849284172058, 0.000197581946849823, 0.00020629540085792542, 0.00021500885486602783, 0.00022372230887413025, 0.00023243576288223267, 0.00024114921689033508, 0.0002498626708984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 6.0, 7.0, 11.0, 12.0, 20.0, 23.0, 56.0, 74.0, 109.0, 188.0, 377.0, 859.0, 2179.0, 5949.0, 19100.0, 81361.0, 440786.0, 397278.0, 73090.0, 17775.0, 5435.0, 2065.0, 852.0, 413.0, 204.0, 128.0, 83.0, 36.0, 23.0, 16.0, 5.0, 6.0, 10.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4326171875, -1.3813934326171875, -1.330169677734375, -1.2789459228515625, -1.22772216796875, -1.1764984130859375, -1.125274658203125, -1.0740509033203125, -1.0228271484375, -0.9716033935546875, -0.920379638671875, -0.8691558837890625, -0.81793212890625, -0.7667083740234375, -0.715484619140625, -0.6642608642578125, -0.613037109375, -0.5618133544921875, -0.510589599609375, -0.4593658447265625, -0.40814208984375, -0.3569183349609375, -0.305694580078125, -0.2544708251953125, -0.2032470703125, -0.1520233154296875, -0.100799560546875, -0.0495758056640625, 0.00164794921875, 0.0528717041015625, 0.104095458984375, 0.1553192138671875, 0.20654296875, 0.2577667236328125, 0.308990478515625, 0.3602142333984375, 0.41143798828125, 0.4626617431640625, 0.513885498046875, 0.5651092529296875, 0.6163330078125, 0.6675567626953125, 0.718780517578125, 0.7700042724609375, 0.82122802734375, 0.8724517822265625, 0.923675537109375, 0.9748992919921875, 1.026123046875, 1.0773468017578125, 1.128570556640625, 1.1797943115234375, 1.23101806640625, 1.2822418212890625, 1.333465576171875, 1.3846893310546875, 1.4359130859375, 1.4871368408203125, 1.538360595703125, 1.5895843505859375, 1.64080810546875, 1.6920318603515625, 1.743255615234375, 1.7944793701171875, 1.845703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 9.0, 9.0, 7.0, 13.0, 11.0, 22.0, 23.0, 18.0, 34.0, 49.0, 49.0, 72.0, 89.0, 98.0, 86.0, 70.0, 80.0, 50.0, 46.0, 23.0, 23.0, 24.0, 19.0, 11.0, 11.0, 7.0, 6.0, 10.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.880859375, -0.8563690185546875, -0.831878662109375, -0.8073883056640625, -0.78289794921875, -0.7584075927734375, -0.733917236328125, -0.7094268798828125, -0.6849365234375, -0.6604461669921875, -0.635955810546875, -0.6114654541015625, -0.58697509765625, -0.5624847412109375, -0.537994384765625, -0.5135040283203125, -0.489013671875, -0.4645233154296875, -0.440032958984375, -0.4155426025390625, -0.39105224609375, -0.3665618896484375, -0.342071533203125, -0.3175811767578125, -0.2930908203125, -0.2686004638671875, -0.244110107421875, -0.2196197509765625, -0.19512939453125, -0.1706390380859375, -0.146148681640625, -0.1216583251953125, -0.09716796875, -0.0726776123046875, -0.048187255859375, -0.0236968994140625, 0.00079345703125, 0.0252838134765625, 0.049774169921875, 0.0742645263671875, 0.0987548828125, 0.1232452392578125, 0.147735595703125, 0.1722259521484375, 0.19671630859375, 0.2212066650390625, 0.245697021484375, 0.2701873779296875, 0.294677734375, 0.3191680908203125, 0.343658447265625, 0.3681488037109375, 0.39263916015625, 0.4171295166015625, 0.441619873046875, 0.4661102294921875, 0.4906005859375, 0.5150909423828125, 0.539581298828125, 0.5640716552734375, 0.58856201171875, 0.6130523681640625, 0.637542724609375, 0.6620330810546875, 0.6865234375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 12.0, 16.0, 14.0, 31.0, 34.0, 52.0, 93.0, 110.0, 148.0, 125.0, 106.0, 95.0, 51.0, 36.0, 18.0, 16.0, 11.0, 9.0, 7.0, 4.0, 6.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.37177085876465, -20.88273048400879, -20.39369010925293, -19.90464973449707, -19.415611267089844, -18.926570892333984, -18.437530517578125, -17.948490142822266, -17.459449768066406, -16.970409393310547, -16.481369018554688, -15.992329597473145, -15.503289222717285, -15.014249801635742, -14.525209426879883, -14.036169052124023, -13.547128677368164, -13.058088302612305, -12.569048881530762, -12.080008506774902, -11.590968132019043, -11.1019287109375, -10.61288833618164, -10.123847961425781, -9.634808540344238, -9.145768165588379, -8.656728744506836, -8.167688369750977, -7.678647994995117, -7.189608097076416, -6.700568199157715, -6.2115278244018555, -5.722487449645996, -5.233447551727295, -4.7444071769714355, -4.255367279052734, -3.766326904296875, -3.277287006378174, -2.7882468700408936, -2.2992067337036133, -1.810166597366333, -1.3211264610290527, -0.8320863842964172, -0.34304630756378174, 0.14599382877349854, 0.6350338459014893, 1.1240739822387695, 1.6131141185760498, 2.10215425491333, 2.5911943912506104, 3.0802345275878906, 3.569274425506592, 4.058314800262451, 4.547354698181152, 5.036395072937012, 5.525434970855713, 6.014474868774414, 6.503514766693115, 6.992555141448975, 7.481595039367676, 7.970635414123535, 8.459674835205078, 8.948715209960938, 9.437755584716797, 9.926795959472656]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 11.0, 4.0, 11.0, 10.0, 8.0, 11.0, 28.0, 23.0, 30.0, 28.0, 40.0, 33.0, 39.0, 42.0, 34.0, 47.0, 56.0, 37.0, 36.0, 41.0, 42.0, 34.0, 45.0, 42.0, 28.0, 25.0, 33.0, 25.0, 27.0, 17.0, 21.0, 18.0, 17.0, 13.0, 6.0, 14.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.588801383972168, -14.067383766174316, -13.545965194702148, -13.024547576904297, -12.503129005432129, -11.981711387634277, -11.46029281616211, -10.938875198364258, -10.417457580566406, -9.896039962768555, -9.374621391296387, -8.853203773498535, -8.331785202026367, -7.810367584228516, -7.288949489593506, -6.767531394958496, -6.246112823486328, -5.724694728851318, -5.203276634216309, -4.681859016418457, -4.160440444946289, -3.6390225887298584, -3.1176047325134277, -2.596186637878418, -2.074768543243408, -1.5533504486083984, -1.0319324731826782, -0.510514497756958, 0.010903596878051758, 0.5323216915130615, 1.0537395477294922, 1.575157642364502, 2.096576690673828, 2.617994785308838, 3.1394128799438477, 3.6608307361602783, 4.182249069213867, 4.703666687011719, 5.2250847816467285, 5.746502876281738, 6.267920970916748, 6.789339065551758, 7.310757160186768, 7.832175254821777, 8.353592872619629, 8.875011444091797, 9.396429061889648, 9.9178466796875, 10.439265251159668, 10.96068286895752, 11.482101440429688, 12.003519058227539, 12.524937629699707, 13.046355247497559, 13.567773818969727, 14.089191436767578, 14.61060905456543, 15.132026672363281, 15.65344524383545, 16.174863815307617, 16.69628143310547, 17.21769905090332, 17.739116668701172, 18.260536193847656, 18.781953811645508]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 6.0, 5.0, 15.0, 13.0, 20.0, 32.0, 54.0, 71.0, 95.0, 160.0, 278.0, 399.0, 622.0, 990.0, 1771.0, 3257.0, 6595.0, 15651.0, 47527.0, 192000.0, 1081783.0, 2179479.0, 515933.0, 98590.0, 27547.0, 10421.0, 4790.0, 2493.0, 1390.0, 873.0, 486.0, 342.0, 196.0, 130.0, 84.0, 58.0, 36.0, 27.0, 23.0, 12.0, 10.0, 8.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-6.546875, -6.37127685546875, -6.1956787109375, -6.02008056640625, -5.844482421875, -5.66888427734375, -5.4932861328125, -5.31768798828125, -5.14208984375, -4.96649169921875, -4.7908935546875, -4.61529541015625, -4.439697265625, -4.26409912109375, -4.0885009765625, -3.91290283203125, -3.7373046875, -3.56170654296875, -3.3861083984375, -3.21051025390625, -3.034912109375, -2.85931396484375, -2.6837158203125, -2.50811767578125, -2.33251953125, -2.15692138671875, -1.9813232421875, -1.80572509765625, -1.630126953125, -1.45452880859375, -1.2789306640625, -1.10333251953125, -0.927734375, -0.75213623046875, -0.5765380859375, -0.40093994140625, -0.225341796875, -0.04974365234375, 0.1258544921875, 0.30145263671875, 0.47705078125, 0.65264892578125, 0.8282470703125, 1.00384521484375, 1.179443359375, 1.35504150390625, 1.5306396484375, 1.70623779296875, 1.8818359375, 2.05743408203125, 2.2330322265625, 2.40863037109375, 2.584228515625, 2.75982666015625, 2.9354248046875, 3.11102294921875, 3.28662109375, 3.46221923828125, 3.6378173828125, 3.81341552734375, 3.989013671875, 4.16461181640625, 4.3402099609375, 4.51580810546875, 4.69140625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 8.0, 4.0, 3.0, 4.0, 6.0, 8.0, 5.0, 8.0, 15.0, 25.0, 22.0, 29.0, 32.0, 29.0, 41.0, 38.0, 52.0, 60.0, 50.0, 48.0, 52.0, 49.0, 53.0, 70.0, 48.0, 46.0, 38.0, 28.0, 25.0, 28.0, 23.0, 12.0, 8.0, 14.0, 5.0, 3.0, 6.0, 4.0, 8.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.3203125, -6.15087890625, -5.9814453125, -5.81201171875, -5.642578125, -5.47314453125, -5.3037109375, -5.13427734375, -4.96484375, -4.79541015625, -4.6259765625, -4.45654296875, -4.287109375, -4.11767578125, -3.9482421875, -3.77880859375, -3.609375, -3.43994140625, -3.2705078125, -3.10107421875, -2.931640625, -2.76220703125, -2.5927734375, -2.42333984375, -2.25390625, -2.08447265625, -1.9150390625, -1.74560546875, -1.576171875, -1.40673828125, -1.2373046875, -1.06787109375, -0.8984375, -0.72900390625, -0.5595703125, -0.39013671875, -0.220703125, -0.05126953125, 0.1181640625, 0.28759765625, 0.45703125, 0.62646484375, 0.7958984375, 0.96533203125, 1.134765625, 1.30419921875, 1.4736328125, 1.64306640625, 1.8125, 1.98193359375, 2.1513671875, 2.32080078125, 2.490234375, 2.65966796875, 2.8291015625, 2.99853515625, 3.16796875, 3.33740234375, 3.5068359375, 3.67626953125, 3.845703125, 4.01513671875, 4.1845703125, 4.35400390625, 4.5234375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 8.0, 14.0, 23.0, 22.0, 19.0, 39.0, 59.0, 69.0, 111.0, 169.0, 253.0, 425.0, 760.0, 1658.0, 3748.0, 10086.0, 34812.0, 179045.0, 2163196.0, 1612830.0, 141629.0, 29706.0, 8929.0, 3255.0, 1461.0, 753.0, 391.0, 242.0, 161.0, 102.0, 67.0, 57.0, 51.0, 27.0, 23.0, 23.0, 8.0, 9.0, 5.0, 6.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.59765625, -6.40325927734375, -6.2088623046875, -6.01446533203125, -5.820068359375, -5.62567138671875, -5.4312744140625, -5.23687744140625, -5.04248046875, -4.84808349609375, -4.6536865234375, -4.45928955078125, -4.264892578125, -4.07049560546875, -3.8760986328125, -3.68170166015625, -3.4873046875, -3.29290771484375, -3.0985107421875, -2.90411376953125, -2.709716796875, -2.51531982421875, -2.3209228515625, -2.12652587890625, -1.93212890625, -1.73773193359375, -1.5433349609375, -1.34893798828125, -1.154541015625, -0.96014404296875, -0.7657470703125, -0.57135009765625, -0.376953125, -0.18255615234375, 0.0118408203125, 0.20623779296875, 0.400634765625, 0.59503173828125, 0.7894287109375, 0.98382568359375, 1.17822265625, 1.37261962890625, 1.5670166015625, 1.76141357421875, 1.955810546875, 2.15020751953125, 2.3446044921875, 2.53900146484375, 2.7333984375, 2.92779541015625, 3.1221923828125, 3.31658935546875, 3.510986328125, 3.70538330078125, 3.8997802734375, 4.09417724609375, 4.28857421875, 4.48297119140625, 4.6773681640625, 4.87176513671875, 5.066162109375, 5.26055908203125, 5.4549560546875, 5.64935302734375, 5.84375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 5.0, 3.0, 4.0, 9.0, 10.0, 5.0, 10.0, 21.0, 19.0, 26.0, 43.0, 50.0, 76.0, 106.0, 125.0, 204.0, 305.0, 418.0, 503.0, 543.0, 448.0, 319.0, 254.0, 169.0, 123.0, 69.0, 39.0, 48.0, 43.0, 18.0, 15.0, 12.0, 3.0, 7.0, 6.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5810546875, -1.5227813720703125, -1.464508056640625, -1.4062347412109375, -1.34796142578125, -1.2896881103515625, -1.231414794921875, -1.1731414794921875, -1.1148681640625, -1.0565948486328125, -0.998321533203125, -0.9400482177734375, -0.88177490234375, -0.8235015869140625, -0.765228271484375, -0.7069549560546875, -0.648681640625, -0.5904083251953125, -0.532135009765625, -0.4738616943359375, -0.41558837890625, -0.3573150634765625, -0.299041748046875, -0.2407684326171875, -0.1824951171875, -0.1242218017578125, -0.065948486328125, -0.0076751708984375, 0.05059814453125, 0.1088714599609375, 0.167144775390625, 0.2254180908203125, 0.28369140625, 0.3419647216796875, 0.400238037109375, 0.4585113525390625, 0.51678466796875, 0.5750579833984375, 0.633331298828125, 0.6916046142578125, 0.7498779296875, 0.8081512451171875, 0.866424560546875, 0.9246978759765625, 0.98297119140625, 1.0412445068359375, 1.099517822265625, 1.1577911376953125, 1.216064453125, 1.2743377685546875, 1.332611083984375, 1.3908843994140625, 1.44915771484375, 1.5074310302734375, 1.565704345703125, 1.6239776611328125, 1.6822509765625, 1.7405242919921875, 1.798797607421875, 1.8570709228515625, 1.91534423828125, 1.9736175537109375, 2.031890869140625, 2.0901641845703125, 2.1484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 5.0, 2.0, 8.0, 8.0, 12.0, 13.0, 29.0, 68.0, 77.0, 108.0, 136.0, 144.0, 121.0, 85.0, 70.0, 47.0, 32.0, 11.0, 14.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.270666122436523, -16.89580535888672, -16.52094268798828, -16.146081924438477, -15.771220207214355, -15.396358489990234, -15.02149772644043, -14.646636009216309, -14.271774291992188, -13.896912574768066, -13.522051811218262, -13.14719009399414, -12.77232837677002, -12.397466659545898, -12.022605895996094, -11.647744178771973, -11.272883415222168, -10.898021697998047, -10.523160934448242, -10.148299217224121, -9.7734375, -9.398576736450195, -9.023715019226074, -8.648853302001953, -8.273992538452148, -7.8991312980651855, -7.5242695808410645, -7.149408340454102, -6.7745466232299805, -6.399685382843018, -6.024824142456055, -5.649962425231934, -5.275100231170654, -4.900238990783691, -4.52537727355957, -4.150516033172607, -3.7756545543670654, -3.4007930755615234, -3.0259318351745605, -2.6510703563690186, -2.2762088775634766, -1.9013473987579346, -1.5264860391616821, -1.1516246795654297, -0.7767632007598877, -0.4019017219543457, -0.027040481567382812, 0.3478209972381592, 0.7226824760437012, 1.0975439548492432, 1.4724053144454956, 1.847266674041748, 2.22212815284729, 2.596989631652832, 2.971850872039795, 3.346712350845337, 3.721573829650879, 4.096435070037842, 4.471296787261963, 4.846158027648926, 5.221019744873047, 5.59588098526001, 5.970742225646973, 6.345603942871094, 6.720465183258057]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 6.0, 3.0, 4.0, 10.0, 8.0, 21.0, 19.0, 20.0, 30.0, 28.0, 36.0, 47.0, 51.0, 54.0, 49.0, 62.0, 66.0, 57.0, 59.0, 43.0, 55.0, 52.0, 58.0, 27.0, 25.0, 20.0, 24.0, 13.0, 13.0, 14.0, 7.0, 9.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.115744590759277, -7.910972595214844, -7.70620059967041, -7.501428604125977, -7.296656608581543, -7.091884613037109, -6.887112617492676, -6.682340621948242, -6.477568626403809, -6.272796630859375, -6.068024635314941, -5.863252639770508, -5.658480644226074, -5.453708648681641, -5.248936653137207, -5.044164657592773, -4.839393138885498, -4.6346211433410645, -4.429849147796631, -4.225077152252197, -4.020305156707764, -3.81553316116333, -3.6107614040374756, -3.405989408493042, -3.2012174129486084, -2.996445417404175, -2.791673421859741, -2.5869016647338867, -2.382129669189453, -2.1773576736450195, -1.972585678100586, -1.7678136825561523, -1.5630412101745605, -1.358269214630127, -1.1534972190856934, -0.9487253427505493, -0.7439533472061157, -0.5391813516616821, -0.3344094753265381, -0.1296374797821045, 0.0751345157623291, 0.2799064815044403, 0.4846784472465515, 0.6894503831863403, 0.8942223787307739, 1.0989943742752075, 1.3037662506103516, 1.5085382461547852, 1.7133102416992188, 1.9180822372436523, 2.122854232788086, 2.3276262283325195, 2.532398223876953, 2.7371702194213867, 2.941941976547241, 3.146713972091675, 3.3514859676361084, 3.556257963180542, 3.7610299587249756, 3.96580171585083, 4.170573711395264, 4.375345706939697, 4.580117702484131, 4.7848896980285645, 4.989661693572998]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 9.0, 9.0, 8.0, 21.0, 30.0, 54.0, 82.0, 124.0, 225.0, 434.0, 746.0, 1597.0, 3260.0, 7474.0, 18130.0, 46999.0, 128576.0, 308894.0, 315824.0, 133460.0, 49060.0, 18903.0, 7902.0, 3396.0, 1523.0, 808.0, 403.0, 238.0, 122.0, 87.0, 55.0, 31.0, 27.0, 11.0, 8.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.09375, -1.063385009765625, -1.03302001953125, -1.002655029296875, -0.9722900390625, -0.941925048828125, -0.91156005859375, -0.881195068359375, -0.850830078125, -0.820465087890625, -0.79010009765625, -0.759735107421875, -0.7293701171875, -0.699005126953125, -0.66864013671875, -0.638275146484375, -0.60791015625, -0.577545166015625, -0.54718017578125, -0.516815185546875, -0.4864501953125, -0.456085205078125, -0.42572021484375, -0.395355224609375, -0.364990234375, -0.334625244140625, -0.30426025390625, -0.273895263671875, -0.2435302734375, -0.213165283203125, -0.18280029296875, -0.152435302734375, -0.1220703125, -0.091705322265625, -0.06134033203125, -0.030975341796875, -0.0006103515625, 0.029754638671875, 0.06011962890625, 0.090484619140625, 0.120849609375, 0.151214599609375, 0.18157958984375, 0.211944580078125, 0.2423095703125, 0.272674560546875, 0.30303955078125, 0.333404541015625, 0.36376953125, 0.394134521484375, 0.42449951171875, 0.454864501953125, 0.4852294921875, 0.515594482421875, 0.54595947265625, 0.576324462890625, 0.606689453125, 0.637054443359375, 0.66741943359375, 0.697784423828125, 0.7281494140625, 0.758514404296875, 0.78887939453125, 0.819244384765625, 0.849609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 6.0, 8.0, 16.0, 17.0, 23.0, 21.0, 26.0, 30.0, 46.0, 54.0, 61.0, 49.0, 62.0, 57.0, 60.0, 66.0, 57.0, 54.0, 58.0, 44.0, 35.0, 32.0, 17.0, 20.0, 16.0, 12.0, 15.0, 9.0, 5.0, 4.0, 3.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.5546875, -5.4130859375, -5.271484375, -5.1298828125, -4.98828125, -4.8466796875, -4.705078125, -4.5634765625, -4.421875, -4.2802734375, -4.138671875, -3.9970703125, -3.85546875, -3.7138671875, -3.572265625, -3.4306640625, -3.2890625, -3.1474609375, -3.005859375, -2.8642578125, -2.72265625, -2.5810546875, -2.439453125, -2.2978515625, -2.15625, -2.0146484375, -1.873046875, -1.7314453125, -1.58984375, -1.4482421875, -1.306640625, -1.1650390625, -1.0234375, -0.8818359375, -0.740234375, -0.5986328125, -0.45703125, -0.3154296875, -0.173828125, -0.0322265625, 0.109375, 0.2509765625, 0.392578125, 0.5341796875, 0.67578125, 0.8173828125, 0.958984375, 1.1005859375, 1.2421875, 1.3837890625, 1.525390625, 1.6669921875, 1.80859375, 1.9501953125, 2.091796875, 2.2333984375, 2.375, 2.5166015625, 2.658203125, 2.7998046875, 2.94140625, 3.0830078125, 3.224609375, 3.3662109375, 3.5078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 14.0, 14.0, 15.0, 30.0, 56.0, 92.0, 125.0, 206.0, 399.0, 860.0, 2464.0, 7764.0, 34987.0, 192122.0, 542538.0, 215292.0, 38596.0, 8531.0, 2533.0, 960.0, 386.0, 227.0, 112.0, 66.0, 52.0, 33.0, 25.0, 19.0, 11.0, 6.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4755859375, -1.43157958984375, -1.3875732421875, -1.34356689453125, -1.299560546875, -1.25555419921875, -1.2115478515625, -1.16754150390625, -1.12353515625, -1.07952880859375, -1.0355224609375, -0.99151611328125, -0.947509765625, -0.90350341796875, -0.8594970703125, -0.81549072265625, -0.771484375, -0.72747802734375, -0.6834716796875, -0.63946533203125, -0.595458984375, -0.55145263671875, -0.5074462890625, -0.46343994140625, -0.41943359375, -0.37542724609375, -0.3314208984375, -0.28741455078125, -0.243408203125, -0.19940185546875, -0.1553955078125, -0.11138916015625, -0.0673828125, -0.02337646484375, 0.0206298828125, 0.06463623046875, 0.108642578125, 0.15264892578125, 0.1966552734375, 0.24066162109375, 0.28466796875, 0.32867431640625, 0.3726806640625, 0.41668701171875, 0.460693359375, 0.50469970703125, 0.5487060546875, 0.59271240234375, 0.63671875, 0.68072509765625, 0.7247314453125, 0.76873779296875, 0.812744140625, 0.85675048828125, 0.9007568359375, 0.94476318359375, 0.98876953125, 1.03277587890625, 1.0767822265625, 1.12078857421875, 1.164794921875, 1.20880126953125, 1.2528076171875, 1.29681396484375, 1.3408203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 11.0, 10.0, 12.0, 12.0, 13.0, 20.0, 21.0, 10.0, 22.0, 31.0, 34.0, 36.0, 28.0, 40.0, 41.0, 32.0, 43.0, 44.0, 46.0, 41.0, 41.0, 40.0, 32.0, 46.0, 44.0, 27.0, 28.0, 26.0, 22.0, 22.0, 18.0, 29.0, 15.0, 9.0, 8.0, 13.0, 6.0, 2.0, 3.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-7.30859375, -7.0897216796875, -6.870849609375, -6.6519775390625, -6.43310546875, -6.2142333984375, -5.995361328125, -5.7764892578125, -5.5576171875, -5.3387451171875, -5.119873046875, -4.9010009765625, -4.68212890625, -4.4632568359375, -4.244384765625, -4.0255126953125, -3.806640625, -3.5877685546875, -3.368896484375, -3.1500244140625, -2.93115234375, -2.7122802734375, -2.493408203125, -2.2745361328125, -2.0556640625, -1.8367919921875, -1.617919921875, -1.3990478515625, -1.18017578125, -0.9613037109375, -0.742431640625, -0.5235595703125, -0.3046875, -0.0858154296875, 0.133056640625, 0.3519287109375, 0.57080078125, 0.7896728515625, 1.008544921875, 1.2274169921875, 1.4462890625, 1.6651611328125, 1.884033203125, 2.1029052734375, 2.32177734375, 2.5406494140625, 2.759521484375, 2.9783935546875, 3.197265625, 3.4161376953125, 3.635009765625, 3.8538818359375, 4.07275390625, 4.2916259765625, 4.510498046875, 4.7293701171875, 4.9482421875, 5.1671142578125, 5.385986328125, 5.6048583984375, 5.82373046875, 6.0426025390625, 6.261474609375, 6.4803466796875, 6.69921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 14.0, 15.0, 13.0, 23.0, 32.0, 47.0, 63.0, 88.0, 151.0, 218.0, 344.0, 558.0, 901.0, 1580.0, 3138.0, 6757.0, 16856.0, 48699.0, 156173.0, 380787.0, 286410.0, 93601.0, 30375.0, 11094.0, 4939.0, 2319.0, 1276.0, 734.0, 462.0, 272.0, 184.0, 131.0, 86.0, 33.0, 39.0, 28.0, 20.0, 19.0, 11.0, 11.0, 8.0, 8.0, 4.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 5.0], "bins": [-0.4462890625, -0.4330787658691406, -0.41986846923828125, -0.4066581726074219, -0.3934478759765625, -0.3802375793457031, -0.36702728271484375, -0.3538169860839844, -0.340606689453125, -0.3273963928222656, -0.31418609619140625, -0.3009757995605469, -0.2877655029296875, -0.2745552062988281, -0.26134490966796875, -0.24813461303710938, -0.23492431640625, -0.22171401977539062, -0.20850372314453125, -0.19529342651367188, -0.1820831298828125, -0.16887283325195312, -0.15566253662109375, -0.14245223999023438, -0.129241943359375, -0.11603164672851562, -0.10282135009765625, -0.08961105346679688, -0.0764007568359375, -0.06319046020507812, -0.04998016357421875, -0.036769866943359375, -0.0235595703125, -0.010349273681640625, 0.00286102294921875, 0.016071319580078125, 0.0292816162109375, 0.042491912841796875, 0.05570220947265625, 0.06891250610351562, 0.082122802734375, 0.09533309936523438, 0.10854339599609375, 0.12175369262695312, 0.1349639892578125, 0.14817428588867188, 0.16138458251953125, 0.17459487915039062, 0.18780517578125, 0.20101547241210938, 0.21422576904296875, 0.22743606567382812, 0.2406463623046875, 0.2538566589355469, 0.26706695556640625, 0.2802772521972656, 0.293487548828125, 0.3066978454589844, 0.31990814208984375, 0.3331184387207031, 0.3463287353515625, 0.3595390319824219, 0.37274932861328125, 0.3859596252441406, 0.399169921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 8.0, 11.0, 8.0, 10.0, 12.0, 19.0, 21.0, 30.0, 30.0, 44.0, 68.0, 61.0, 72.0, 77.0, 77.0, 73.0, 65.0, 63.0, 43.0, 43.0, 43.0, 22.0, 23.0, 14.0, 12.0, 13.0, 6.0, 4.0, 5.0, 4.0, 2.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00021564960479736328, -0.00020942650735378265, -0.00020320340991020203, -0.0001969803124666214, -0.00019075721502304077, -0.00018453411757946014, -0.00017831102013587952, -0.0001720879226922989, -0.00016586482524871826, -0.00015964172780513763, -0.000153418630361557, -0.00014719553291797638, -0.00014097243547439575, -0.00013474933803081512, -0.0001285262405872345, -0.00012230314314365387, -0.00011608004570007324, -0.00010985694825649261, -0.00010363385081291199, -9.741075336933136e-05, -9.118765592575073e-05, -8.49645584821701e-05, -7.874146103858948e-05, -7.251836359500885e-05, -6.629526615142822e-05, -6.0072168707847595e-05, -5.384907126426697e-05, -4.762597382068634e-05, -4.140287637710571e-05, -3.5179778933525085e-05, -2.8956681489944458e-05, -2.273358404636383e-05, -1.6510486602783203e-05, -1.0287389159202576e-05, -4.064291715621948e-06, 2.158805727958679e-06, 8.381903171539307e-06, 1.4605000615119934e-05, 2.082809805870056e-05, 2.705119550228119e-05, 3.3274292945861816e-05, 3.9497390389442444e-05, 4.572048783302307e-05, 5.19435852766037e-05, 5.8166682720184326e-05, 6.438978016376495e-05, 7.061287760734558e-05, 7.683597505092621e-05, 8.305907249450684e-05, 8.928216993808746e-05, 9.550526738166809e-05, 0.00010172836482524872, 0.00010795146226882935, 0.00011417455971240997, 0.0001203976571559906, 0.00012662075459957123, 0.00013284385204315186, 0.00013906694948673248, 0.0001452900469303131, 0.00015151314437389374, 0.00015773624181747437, 0.000163959339261055, 0.00017018243670463562, 0.00017640553414821625, 0.00018262863159179688]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 8.0, 9.0, 26.0, 12.0, 25.0, 39.0, 54.0, 80.0, 120.0, 227.0, 327.0, 559.0, 1015.0, 2104.0, 4493.0, 9913.0, 25158.0, 72075.0, 219913.0, 391593.0, 209351.0, 68955.0, 24279.0, 9481.0, 4285.0, 1937.0, 995.0, 571.0, 302.0, 207.0, 141.0, 84.0, 65.0, 42.0, 35.0, 20.0, 16.0, 9.0, 5.0, 7.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.40087890625, -0.387725830078125, -0.37457275390625, -0.361419677734375, -0.3482666015625, -0.335113525390625, -0.32196044921875, -0.308807373046875, -0.295654296875, -0.282501220703125, -0.26934814453125, -0.256195068359375, -0.2430419921875, -0.229888916015625, -0.21673583984375, -0.203582763671875, -0.1904296875, -0.177276611328125, -0.16412353515625, -0.150970458984375, -0.1378173828125, -0.124664306640625, -0.11151123046875, -0.098358154296875, -0.085205078125, -0.072052001953125, -0.05889892578125, -0.045745849609375, -0.0325927734375, -0.019439697265625, -0.00628662109375, 0.006866455078125, 0.02001953125, 0.033172607421875, 0.04632568359375, 0.059478759765625, 0.0726318359375, 0.085784912109375, 0.09893798828125, 0.112091064453125, 0.125244140625, 0.138397216796875, 0.15155029296875, 0.164703369140625, 0.1778564453125, 0.191009521484375, 0.20416259765625, 0.217315673828125, 0.23046875, 0.243621826171875, 0.25677490234375, 0.269927978515625, 0.2830810546875, 0.296234130859375, 0.30938720703125, 0.322540283203125, 0.335693359375, 0.348846435546875, 0.36199951171875, 0.375152587890625, 0.3883056640625, 0.401458740234375, 0.41461181640625, 0.427764892578125, 0.44091796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 8.0, 6.0, 10.0, 12.0, 4.0, 13.0, 20.0, 24.0, 26.0, 42.0, 40.0, 56.0, 55.0, 85.0, 71.0, 60.0, 76.0, 56.0, 48.0, 59.0, 53.0, 42.0, 33.0, 19.0, 18.0, 13.0, 5.0, 10.0, 5.0, 8.0, 4.0, 4.0, 2.0, 5.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1451416015625, -0.14094161987304688, -0.13674163818359375, -0.13254165649414062, -0.1283416748046875, -0.12414169311523438, -0.11994171142578125, -0.11574172973632812, -0.111541748046875, -0.10734176635742188, -0.10314178466796875, -0.09894180297851562, -0.0947418212890625, -0.09054183959960938, -0.08634185791015625, -0.08214187622070312, -0.07794189453125, -0.07374191284179688, -0.06954193115234375, -0.06534194946289062, -0.0611419677734375, -0.056941986083984375, -0.05274200439453125, -0.048542022705078125, -0.044342041015625, -0.040142059326171875, -0.03594207763671875, -0.031742095947265625, -0.0275421142578125, -0.023342132568359375, -0.01914215087890625, -0.014942169189453125, -0.0107421875, -0.006542205810546875, -0.00234222412109375, 0.001857757568359375, 0.0060577392578125, 0.010257720947265625, 0.01445770263671875, 0.018657684326171875, 0.022857666015625, 0.027057647705078125, 0.03125762939453125, 0.035457611083984375, 0.0396575927734375, 0.043857574462890625, 0.04805755615234375, 0.052257537841796875, 0.05645751953125, 0.060657501220703125, 0.06485748291015625, 0.06905746459960938, 0.0732574462890625, 0.07745742797851562, 0.08165740966796875, 0.08585739135742188, 0.090057373046875, 0.09425735473632812, 0.09845733642578125, 0.10265731811523438, 0.1068572998046875, 0.11105728149414062, 0.11525726318359375, 0.11945724487304688, 0.1236572265625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 4.0, 6.0, 17.0, 16.0, 46.0, 72.0, 89.0, 128.0, 155.0, 150.0, 97.0, 73.0, 59.0, 26.0, 17.0, 16.0, 6.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-12.267181396484375, -12.01455307006836, -11.76192569732666, -11.509297370910645, -11.256669044494629, -11.00404167175293, -10.751413345336914, -10.498785018920898, -10.2461576461792, -9.993529319763184, -9.740901947021484, -9.488273620605469, -9.235645294189453, -8.983017921447754, -8.730389595031738, -8.477761268615723, -8.225133895874023, -7.972506046295166, -7.71987771987915, -7.467249870300293, -7.2146220207214355, -6.961994171142578, -6.7093658447265625, -6.456737995147705, -6.204109191894531, -5.951481342315674, -5.698853015899658, -5.446225166320801, -5.193597316741943, -4.940969467163086, -4.68834114074707, -4.435713291168213, -4.183085918426514, -3.930457830429077, -3.6778299808502197, -3.425201892852783, -3.172574043273926, -2.9199459552764893, -2.6673178672790527, -2.4146900177001953, -2.162061929702759, -1.9094339609146118, -1.6568059921264648, -1.4041779041290283, -1.1515499353408813, -0.8989219665527344, -0.6462938785552979, -0.3936659097671509, -0.1410379409790039, 0.11159005761146545, 0.3642180562019348, 0.6168460845947266, 0.8694740533828735, 1.1221020221710205, 1.374730110168457, 1.627358078956604, 1.879986047744751, 2.1326141357421875, 2.385241985321045, 2.6378700733184814, 2.890498161315918, 3.1431260108947754, 3.395754098892212, 3.6483821868896484, 3.901010036468506]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 0.0, 5.0, 4.0, 6.0, 6.0, 11.0, 17.0, 22.0, 31.0, 28.0, 35.0, 45.0, 54.0, 54.0, 60.0, 72.0, 61.0, 84.0, 53.0, 53.0, 56.0, 62.0, 41.0, 31.0, 20.0, 22.0, 17.0, 13.0, 12.0, 3.0, 9.0, 10.0, 3.0, 8.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.348143100738525, -6.199432373046875, -6.050721645355225, -5.902010917663574, -5.753299713134766, -5.604588985443115, -5.455878257751465, -5.3071675300598145, -5.158456802368164, -5.009746074676514, -4.861035346984863, -4.712324619293213, -4.5636138916015625, -4.414902687072754, -4.2661919593811035, -4.117481231689453, -3.9687705039978027, -3.8200597763061523, -3.671349048614502, -3.5226380825042725, -3.373927354812622, -3.2252166271209717, -3.076505661010742, -2.927794933319092, -2.7790842056274414, -2.630373477935791, -2.4816627502441406, -2.332951784133911, -2.1842410564422607, -2.0355303287506104, -1.8868194818496704, -1.7381086349487305, -1.5893981456756592, -1.4406874179840088, -1.2919765710830688, -1.143265724182129, -0.9945549964904785, -0.8458442091941833, -0.6971334218978882, -0.5484225749969482, -0.39971184730529785, -0.2510010600090027, -0.10229027271270752, 0.046420514583587646, 0.1951313018798828, 0.343842089176178, 0.49255287647247314, 0.6412637233734131, 0.7899744510650635, 0.9386852383613586, 1.0873960256576538, 1.2361068725585938, 1.3848176002502441, 1.5335283279418945, 1.6822391748428345, 1.8309500217437744, 1.9796607494354248, 2.128371477127075, 2.2770824432373047, 2.425793170928955, 2.5745038986206055, 2.723214626312256, 2.8719253540039062, 3.0206363201141357, 3.169347047805786]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 6.0, 6.0, 14.0, 15.0, 17.0, 37.0, 46.0, 72.0, 113.0, 170.0, 246.0, 413.0, 622.0, 1042.0, 1628.0, 2889.0, 5137.0, 9372.0, 18841.0, 38691.0, 90658.0, 251938.0, 381838.0, 135926.0, 55024.0, 25510.0, 12754.0, 6451.0, 3652.0, 2141.0, 1169.0, 757.0, 441.0, 348.0, 180.0, 128.0, 91.0, 48.0, 42.0, 25.0, 23.0, 10.0, 5.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.654296875, -2.5718994140625, -2.489501953125, -2.4071044921875, -2.32470703125, -2.2423095703125, -2.159912109375, -2.0775146484375, -1.9951171875, -1.9127197265625, -1.830322265625, -1.7479248046875, -1.66552734375, -1.5831298828125, -1.500732421875, -1.4183349609375, -1.3359375, -1.2535400390625, -1.171142578125, -1.0887451171875, -1.00634765625, -0.9239501953125, -0.841552734375, -0.7591552734375, -0.6767578125, -0.5943603515625, -0.511962890625, -0.4295654296875, -0.34716796875, -0.2647705078125, -0.182373046875, -0.0999755859375, -0.017578125, 0.0648193359375, 0.147216796875, 0.2296142578125, 0.31201171875, 0.3944091796875, 0.476806640625, 0.5592041015625, 0.6416015625, 0.7239990234375, 0.806396484375, 0.8887939453125, 0.97119140625, 1.0535888671875, 1.135986328125, 1.2183837890625, 1.30078125, 1.3831787109375, 1.465576171875, 1.5479736328125, 1.63037109375, 1.7127685546875, 1.795166015625, 1.8775634765625, 1.9599609375, 2.0423583984375, 2.124755859375, 2.2071533203125, 2.28955078125, 2.3719482421875, 2.454345703125, 2.5367431640625, 2.619140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 9.0, 9.0, 12.0, 11.0, 19.0, 25.0, 25.0, 23.0, 37.0, 41.0, 33.0, 52.0, 49.0, 63.0, 55.0, 56.0, 54.0, 63.0, 47.0, 42.0, 45.0, 36.0, 35.0, 26.0, 24.0, 15.0, 19.0, 13.0, 14.0, 5.0, 5.0, 8.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-9.9921875, -9.7310791015625, -9.469970703125, -9.2088623046875, -8.94775390625, -8.6866455078125, -8.425537109375, -8.1644287109375, -7.9033203125, -7.6422119140625, -7.381103515625, -7.1199951171875, -6.85888671875, -6.5977783203125, -6.336669921875, -6.0755615234375, -5.814453125, -5.5533447265625, -5.292236328125, -5.0311279296875, -4.77001953125, -4.5089111328125, -4.247802734375, -3.9866943359375, -3.7255859375, -3.4644775390625, -3.203369140625, -2.9422607421875, -2.68115234375, -2.4200439453125, -2.158935546875, -1.8978271484375, -1.63671875, -1.3756103515625, -1.114501953125, -0.8533935546875, -0.59228515625, -0.3311767578125, -0.070068359375, 0.1910400390625, 0.4521484375, 0.7132568359375, 0.974365234375, 1.2354736328125, 1.49658203125, 1.7576904296875, 2.018798828125, 2.2799072265625, 2.541015625, 2.8021240234375, 3.063232421875, 3.3243408203125, 3.58544921875, 3.8465576171875, 4.107666015625, 4.3687744140625, 4.6298828125, 4.8909912109375, 5.152099609375, 5.4132080078125, 5.67431640625, 5.9354248046875, 6.196533203125, 6.4576416015625, 6.71875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 7.0, 10.0, 14.0, 15.0, 22.0, 31.0, 39.0, 59.0, 80.0, 121.0, 170.0, 315.0, 717.0, 1684.0, 4935.0, 17630.0, 88596.0, 613794.0, 265481.0, 40240.0, 9456.0, 2894.0, 1074.0, 450.0, 240.0, 155.0, 93.0, 59.0, 52.0, 25.0, 23.0, 18.0, 11.0, 12.0, 8.0, 3.0, 3.0, 4.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.58984375, -4.440673828125, -4.29150390625, -4.142333984375, -3.9931640625, -3.843994140625, -3.69482421875, -3.545654296875, -3.396484375, -3.247314453125, -3.09814453125, -2.948974609375, -2.7998046875, -2.650634765625, -2.50146484375, -2.352294921875, -2.203125, -2.053955078125, -1.90478515625, -1.755615234375, -1.6064453125, -1.457275390625, -1.30810546875, -1.158935546875, -1.009765625, -0.860595703125, -0.71142578125, -0.562255859375, -0.4130859375, -0.263916015625, -0.11474609375, 0.034423828125, 0.18359375, 0.332763671875, 0.48193359375, 0.631103515625, 0.7802734375, 0.929443359375, 1.07861328125, 1.227783203125, 1.376953125, 1.526123046875, 1.67529296875, 1.824462890625, 1.9736328125, 2.122802734375, 2.27197265625, 2.421142578125, 2.5703125, 2.719482421875, 2.86865234375, 3.017822265625, 3.1669921875, 3.316162109375, 3.46533203125, 3.614501953125, 3.763671875, 3.912841796875, 4.06201171875, 4.211181640625, 4.3603515625, 4.509521484375, 4.65869140625, 4.807861328125, 4.95703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 10.0, 7.0, 13.0, 9.0, 15.0, 15.0, 11.0, 21.0, 28.0, 13.0, 25.0, 22.0, 33.0, 28.0, 37.0, 37.0, 29.0, 42.0, 28.0, 37.0, 40.0, 39.0, 45.0, 42.0, 37.0, 42.0, 29.0, 37.0, 22.0, 29.0, 25.0, 20.0, 23.0, 14.0, 13.0, 10.0, 10.0, 8.0, 12.0, 6.0, 5.0, 6.0, 8.0, 3.0, 4.0, 5.0, 1.0, 0.0, 4.0], "bins": [-8.9296875, -8.68096923828125, -8.4322509765625, -8.18353271484375, -7.934814453125, -7.68609619140625, -7.4373779296875, -7.18865966796875, -6.93994140625, -6.69122314453125, -6.4425048828125, -6.19378662109375, -5.945068359375, -5.69635009765625, -5.4476318359375, -5.19891357421875, -4.9501953125, -4.70147705078125, -4.4527587890625, -4.20404052734375, -3.955322265625, -3.70660400390625, -3.4578857421875, -3.20916748046875, -2.96044921875, -2.71173095703125, -2.4630126953125, -2.21429443359375, -1.965576171875, -1.71685791015625, -1.4681396484375, -1.21942138671875, -0.970703125, -0.72198486328125, -0.4732666015625, -0.22454833984375, 0.024169921875, 0.27288818359375, 0.5216064453125, 0.77032470703125, 1.01904296875, 1.26776123046875, 1.5164794921875, 1.76519775390625, 2.013916015625, 2.26263427734375, 2.5113525390625, 2.76007080078125, 3.0087890625, 3.25750732421875, 3.5062255859375, 3.75494384765625, 4.003662109375, 4.25238037109375, 4.5010986328125, 4.74981689453125, 4.99853515625, 5.24725341796875, 5.4959716796875, 5.74468994140625, 5.993408203125, 6.24212646484375, 6.4908447265625, 6.73956298828125, 6.98828125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 11.0, 17.0, 30.0, 49.0, 72.0, 143.0, 264.0, 724.0, 2710.0, 19140.0, 297565.0, 682590.0, 39080.0, 4420.0, 1040.0, 354.0, 145.0, 84.0, 46.0, 24.0, 13.0, 10.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.326171875, -3.243316650390625, -3.16046142578125, -3.077606201171875, -2.9947509765625, -2.911895751953125, -2.82904052734375, -2.746185302734375, -2.663330078125, -2.580474853515625, -2.49761962890625, -2.414764404296875, -2.3319091796875, -2.249053955078125, -2.16619873046875, -2.083343505859375, -2.00048828125, -1.917633056640625, -1.83477783203125, -1.751922607421875, -1.6690673828125, -1.586212158203125, -1.50335693359375, -1.420501708984375, -1.337646484375, -1.254791259765625, -1.17193603515625, -1.089080810546875, -1.0062255859375, -0.923370361328125, -0.84051513671875, -0.757659912109375, -0.6748046875, -0.591949462890625, -0.50909423828125, -0.426239013671875, -0.3433837890625, -0.260528564453125, -0.17767333984375, -0.094818115234375, -0.011962890625, 0.070892333984375, 0.15374755859375, 0.236602783203125, 0.3194580078125, 0.402313232421875, 0.48516845703125, 0.568023681640625, 0.65087890625, 0.733734130859375, 0.81658935546875, 0.899444580078125, 0.9822998046875, 1.065155029296875, 1.14801025390625, 1.230865478515625, 1.313720703125, 1.396575927734375, 1.47943115234375, 1.562286376953125, 1.6451416015625, 1.727996826171875, 1.81085205078125, 1.893707275390625, 1.9765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 4.0, 5.0, 14.0, 27.0, 39.0, 48.0, 74.0, 87.0, 122.0, 200.0, 121.0, 78.0, 58.0, 30.0, 32.0, 25.0, 19.0, 4.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000270843505859375, -0.00025971606373786926, -0.0002485886216163635, -0.0002374611794948578, -0.00022633373737335205, -0.0002152062952518463, -0.00020407885313034058, -0.00019295141100883484, -0.0001818239688873291, -0.00017069652676582336, -0.00015956908464431763, -0.0001484416425228119, -0.00013731420040130615, -0.00012618675827980042, -0.00011505931615829468, -0.00010393187403678894, -9.28044319152832e-05, -8.167698979377747e-05, -7.054954767227173e-05, -5.942210555076599e-05, -4.8294663429260254e-05, -3.7167221307754517e-05, -2.603977918624878e-05, -1.4912337064743042e-05, -3.7848949432373047e-06, 7.342547178268433e-06, 1.846998929977417e-05, 2.9597431421279907e-05, 4.0724873542785645e-05, 5.185231566429138e-05, 6.297975778579712e-05, 7.410719990730286e-05, 8.52346420288086e-05, 9.636208415031433e-05, 0.00010748952627182007, 0.0001186169683933258, 0.00012974441051483154, 0.00014087185263633728, 0.00015199929475784302, 0.00016312673687934875, 0.0001742541790008545, 0.00018538162112236023, 0.00019650906324386597, 0.0002076365053653717, 0.00021876394748687744, 0.00022989138960838318, 0.00024101883172988892, 0.00025214627385139465, 0.0002632737159729004, 0.00027440115809440613, 0.00028552860021591187, 0.0002966560423374176, 0.00030778348445892334, 0.0003189109265804291, 0.0003300383687019348, 0.00034116581082344055, 0.0003522932529449463, 0.000363420695066452, 0.00037454813718795776, 0.0003856755793094635, 0.00039680302143096924, 0.000407930463552475, 0.0004190579056739807, 0.00043018534779548645, 0.0004413127899169922]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 11.0, 12.0, 31.0, 35.0, 75.0, 98.0, 219.0, 336.0, 671.0, 1489.0, 3753.0, 12693.0, 53355.0, 311547.0, 552766.0, 84305.0, 18267.0, 5095.0, 1913.0, 812.0, 420.0, 253.0, 143.0, 71.0, 58.0, 37.0, 21.0, 13.0, 10.0, 10.0, 8.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4443359375, -1.39300537109375, -1.3416748046875, -1.29034423828125, -1.239013671875, -1.18768310546875, -1.1363525390625, -1.08502197265625, -1.03369140625, -0.98236083984375, -0.9310302734375, -0.87969970703125, -0.828369140625, -0.77703857421875, -0.7257080078125, -0.67437744140625, -0.623046875, -0.57171630859375, -0.5203857421875, -0.46905517578125, -0.417724609375, -0.36639404296875, -0.3150634765625, -0.26373291015625, -0.21240234375, -0.16107177734375, -0.1097412109375, -0.05841064453125, -0.007080078125, 0.04425048828125, 0.0955810546875, 0.14691162109375, 0.1982421875, 0.24957275390625, 0.3009033203125, 0.35223388671875, 0.403564453125, 0.45489501953125, 0.5062255859375, 0.55755615234375, 0.60888671875, 0.66021728515625, 0.7115478515625, 0.76287841796875, 0.814208984375, 0.86553955078125, 0.9168701171875, 0.96820068359375, 1.01953125, 1.07086181640625, 1.1221923828125, 1.17352294921875, 1.224853515625, 1.27618408203125, 1.3275146484375, 1.37884521484375, 1.43017578125, 1.48150634765625, 1.5328369140625, 1.58416748046875, 1.635498046875, 1.68682861328125, 1.7381591796875, 1.78948974609375, 1.8408203125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 5.0, 9.0, 8.0, 11.0, 15.0, 28.0, 28.0, 35.0, 56.0, 78.0, 112.0, 182.0, 120.0, 92.0, 70.0, 43.0, 29.0, 23.0, 13.0, 9.0, 11.0, 7.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2998046875, -1.2653274536132812, -1.2308502197265625, -1.1963729858398438, -1.161895751953125, -1.1274185180664062, -1.0929412841796875, -1.0584640502929688, -1.02398681640625, -0.9895095825195312, -0.9550323486328125, -0.9205551147460938, -0.886077880859375, -0.8516006469726562, -0.8171234130859375, -0.7826461791992188, -0.7481689453125, -0.7136917114257812, -0.6792144775390625, -0.6447372436523438, -0.610260009765625, -0.5757827758789062, -0.5413055419921875, -0.5068283081054688, -0.47235107421875, -0.43787384033203125, -0.4033966064453125, -0.36891937255859375, -0.334442138671875, -0.29996490478515625, -0.2654876708984375, -0.23101043701171875, -0.196533203125, -0.16205596923828125, -0.1275787353515625, -0.09310150146484375, -0.058624267578125, -0.02414703369140625, 0.0103302001953125, 0.04480743408203125, 0.07928466796875, 0.11376190185546875, 0.1482391357421875, 0.18271636962890625, 0.217193603515625, 0.25167083740234375, 0.2861480712890625, 0.32062530517578125, 0.3551025390625, 0.38957977294921875, 0.4240570068359375, 0.45853424072265625, 0.493011474609375, 0.5274887084960938, 0.5619659423828125, 0.5964431762695312, 0.63092041015625, 0.6653976440429688, 0.6998748779296875, 0.7343521118164062, 0.768829345703125, 0.8033065795898438, 0.8377838134765625, 0.8722610473632812, 0.90673828125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 14.0, 19.0, 54.0, 159.0, 295.0, 257.0, 134.0, 44.0, 16.0, 11.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.016429901123047, -15.93708610534668, -14.857741355895996, -13.778396606445312, -12.699052810668945, -11.619709014892578, -10.540364265441895, -9.461019515991211, -8.381675720214844, -7.302331447601318, -6.222987174987793, -5.143642902374268, -4.064298629760742, -2.984954357147217, -1.9056100845336914, -0.826265811920166, 0.2530784606933594, 1.3324227333068848, 2.41176700592041, 3.4911112785339355, 4.570455551147461, 5.649799823760986, 6.729144096374512, 7.808488368988037, 8.887832641601562, 9.96717643737793, 11.046521186828613, 12.125865936279297, 13.205209732055664, 14.284553527832031, 15.363898277282715, 16.4432430267334, 17.522586822509766, 18.601930618286133, 19.6812744140625, 20.7606201171875, 21.839963912963867, 22.919307708740234, 23.998653411865234, 25.0779972076416, 26.15734100341797, 27.236684799194336, 28.316028594970703, 29.395374298095703, 30.47471809387207, 31.554061889648438, 32.63340759277344, 33.71274948120117, 34.79209518432617, 35.87144088745117, 36.950782775878906, 38.030128479003906, 39.109474182128906, 40.18881607055664, 41.26816177368164, 42.347503662109375, 43.426849365234375, 44.506195068359375, 45.58553695678711, 46.66488265991211, 47.744224548339844, 48.823570251464844, 49.902915954589844, 50.98225784301758, 52.06160354614258]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 5.0, 7.0, 7.0, 9.0, 10.0, 8.0, 12.0, 15.0, 17.0, 16.0, 18.0, 24.0, 27.0, 37.0, 34.0, 40.0, 30.0, 35.0, 42.0, 39.0, 41.0, 46.0, 38.0, 34.0, 39.0, 40.0, 33.0, 34.0, 32.0, 42.0, 40.0, 22.0, 18.0, 14.0, 15.0, 16.0, 12.0, 12.0, 11.0, 7.0, 6.0, 2.0, 3.0, 4.0, 5.0, 1.0, 2.0, 6.0, 3.0, 2.0], "bins": [-15.458958625793457, -15.028923034667969, -14.59888744354248, -14.168851852416992, -13.73881721496582, -13.308780670166016, -12.878746032714844, -12.448710441589355, -12.018674850463867, -11.588639259338379, -11.15860366821289, -10.728568077087402, -10.298532485961914, -9.868497848510742, -9.438462257385254, -9.008426666259766, -8.578391075134277, -8.148355484008789, -7.718319892883301, -7.288284778594971, -6.858249187469482, -6.428213596343994, -5.998178482055664, -5.568142890930176, -5.1381072998046875, -4.708071708679199, -4.278036117553711, -3.848001003265381, -3.4179654121398926, -2.9879298210144043, -2.557894468307495, -2.127859115600586, -1.6978235244750977, -1.267788052558899, -0.8377525806427002, -0.40771710872650146, 0.022318363189697266, 0.45235395431518555, 0.8823893070220947, 1.312424659729004, 1.7424602508544922, 2.1724958419799805, 2.6025311946868896, 3.032566547393799, 3.462602138519287, 3.8926377296447754, 4.3226728439331055, 4.752708435058594, 5.182744026184082, 5.61277961730957, 6.042815208435059, 6.472850322723389, 6.902885913848877, 7.332921504974365, 7.762956619262695, 8.192992210388184, 8.623027801513672, 9.05306339263916, 9.483098983764648, 9.913134574890137, 10.343170166015625, 10.773204803466797, 11.203240394592285, 11.633275985717773, 12.063311576843262]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 12.0, 10.0, 21.0, 21.0, 43.0, 30.0, 58.0, 62.0, 104.0, 149.0, 240.0, 414.0, 537.0, 929.0, 1642.0, 2999.0, 6415.0, 15424.0, 47832.0, 208281.0, 1242275.0, 2137913.0, 408408.0, 79385.0, 22779.0, 8915.0, 4176.0, 2112.0, 1204.0, 679.0, 392.0, 240.0, 156.0, 105.0, 90.0, 79.0, 39.0, 24.0, 33.0, 12.0, 14.0, 11.0, 8.0, 3.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.26171875, -5.093017578125, -4.92431640625, -4.755615234375, -4.5869140625, -4.418212890625, -4.24951171875, -4.080810546875, -3.912109375, -3.743408203125, -3.57470703125, -3.406005859375, -3.2373046875, -3.068603515625, -2.89990234375, -2.731201171875, -2.5625, -2.393798828125, -2.22509765625, -2.056396484375, -1.8876953125, -1.718994140625, -1.55029296875, -1.381591796875, -1.212890625, -1.044189453125, -0.87548828125, -0.706787109375, -0.5380859375, -0.369384765625, -0.20068359375, -0.031982421875, 0.13671875, 0.305419921875, 0.47412109375, 0.642822265625, 0.8115234375, 0.980224609375, 1.14892578125, 1.317626953125, 1.486328125, 1.655029296875, 1.82373046875, 1.992431640625, 2.1611328125, 2.329833984375, 2.49853515625, 2.667236328125, 2.8359375, 3.004638671875, 3.17333984375, 3.342041015625, 3.5107421875, 3.679443359375, 3.84814453125, 4.016845703125, 4.185546875, 4.354248046875, 4.52294921875, 4.691650390625, 4.8603515625, 5.029052734375, 5.19775390625, 5.366455078125, 5.53515625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 4.0, 6.0, 9.0, 12.0, 14.0, 19.0, 20.0, 36.0, 25.0, 45.0, 46.0, 72.0, 68.0, 72.0, 62.0, 75.0, 79.0, 63.0, 46.0, 44.0, 35.0, 34.0, 19.0, 22.0, 11.0, 15.0, 12.0, 6.0, 8.0, 9.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-7.75390625, -7.5687255859375, -7.383544921875, -7.1983642578125, -7.01318359375, -6.8280029296875, -6.642822265625, -6.4576416015625, -6.2724609375, -6.0872802734375, -5.902099609375, -5.7169189453125, -5.53173828125, -5.3465576171875, -5.161376953125, -4.9761962890625, -4.791015625, -4.6058349609375, -4.420654296875, -4.2354736328125, -4.05029296875, -3.8651123046875, -3.679931640625, -3.4947509765625, -3.3095703125, -3.1243896484375, -2.939208984375, -2.7540283203125, -2.56884765625, -2.3836669921875, -2.198486328125, -2.0133056640625, -1.828125, -1.6429443359375, -1.457763671875, -1.2725830078125, -1.08740234375, -0.9022216796875, -0.717041015625, -0.5318603515625, -0.3466796875, -0.1614990234375, 0.023681640625, 0.2088623046875, 0.39404296875, 0.5792236328125, 0.764404296875, 0.9495849609375, 1.134765625, 1.3199462890625, 1.505126953125, 1.6903076171875, 1.87548828125, 2.0606689453125, 2.245849609375, 2.4310302734375, 2.6162109375, 2.8013916015625, 2.986572265625, 3.1717529296875, 3.35693359375, 3.5421142578125, 3.727294921875, 3.9124755859375, 4.09765625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 3.0, 6.0, 6.0, 15.0, 10.0, 11.0, 20.0, 28.0, 38.0, 57.0, 79.0, 123.0, 189.0, 357.0, 625.0, 1259.0, 2841.0, 8037.0, 29156.0, 166925.0, 2733440.0, 1134903.0, 87854.0, 18285.0, 5546.0, 2124.0, 982.0, 503.0, 298.0, 191.0, 109.0, 73.0, 52.0, 30.0, 25.0, 17.0, 7.0, 11.0, 8.0, 11.0, 6.0, 8.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.1015625, -6.88531494140625, -6.6690673828125, -6.45281982421875, -6.236572265625, -6.02032470703125, -5.8040771484375, -5.58782958984375, -5.37158203125, -5.15533447265625, -4.9390869140625, -4.72283935546875, -4.506591796875, -4.29034423828125, -4.0740966796875, -3.85784912109375, -3.6416015625, -3.42535400390625, -3.2091064453125, -2.99285888671875, -2.776611328125, -2.56036376953125, -2.3441162109375, -2.12786865234375, -1.91162109375, -1.69537353515625, -1.4791259765625, -1.26287841796875, -1.046630859375, -0.83038330078125, -0.6141357421875, -0.39788818359375, -0.181640625, 0.03460693359375, 0.2508544921875, 0.46710205078125, 0.683349609375, 0.89959716796875, 1.1158447265625, 1.33209228515625, 1.54833984375, 1.76458740234375, 1.9808349609375, 2.19708251953125, 2.413330078125, 2.62957763671875, 2.8458251953125, 3.06207275390625, 3.2783203125, 3.49456787109375, 3.7108154296875, 3.92706298828125, 4.143310546875, 4.35955810546875, 4.5758056640625, 4.79205322265625, 5.00830078125, 5.22454833984375, 5.4407958984375, 5.65704345703125, 5.873291015625, 6.08953857421875, 6.3057861328125, 6.52203369140625, 6.73828125]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 2.0, 5.0, 7.0, 3.0, 7.0, 14.0, 23.0, 23.0, 27.0, 29.0, 40.0, 61.0, 100.0, 130.0, 177.0, 285.0, 403.0, 504.0, 609.0, 418.0, 362.0, 258.0, 173.0, 101.0, 76.0, 54.0, 40.0, 37.0, 22.0, 8.0, 18.0, 13.0, 8.0, 11.0, 6.0, 7.0, 2.0, 1.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.984375, -1.926544189453125, -1.86871337890625, -1.810882568359375, -1.7530517578125, -1.695220947265625, -1.63739013671875, -1.579559326171875, -1.521728515625, -1.463897705078125, -1.40606689453125, -1.348236083984375, -1.2904052734375, -1.232574462890625, -1.17474365234375, -1.116912841796875, -1.05908203125, -1.001251220703125, -0.94342041015625, -0.885589599609375, -0.8277587890625, -0.769927978515625, -0.71209716796875, -0.654266357421875, -0.596435546875, -0.538604736328125, -0.48077392578125, -0.422943115234375, -0.3651123046875, -0.307281494140625, -0.24945068359375, -0.191619873046875, -0.1337890625, -0.075958251953125, -0.01812744140625, 0.039703369140625, 0.0975341796875, 0.155364990234375, 0.21319580078125, 0.271026611328125, 0.328857421875, 0.386688232421875, 0.44451904296875, 0.502349853515625, 0.5601806640625, 0.618011474609375, 0.67584228515625, 0.733673095703125, 0.79150390625, 0.849334716796875, 0.90716552734375, 0.964996337890625, 1.0228271484375, 1.080657958984375, 1.13848876953125, 1.196319580078125, 1.254150390625, 1.311981201171875, 1.36981201171875, 1.427642822265625, 1.4854736328125, 1.543304443359375, 1.60113525390625, 1.658966064453125, 1.716796875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 6.0, 14.0, 16.0, 21.0, 30.0, 52.0, 55.0, 82.0, 101.0, 105.0, 117.0, 99.0, 79.0, 62.0, 50.0, 35.0, 28.0, 14.0, 14.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.844393730163574, -12.55201244354248, -12.259631156921387, -11.967248916625977, -11.674867630004883, -11.382486343383789, -11.090105056762695, -10.797723770141602, -10.505342483520508, -10.212961196899414, -9.92057991027832, -9.62819766998291, -9.335816383361816, -9.043435096740723, -8.751053810119629, -8.458672523498535, -8.166290283203125, -7.873908996582031, -7.581527233123779, -7.2891459465026855, -6.996764183044434, -6.70438289642334, -6.412001609802246, -6.119620323181152, -5.8272385597229, -5.534857273101807, -5.242475509643555, -4.950094223022461, -4.657712936401367, -4.365331172943115, -4.0729498863220215, -3.7805683612823486, -3.4881863594055176, -3.1958048343658447, -2.903423309326172, -2.611042022705078, -2.3186604976654053, -2.0262789726257324, -1.7338975667953491, -1.4415161609649658, -1.149134635925293, -0.8567531704902649, -0.5643717050552368, -0.27199023962020874, 0.020391225814819336, 0.3127727508544922, 0.6051541566848755, 0.8975355625152588, 1.1899170875549316, 1.4822986125946045, 1.7746800184249878, 2.067061424255371, 2.359442949295044, 2.651824474334717, 2.9442057609558105, 3.2365872859954834, 3.5289688110351562, 3.821350336074829, 4.113731861114502, 4.406113147735596, 4.698494911193848, 4.990876197814941, 5.283257484436035, 5.575638771057129, 5.868020534515381]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 5.0, 2.0, 3.0, 7.0, 6.0, 10.0, 12.0, 15.0, 21.0, 13.0, 24.0, 31.0, 17.0, 35.0, 43.0, 28.0, 45.0, 29.0, 54.0, 48.0, 45.0, 60.0, 49.0, 45.0, 36.0, 41.0, 36.0, 26.0, 24.0, 35.0, 16.0, 27.0, 17.0, 16.0, 15.0, 16.0, 11.0, 9.0, 6.0, 5.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0], "bins": [-5.671573162078857, -5.520415782928467, -5.369258880615234, -5.218101501464844, -5.066944122314453, -4.9157867431640625, -4.76462984085083, -4.6134724617004395, -4.462315082550049, -4.311157703399658, -4.160000801086426, -4.008843421936035, -3.8576860427856445, -3.706528902053833, -3.5553717613220215, -3.404214382171631, -3.2530572414398193, -3.101900100708008, -2.950742721557617, -2.7995855808258057, -2.648428201675415, -2.4972710609436035, -2.346113681793213, -2.1949565410614014, -2.04379940032959, -1.8926421403884888, -1.7414848804473877, -1.5903277397155762, -1.4391703605651855, -1.288013219833374, -1.136855959892273, -0.9856986999511719, -0.8345413208007812, -0.6833840608596802, -0.5322268009185791, -0.3810696005821228, -0.22991234064102173, -0.07875508069992065, 0.07240211963653564, 0.22355937957763672, 0.3747166395187378, 0.5258738994598389, 0.6770311594009399, 0.8281883597373962, 0.9793456196784973, 1.1305029392242432, 1.2816600799560547, 1.4328173398971558, 1.5839745998382568, 1.735131859779358, 1.886289119720459, 2.0374462604522705, 2.188603639602661, 2.3397607803344727, 2.4909181594848633, 2.642075300216675, 2.7932324409484863, 2.944389581680298, 3.0955469608306885, 3.2467041015625, 3.3978614807128906, 3.549018621444702, 3.7001757621765137, 3.8513331413269043, 4.002490520477295]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 10.0, 9.0, 18.0, 28.0, 29.0, 45.0, 74.0, 107.0, 144.0, 222.0, 404.0, 538.0, 976.0, 1721.0, 2978.0, 5501.0, 10764.0, 22969.0, 56052.0, 158821.0, 365414.0, 262419.0, 91991.0, 34855.0, 15352.0, 7500.0, 4014.0, 2260.0, 1290.0, 722.0, 432.0, 322.0, 173.0, 130.0, 79.0, 69.0, 27.0, 23.0, 21.0, 12.0, 9.0, 8.0, 4.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.2236328125, -1.18841552734375, -1.1531982421875, -1.11798095703125, -1.082763671875, -1.04754638671875, -1.0123291015625, -0.97711181640625, -0.94189453125, -0.90667724609375, -0.8714599609375, -0.83624267578125, -0.801025390625, -0.76580810546875, -0.7305908203125, -0.69537353515625, -0.66015625, -0.62493896484375, -0.5897216796875, -0.55450439453125, -0.519287109375, -0.48406982421875, -0.4488525390625, -0.41363525390625, -0.37841796875, -0.34320068359375, -0.3079833984375, -0.27276611328125, -0.237548828125, -0.20233154296875, -0.1671142578125, -0.13189697265625, -0.0966796875, -0.06146240234375, -0.0262451171875, 0.00897216796875, 0.044189453125, 0.07940673828125, 0.1146240234375, 0.14984130859375, 0.18505859375, 0.22027587890625, 0.2554931640625, 0.29071044921875, 0.325927734375, 0.36114501953125, 0.3963623046875, 0.43157958984375, 0.466796875, 0.50201416015625, 0.5372314453125, 0.57244873046875, 0.607666015625, 0.64288330078125, 0.6781005859375, 0.71331787109375, 0.74853515625, 0.78375244140625, 0.8189697265625, 0.85418701171875, 0.889404296875, 0.92462158203125, 0.9598388671875, 0.99505615234375, 1.0302734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 6.0, 6.0, 1.0, 7.0, 6.0, 9.0, 13.0, 13.0, 24.0, 30.0, 28.0, 38.0, 28.0, 37.0, 38.0, 32.0, 59.0, 39.0, 54.0, 42.0, 66.0, 54.0, 45.0, 43.0, 41.0, 33.0, 29.0, 19.0, 23.0, 28.0, 21.0, 15.0, 9.0, 9.0, 11.0, 12.0, 10.0, 7.0, 3.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0], "bins": [-3.96484375, -3.86175537109375, -3.7586669921875, -3.65557861328125, -3.552490234375, -3.44940185546875, -3.3463134765625, -3.24322509765625, -3.14013671875, -3.03704833984375, -2.9339599609375, -2.83087158203125, -2.727783203125, -2.62469482421875, -2.5216064453125, -2.41851806640625, -2.3154296875, -2.21234130859375, -2.1092529296875, -2.00616455078125, -1.903076171875, -1.79998779296875, -1.6968994140625, -1.59381103515625, -1.49072265625, -1.38763427734375, -1.2845458984375, -1.18145751953125, -1.078369140625, -0.97528076171875, -0.8721923828125, -0.76910400390625, -0.666015625, -0.56292724609375, -0.4598388671875, -0.35675048828125, -0.253662109375, -0.15057373046875, -0.0474853515625, 0.05560302734375, 0.15869140625, 0.26177978515625, 0.3648681640625, 0.46795654296875, 0.571044921875, 0.67413330078125, 0.7772216796875, 0.88031005859375, 0.9833984375, 1.08648681640625, 1.1895751953125, 1.29266357421875, 1.395751953125, 1.49884033203125, 1.6019287109375, 1.70501708984375, 1.80810546875, 1.91119384765625, 2.0142822265625, 2.11737060546875, 2.220458984375, 2.32354736328125, 2.4266357421875, 2.52972412109375, 2.6328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 10.0, 11.0, 24.0, 32.0, 32.0, 55.0, 133.0, 192.0, 434.0, 897.0, 2480.0, 8365.0, 42248.0, 403794.0, 519757.0, 54876.0, 10240.0, 2882.0, 1069.0, 444.0, 258.0, 120.0, 69.0, 45.0, 30.0, 19.0, 7.0, 8.0, 4.0, 8.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.25, -2.179840087890625, -2.10968017578125, -2.039520263671875, -1.9693603515625, -1.899200439453125, -1.82904052734375, -1.758880615234375, -1.688720703125, -1.618560791015625, -1.54840087890625, -1.478240966796875, -1.4080810546875, -1.337921142578125, -1.26776123046875, -1.197601318359375, -1.12744140625, -1.057281494140625, -0.98712158203125, -0.916961669921875, -0.8468017578125, -0.776641845703125, -0.70648193359375, -0.636322021484375, -0.566162109375, -0.496002197265625, -0.42584228515625, -0.355682373046875, -0.2855224609375, -0.215362548828125, -0.14520263671875, -0.075042724609375, -0.0048828125, 0.065277099609375, 0.13543701171875, 0.205596923828125, 0.2757568359375, 0.345916748046875, 0.41607666015625, 0.486236572265625, 0.556396484375, 0.626556396484375, 0.69671630859375, 0.766876220703125, 0.8370361328125, 0.907196044921875, 0.97735595703125, 1.047515869140625, 1.11767578125, 1.187835693359375, 1.25799560546875, 1.328155517578125, 1.3983154296875, 1.468475341796875, 1.53863525390625, 1.608795166015625, 1.678955078125, 1.749114990234375, 1.81927490234375, 1.889434814453125, 1.9595947265625, 2.029754638671875, 2.09991455078125, 2.170074462890625, 2.240234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 7.0, 7.0, 10.0, 9.0, 8.0, 15.0, 20.0, 22.0, 20.0, 21.0, 25.0, 30.0, 36.0, 32.0, 38.0, 39.0, 45.0, 40.0, 39.0, 44.0, 40.0, 43.0, 52.0, 37.0, 39.0, 38.0, 37.0, 23.0, 27.0, 25.0, 25.0, 17.0, 12.0, 14.0, 7.0, 13.0, 7.0, 7.0, 3.0, 5.0, 3.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.58203125, -6.3780517578125, -6.174072265625, -5.9700927734375, -5.76611328125, -5.5621337890625, -5.358154296875, -5.1541748046875, -4.9501953125, -4.7462158203125, -4.542236328125, -4.3382568359375, -4.13427734375, -3.9302978515625, -3.726318359375, -3.5223388671875, -3.318359375, -3.1143798828125, -2.910400390625, -2.7064208984375, -2.50244140625, -2.2984619140625, -2.094482421875, -1.8905029296875, -1.6865234375, -1.4825439453125, -1.278564453125, -1.0745849609375, -0.87060546875, -0.6666259765625, -0.462646484375, -0.2586669921875, -0.0546875, 0.1492919921875, 0.353271484375, 0.5572509765625, 0.76123046875, 0.9652099609375, 1.169189453125, 1.3731689453125, 1.5771484375, 1.7811279296875, 1.985107421875, 2.1890869140625, 2.39306640625, 2.5970458984375, 2.801025390625, 3.0050048828125, 3.208984375, 3.4129638671875, 3.616943359375, 3.8209228515625, 4.02490234375, 4.2288818359375, 4.432861328125, 4.6368408203125, 4.8408203125, 5.0447998046875, 5.248779296875, 5.4527587890625, 5.65673828125, 5.8607177734375, 6.064697265625, 6.2686767578125, 6.47265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 13.0, 10.0, 15.0, 37.0, 60.0, 91.0, 221.0, 396.0, 923.0, 2254.0, 6575.0, 26455.0, 288077.0, 648350.0, 58939.0, 10373.0, 3267.0, 1244.0, 607.0, 270.0, 145.0, 95.0, 47.0, 26.0, 20.0, 12.0, 8.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0400390625, -1.0055999755859375, -0.971160888671875, -0.9367218017578125, -0.90228271484375, -0.8678436279296875, -0.833404541015625, -0.7989654541015625, -0.7645263671875, -0.7300872802734375, -0.695648193359375, -0.6612091064453125, -0.62677001953125, -0.5923309326171875, -0.557891845703125, -0.5234527587890625, -0.489013671875, -0.4545745849609375, -0.420135498046875, -0.3856964111328125, -0.35125732421875, -0.3168182373046875, -0.282379150390625, -0.2479400634765625, -0.2135009765625, -0.1790618896484375, -0.144622802734375, -0.1101837158203125, -0.07574462890625, -0.0413055419921875, -0.006866455078125, 0.0275726318359375, 0.06201171875, 0.0964508056640625, 0.130889892578125, 0.1653289794921875, 0.19976806640625, 0.2342071533203125, 0.268646240234375, 0.3030853271484375, 0.3375244140625, 0.3719635009765625, 0.406402587890625, 0.4408416748046875, 0.47528076171875, 0.5097198486328125, 0.544158935546875, 0.5785980224609375, 0.613037109375, 0.6474761962890625, 0.681915283203125, 0.7163543701171875, 0.75079345703125, 0.7852325439453125, 0.819671630859375, 0.8541107177734375, 0.8885498046875, 0.9229888916015625, 0.957427978515625, 0.9918670654296875, 1.02630615234375, 1.0607452392578125, 1.095184326171875, 1.1296234130859375, 1.1640625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 8.0, 4.0, 8.0, 18.0, 43.0, 66.0, 116.0, 159.0, 178.0, 158.0, 95.0, 61.0, 35.0, 16.0, 13.0, 6.0, 8.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002727508544921875, -0.00025791674852371216, -0.00024308264255523682, -0.00022824853658676147, -0.00021341443061828613, -0.0001985803246498108, -0.00018374621868133545, -0.0001689121127128601, -0.00015407800674438477, -0.00013924390077590942, -0.00012440979480743408, -0.00010957568883895874, -9.47415828704834e-05, -7.990747690200806e-05, -6.507337093353271e-05, -5.023926496505737e-05, -3.540515899658203e-05, -2.057105302810669e-05, -5.736947059631348e-06, 9.097158908843994e-06, 2.3931264877319336e-05, 3.876537084579468e-05, 5.359947681427002e-05, 6.843358278274536e-05, 8.32676887512207e-05, 9.810179471969604e-05, 0.00011293590068817139, 0.00012777000665664673, 0.00014260411262512207, 0.0001574382185935974, 0.00017227232456207275, 0.0001871064305305481, 0.00020194053649902344, 0.00021677464246749878, 0.00023160874843597412, 0.00024644285440444946, 0.0002612769603729248, 0.00027611106634140015, 0.0002909451723098755, 0.00030577927827835083, 0.00032061338424682617, 0.0003354474902153015, 0.00035028159618377686, 0.0003651157021522522, 0.00037994980812072754, 0.0003947839140892029, 0.0004096180200576782, 0.00042445212602615356, 0.0004392862319946289, 0.00045412033796310425, 0.0004689544439315796, 0.00048378854990005493, 0.0004986226558685303, 0.0005134567618370056, 0.000528290867805481, 0.0005431249737739563, 0.0005579590797424316, 0.000572793185710907, 0.0005876272916793823, 0.0006024613976478577, 0.000617295503616333, 0.0006321296095848083, 0.0006469637155532837, 0.000661797821521759, 0.0006766319274902344]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 9.0, 12.0, 11.0, 18.0, 22.0, 39.0, 56.0, 77.0, 119.0, 213.0, 406.0, 815.0, 1576.0, 3369.0, 7639.0, 20177.0, 70229.0, 311450.0, 457785.0, 123375.0, 31312.0, 10828.0, 4603.0, 2090.0, 1018.0, 554.0, 283.0, 170.0, 85.0, 63.0, 53.0, 27.0, 16.0, 14.0, 4.0, 7.0, 4.0, 6.0, 5.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5888671875, -0.5679779052734375, -0.547088623046875, -0.5261993408203125, -0.50531005859375, -0.4844207763671875, -0.463531494140625, -0.4426422119140625, -0.4217529296875, -0.4008636474609375, -0.379974365234375, -0.3590850830078125, -0.33819580078125, -0.3173065185546875, -0.296417236328125, -0.2755279541015625, -0.254638671875, -0.2337493896484375, -0.212860107421875, -0.1919708251953125, -0.17108154296875, -0.1501922607421875, -0.129302978515625, -0.1084136962890625, -0.0875244140625, -0.0666351318359375, -0.045745849609375, -0.0248565673828125, -0.00396728515625, 0.0169219970703125, 0.037811279296875, 0.0587005615234375, 0.07958984375, 0.1004791259765625, 0.121368408203125, 0.1422576904296875, 0.16314697265625, 0.1840362548828125, 0.204925537109375, 0.2258148193359375, 0.2467041015625, 0.2675933837890625, 0.288482666015625, 0.3093719482421875, 0.33026123046875, 0.3511505126953125, 0.372039794921875, 0.3929290771484375, 0.413818359375, 0.4347076416015625, 0.455596923828125, 0.4764862060546875, 0.49737548828125, 0.5182647705078125, 0.539154052734375, 0.5600433349609375, 0.5809326171875, 0.6018218994140625, 0.622711181640625, 0.6436004638671875, 0.66448974609375, 0.6853790283203125, 0.706268310546875, 0.7271575927734375, 0.748046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 5.0, 9.0, 10.0, 10.0, 13.0, 18.0, 30.0, 37.0, 50.0, 57.0, 80.0, 110.0, 114.0, 97.0, 84.0, 80.0, 43.0, 32.0, 26.0, 17.0, 10.0, 13.0, 7.0, 7.0, 3.0, 4.0, 5.0, 2.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.24755859375, -0.2401905059814453, -0.23282241821289062, -0.22545433044433594, -0.21808624267578125, -0.21071815490722656, -0.20335006713867188, -0.1959819793701172, -0.1886138916015625, -0.1812458038330078, -0.17387771606445312, -0.16650962829589844, -0.15914154052734375, -0.15177345275878906, -0.14440536499023438, -0.1370372772216797, -0.129669189453125, -0.12230110168457031, -0.11493301391601562, -0.10756492614746094, -0.10019683837890625, -0.09282875061035156, -0.08546066284179688, -0.07809257507324219, -0.0707244873046875, -0.06335639953613281, -0.055988311767578125, -0.04862022399902344, -0.04125213623046875, -0.03388404846191406, -0.026515960693359375, -0.019147872924804688, -0.01177978515625, -0.0044116973876953125, 0.002956390380859375, 0.010324478149414062, 0.01769256591796875, 0.025060653686523438, 0.032428741455078125, 0.03979682922363281, 0.0471649169921875, 0.05453300476074219, 0.061901092529296875, 0.06926918029785156, 0.07663726806640625, 0.08400535583496094, 0.09137344360351562, 0.09874153137207031, 0.106109619140625, 0.11347770690917969, 0.12084579467773438, 0.12821388244628906, 0.13558197021484375, 0.14295005798339844, 0.15031814575195312, 0.1576862335205078, 0.1650543212890625, 0.1724224090576172, 0.17979049682617188, 0.18715858459472656, 0.19452667236328125, 0.20189476013183594, 0.20926284790039062, 0.2166309356689453, 0.2239990234375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 5.0, 5.0, 6.0, 12.0, 25.0, 18.0, 34.0, 44.0, 66.0, 84.0, 113.0, 105.0, 116.0, 98.0, 80.0, 60.0, 36.0, 34.0, 19.0, 17.0, 10.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.8193159103393555, -7.640412330627441, -7.461508750915527, -7.282605171203613, -7.103701591491699, -6.924798011779785, -6.745894432067871, -6.566991329193115, -6.388087749481201, -6.209184169769287, -6.030280590057373, -5.851377010345459, -5.672473430633545, -5.493570327758789, -5.314666748046875, -5.135763168334961, -4.956859588623047, -4.777956008911133, -4.599052429199219, -4.420148849487305, -4.241245269775391, -4.062341690063477, -3.8834383487701416, -3.7045350074768066, -3.5256309509277344, -3.3467273712158203, -3.1678237915039062, -2.988920211791992, -2.8100168704986572, -2.631113290786743, -2.452209711074829, -2.273306369781494, -2.094403028488159, -1.9154994487762451, -1.7365959882736206, -1.5576924085617065, -1.378788948059082, -1.199885368347168, -1.020981788635254, -0.8420783281326294, -0.6631747484207153, -0.48427122831344604, -0.30536767840385437, -0.1264641284942627, 0.05243939161300659, 0.23134291172027588, 0.41024649143218994, 0.5891499519348145, 0.7680535316467285, 0.9469570517539978, 1.125860571861267, 1.3047641515731812, 1.4836676120758057, 1.6625711917877197, 1.8414747714996338, 2.0203781127929688, 2.199281692504883, 2.378185272216797, 2.557088851928711, 2.735992431640625, 2.91489577293396, 3.093799352645874, 3.272702932357788, 3.451606273651123, 3.630510091781616]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 2.0, 7.0, 5.0, 9.0, 6.0, 17.0, 19.0, 20.0, 25.0, 32.0, 31.0, 31.0, 33.0, 42.0, 58.0, 56.0, 58.0, 42.0, 53.0, 55.0, 56.0, 39.0, 42.0, 48.0, 31.0, 20.0, 34.0, 22.0, 21.0, 22.0, 16.0, 8.0, 10.0, 5.0, 6.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.103898048400879, -3.996190071105957, -3.888482093811035, -3.7807741165161133, -3.6730661392211914, -3.5653581619262695, -3.4576501846313477, -3.349942207336426, -3.242234230041504, -3.134526252746582, -3.02681827545166, -2.9191102981567383, -2.8114023208618164, -2.7036943435668945, -2.5959863662719727, -2.488278388977051, -2.38057017326355, -2.272862195968628, -2.165154218673706, -2.057446241378784, -1.9497382640838623, -1.8420302867889404, -1.734322190284729, -1.6266142129898071, -1.5189062356948853, -1.4111982583999634, -1.3034902811050415, -1.19578218460083, -1.0880742073059082, -0.9803662896156311, -0.8726582527160645, -0.7649502754211426, -0.6572425365447998, -0.5495345592498779, -0.44182655215263367, -0.3341185450553894, -0.22641056776046753, -0.11870259046554565, -0.010994553565979004, 0.09671342372894287, 0.20442140102386475, 0.3121293783187866, 0.4198373854160309, 0.5275453925132751, 0.635253369808197, 0.7429613471031189, 0.8506693840026855, 0.9583773612976074, 1.0660853385925293, 1.1737933158874512, 1.281501293182373, 1.389209270477295, 1.4969172477722168, 1.6046252250671387, 1.71233332157135, 1.820041298866272, 1.9277492761611938, 2.0354573726654053, 2.143165349960327, 2.250873327255249, 2.358581304550171, 2.4662892818450928, 2.5739972591400146, 2.6817052364349365, 2.7894132137298584]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 2.0, 6.0, 8.0, 10.0, 13.0, 27.0, 21.0, 41.0, 52.0, 70.0, 133.0, 203.0, 331.0, 552.0, 872.0, 1855.0, 3734.0, 8282.0, 21228.0, 69279.0, 480900.0, 368717.0, 58525.0, 18931.0, 7488.0, 3283.0, 1661.0, 933.0, 488.0, 318.0, 196.0, 127.0, 80.0, 54.0, 39.0, 23.0, 25.0, 15.0, 8.0, 10.0, 8.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9453125, -3.81353759765625, -3.6817626953125, -3.54998779296875, -3.418212890625, -3.28643798828125, -3.1546630859375, -3.02288818359375, -2.89111328125, -2.75933837890625, -2.6275634765625, -2.49578857421875, -2.364013671875, -2.23223876953125, -2.1004638671875, -1.96868896484375, -1.8369140625, -1.70513916015625, -1.5733642578125, -1.44158935546875, -1.309814453125, -1.17803955078125, -1.0462646484375, -0.91448974609375, -0.78271484375, -0.65093994140625, -0.5191650390625, -0.38739013671875, -0.255615234375, -0.12384033203125, 0.0079345703125, 0.13970947265625, 0.271484375, 0.40325927734375, 0.5350341796875, 0.66680908203125, 0.798583984375, 0.93035888671875, 1.0621337890625, 1.19390869140625, 1.32568359375, 1.45745849609375, 1.5892333984375, 1.72100830078125, 1.852783203125, 1.98455810546875, 2.1163330078125, 2.24810791015625, 2.3798828125, 2.51165771484375, 2.6434326171875, 2.77520751953125, 2.906982421875, 3.03875732421875, 3.1705322265625, 3.30230712890625, 3.43408203125, 3.56585693359375, 3.6976318359375, 3.82940673828125, 3.961181640625, 4.09295654296875, 4.2247314453125, 4.35650634765625, 4.48828125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 7.0, 3.0, 2.0, 5.0, 8.0, 12.0, 19.0, 15.0, 20.0, 32.0, 27.0, 24.0, 25.0, 43.0, 41.0, 44.0, 39.0, 42.0, 51.0, 51.0, 48.0, 44.0, 40.0, 43.0, 44.0, 35.0, 33.0, 28.0, 29.0, 17.0, 24.0, 23.0, 12.0, 14.0, 8.0, 7.0, 6.0, 7.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.3203125, -6.12615966796875, -5.9320068359375, -5.73785400390625, -5.543701171875, -5.34954833984375, -5.1553955078125, -4.96124267578125, -4.76708984375, -4.57293701171875, -4.3787841796875, -4.18463134765625, -3.990478515625, -3.79632568359375, -3.6021728515625, -3.40802001953125, -3.2138671875, -3.01971435546875, -2.8255615234375, -2.63140869140625, -2.437255859375, -2.24310302734375, -2.0489501953125, -1.85479736328125, -1.66064453125, -1.46649169921875, -1.2723388671875, -1.07818603515625, -0.884033203125, -0.68988037109375, -0.4957275390625, -0.30157470703125, -0.107421875, 0.08673095703125, 0.2808837890625, 0.47503662109375, 0.669189453125, 0.86334228515625, 1.0574951171875, 1.25164794921875, 1.44580078125, 1.63995361328125, 1.8341064453125, 2.02825927734375, 2.222412109375, 2.41656494140625, 2.6107177734375, 2.80487060546875, 2.9990234375, 3.19317626953125, 3.3873291015625, 3.58148193359375, 3.775634765625, 3.96978759765625, 4.1639404296875, 4.35809326171875, 4.55224609375, 4.74639892578125, 4.9405517578125, 5.13470458984375, 5.328857421875, 5.52301025390625, 5.7171630859375, 5.91131591796875, 6.10546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 1.0, 5.0, 9.0, 2.0, 5.0, 14.0, 10.0, 16.0, 16.0, 30.0, 30.0, 39.0, 53.0, 71.0, 140.0, 442.0, 3173.0, 83761.0, 944496.0, 14394.0, 1175.0, 254.0, 112.0, 64.0, 46.0, 36.0, 30.0, 26.0, 17.0, 21.0, 12.0, 14.0, 13.0, 7.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-16.140625, -15.669677734375, -15.19873046875, -14.727783203125, -14.2568359375, -13.785888671875, -13.31494140625, -12.843994140625, -12.373046875, -11.902099609375, -11.43115234375, -10.960205078125, -10.4892578125, -10.018310546875, -9.54736328125, -9.076416015625, -8.60546875, -8.134521484375, -7.66357421875, -7.192626953125, -6.7216796875, -6.250732421875, -5.77978515625, -5.308837890625, -4.837890625, -4.366943359375, -3.89599609375, -3.425048828125, -2.9541015625, -2.483154296875, -2.01220703125, -1.541259765625, -1.0703125, -0.599365234375, -0.12841796875, 0.342529296875, 0.8134765625, 1.284423828125, 1.75537109375, 2.226318359375, 2.697265625, 3.168212890625, 3.63916015625, 4.110107421875, 4.5810546875, 5.052001953125, 5.52294921875, 5.993896484375, 6.46484375, 6.935791015625, 7.40673828125, 7.877685546875, 8.3486328125, 8.819580078125, 9.29052734375, 9.761474609375, 10.232421875, 10.703369140625, 11.17431640625, 11.645263671875, 12.1162109375, 12.587158203125, 13.05810546875, 13.529052734375, 14.0]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 2.0, 6.0, 4.0, 8.0, 9.0, 9.0, 14.0, 17.0, 13.0, 18.0, 23.0, 35.0, 46.0, 42.0, 36.0, 44.0, 46.0, 40.0, 52.0, 53.0, 65.0, 46.0, 55.0, 43.0, 31.0, 32.0, 37.0, 34.0, 27.0, 22.0, 12.0, 18.0, 16.0, 11.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0], "bins": [-10.4921875, -10.1942138671875, -9.896240234375, -9.5982666015625, -9.30029296875, -9.0023193359375, -8.704345703125, -8.4063720703125, -8.1083984375, -7.8104248046875, -7.512451171875, -7.2144775390625, -6.91650390625, -6.6185302734375, -6.320556640625, -6.0225830078125, -5.724609375, -5.4266357421875, -5.128662109375, -4.8306884765625, -4.53271484375, -4.2347412109375, -3.936767578125, -3.6387939453125, -3.3408203125, -3.0428466796875, -2.744873046875, -2.4468994140625, -2.14892578125, -1.8509521484375, -1.552978515625, -1.2550048828125, -0.95703125, -0.6590576171875, -0.361083984375, -0.0631103515625, 0.23486328125, 0.5328369140625, 0.830810546875, 1.1287841796875, 1.4267578125, 1.7247314453125, 2.022705078125, 2.3206787109375, 2.61865234375, 2.9166259765625, 3.214599609375, 3.5125732421875, 3.810546875, 4.1085205078125, 4.406494140625, 4.7044677734375, 5.00244140625, 5.3004150390625, 5.598388671875, 5.8963623046875, 6.1943359375, 6.4923095703125, 6.790283203125, 7.0882568359375, 7.38623046875, 7.6842041015625, 7.982177734375, 8.2801513671875, 8.578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 7.0, 11.0, 26.0, 37.0, 74.0, 165.0, 450.0, 1255.0, 4599.0, 38132.0, 807274.0, 180112.0, 12705.0, 2430.0, 731.0, 270.0, 131.0, 59.0, 34.0, 17.0, 16.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.66796875, -2.5933837890625, -2.518798828125, -2.4442138671875, -2.36962890625, -2.2950439453125, -2.220458984375, -2.1458740234375, -2.0712890625, -1.9967041015625, -1.922119140625, -1.8475341796875, -1.77294921875, -1.6983642578125, -1.623779296875, -1.5491943359375, -1.474609375, -1.4000244140625, -1.325439453125, -1.2508544921875, -1.17626953125, -1.1016845703125, -1.027099609375, -0.9525146484375, -0.8779296875, -0.8033447265625, -0.728759765625, -0.6541748046875, -0.57958984375, -0.5050048828125, -0.430419921875, -0.3558349609375, -0.28125, -0.2066650390625, -0.132080078125, -0.0574951171875, 0.01708984375, 0.0916748046875, 0.166259765625, 0.2408447265625, 0.3154296875, 0.3900146484375, 0.464599609375, 0.5391845703125, 0.61376953125, 0.6883544921875, 0.762939453125, 0.8375244140625, 0.912109375, 0.9866943359375, 1.061279296875, 1.1358642578125, 1.21044921875, 1.2850341796875, 1.359619140625, 1.4342041015625, 1.5087890625, 1.5833740234375, 1.657958984375, 1.7325439453125, 1.80712890625, 1.8817138671875, 1.956298828125, 2.0308837890625, 2.10546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 5.0, 10.0, 8.0, 10.0, 18.0, 20.0, 31.0, 35.0, 72.0, 76.0, 171.0, 180.0, 100.0, 77.0, 41.0, 37.0, 18.0, 26.0, 12.0, 13.0, 10.0, 4.0, 4.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002396106719970703, -0.0002331472933292389, -0.00022668391466140747, -0.00022022053599357605, -0.00021375715732574463, -0.0002072937786579132, -0.0002008303999900818, -0.00019436702132225037, -0.00018790364265441895, -0.00018144026398658752, -0.0001749768853187561, -0.00016851350665092468, -0.00016205012798309326, -0.00015558674931526184, -0.00014912337064743042, -0.000142659991979599, -0.00013619661331176758, -0.00012973323464393616, -0.00012326985597610474, -0.00011680647730827332, -0.0001103430986404419, -0.00010387971997261047, -9.741634130477905e-05, -9.095296263694763e-05, -8.448958396911621e-05, -7.802620530128479e-05, -7.156282663345337e-05, -6.509944796562195e-05, -5.863606929779053e-05, -5.2172690629959106e-05, -4.5709311962127686e-05, -3.9245933294296265e-05, -3.2782554626464844e-05, -2.6319175958633423e-05, -1.9855797290802002e-05, -1.3392418622970581e-05, -6.92903995513916e-06, -4.6566128730773926e-07, 5.997717380523682e-06, 1.2461096048355103e-05, 1.8924474716186523e-05, 2.5387853384017944e-05, 3.1851232051849365e-05, 3.8314610719680786e-05, 4.477798938751221e-05, 5.124136805534363e-05, 5.770474672317505e-05, 6.416812539100647e-05, 7.063150405883789e-05, 7.709488272666931e-05, 8.355826139450073e-05, 9.002164006233215e-05, 9.648501873016357e-05, 0.000102948397397995, 0.00010941177606582642, 0.00011587515473365784, 0.00012233853340148926, 0.00012880191206932068, 0.0001352652907371521, 0.00014172866940498352, 0.00014819204807281494, 0.00015465542674064636, 0.00016111880540847778, 0.0001675821840763092, 0.00017404556274414062]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 11.0, 19.0, 47.0, 63.0, 124.0, 290.0, 618.0, 1822.0, 6602.0, 36178.0, 552598.0, 408055.0, 33188.0, 6027.0, 1727.0, 653.0, 282.0, 114.0, 47.0, 39.0, 24.0, 9.0, 4.0, 9.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4638671875, -1.3972625732421875, -1.330657958984375, -1.2640533447265625, -1.19744873046875, -1.1308441162109375, -1.064239501953125, -0.9976348876953125, -0.9310302734375, -0.8644256591796875, -0.797821044921875, -0.7312164306640625, -0.66461181640625, -0.5980072021484375, -0.531402587890625, -0.4647979736328125, -0.398193359375, -0.3315887451171875, -0.264984130859375, -0.1983795166015625, -0.13177490234375, -0.0651702880859375, 0.001434326171875, 0.0680389404296875, 0.1346435546875, 0.2012481689453125, 0.267852783203125, 0.3344573974609375, 0.40106201171875, 0.4676666259765625, 0.534271240234375, 0.6008758544921875, 0.66748046875, 0.7340850830078125, 0.800689697265625, 0.8672943115234375, 0.93389892578125, 1.0005035400390625, 1.067108154296875, 1.1337127685546875, 1.2003173828125, 1.2669219970703125, 1.333526611328125, 1.4001312255859375, 1.46673583984375, 1.5333404541015625, 1.599945068359375, 1.6665496826171875, 1.733154296875, 1.7997589111328125, 1.866363525390625, 1.9329681396484375, 1.99957275390625, 2.0661773681640625, 2.132781982421875, 2.1993865966796875, 2.2659912109375, 2.3325958251953125, 2.399200439453125, 2.4658050537109375, 2.53240966796875, 2.5990142822265625, 2.665618896484375, 2.7322235107421875, 2.798828125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 8.0, 9.0, 10.0, 17.0, 15.0, 22.0, 29.0, 31.0, 56.0, 65.0, 114.0, 218.0, 124.0, 57.0, 38.0, 43.0, 25.0, 17.0, 20.0, 14.0, 11.0, 10.0, 8.0, 7.0, 6.0, 4.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.85791015625, -0.8344192504882812, -0.8109283447265625, -0.7874374389648438, -0.763946533203125, -0.7404556274414062, -0.7169647216796875, -0.6934738159179688, -0.66998291015625, -0.6464920043945312, -0.6230010986328125, -0.5995101928710938, -0.576019287109375, -0.5525283813476562, -0.5290374755859375, -0.5055465698242188, -0.4820556640625, -0.45856475830078125, -0.4350738525390625, -0.41158294677734375, -0.388092041015625, -0.36460113525390625, -0.3411102294921875, -0.31761932373046875, -0.29412841796875, -0.27063751220703125, -0.2471466064453125, -0.22365570068359375, -0.200164794921875, -0.17667388916015625, -0.1531829833984375, -0.12969207763671875, -0.106201171875, -0.08271026611328125, -0.0592193603515625, -0.03572845458984375, -0.012237548828125, 0.01125335693359375, 0.0347442626953125, 0.05823516845703125, 0.08172607421875, 0.10521697998046875, 0.1287078857421875, 0.15219879150390625, 0.175689697265625, 0.19918060302734375, 0.2226715087890625, 0.24616241455078125, 0.2696533203125, 0.29314422607421875, 0.3166351318359375, 0.34012603759765625, 0.363616943359375, 0.38710784912109375, 0.4105987548828125, 0.43408966064453125, 0.45758056640625, 0.48107147216796875, 0.5045623779296875, 0.5280532836914062, 0.551544189453125, 0.5750350952148438, 0.5985260009765625, 0.6220169067382812, 0.6455078125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 9.0, 11.0, 14.0, 26.0, 50.0, 53.0, 64.0, 117.0, 131.0, 128.0, 115.0, 99.0, 62.0, 37.0, 23.0, 26.0, 15.0, 9.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.271665573120117, -14.835480690002441, -14.39929485321045, -13.963109970092773, -13.526924133300781, -13.090739250183105, -12.65455436706543, -12.218368530273438, -11.782182693481445, -11.34599781036377, -10.909811973571777, -10.473627090454102, -10.03744125366211, -9.601256370544434, -9.165071487426758, -8.728885650634766, -8.29270076751709, -7.856515407562256, -7.420330047607422, -6.984145164489746, -6.547959327697754, -6.111774444580078, -5.675589084625244, -5.23940372467041, -4.803218364715576, -4.367033004760742, -3.930847644805908, -3.4946625232696533, -3.0584771633148193, -2.6222918033599854, -2.1861066818237305, -1.7499213218688965, -1.313735008239746, -0.8775497078895569, -0.4413644075393677, -0.005179166793823242, 0.43100619316101074, 0.8671915531158447, 1.3033766746520996, 1.7395620346069336, 2.1757473945617676, 2.6119327545166016, 3.0481181144714355, 3.4843032360076904, 3.9204885959625244, 4.3566741943359375, 4.792859077453613, 5.229044437408447, 5.665229797363281, 6.101415157318115, 6.537600517272949, 6.973785400390625, 7.409971237182617, 7.846156120300293, 8.282341003417969, 8.718526840209961, 9.154712677001953, 9.590897560119629, 10.027083396911621, 10.463268280029297, 10.899454116821289, 11.335638999938965, 11.77182388305664, 12.208009719848633, 12.644194602966309]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 6.0, 5.0, 4.0, 5.0, 17.0, 17.0, 19.0, 13.0, 19.0, 27.0, 32.0, 35.0, 40.0, 51.0, 35.0, 43.0, 52.0, 45.0, 53.0, 43.0, 52.0, 43.0, 42.0, 27.0, 29.0, 31.0, 27.0, 35.0, 31.0, 36.0, 16.0, 17.0, 6.0, 9.0, 16.0, 6.0, 4.0, 3.0, 4.0, 4.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.999740600585938, -11.552684783935547, -11.105628967285156, -10.658573150634766, -10.211518287658691, -9.7644624710083, -9.31740665435791, -8.87035083770752, -8.423295021057129, -7.976239204406738, -7.529183864593506, -7.082128047943115, -6.635072231292725, -6.188016891479492, -5.740961074829102, -5.293905258178711, -4.8468499183654785, -4.399794101715088, -3.9527385234832764, -3.505682945251465, -3.058627128601074, -2.6115715503692627, -2.164515972137451, -1.7174601554870605, -1.270404577255249, -0.823348879814148, -0.37629324197769165, 0.07076239585876465, 0.5178180932998657, 0.9648737907409668, 1.4119293689727783, 1.858985185623169, 2.3060407638549805, 2.753096342086792, 3.2001521587371826, 3.647207736968994, 4.094263553619385, 4.541318893432617, 4.988374710083008, 5.435430526733398, 5.882486343383789, 6.32954216003418, 6.776597499847412, 7.223653316497803, 7.670709133148193, 8.117764472961426, 8.564820289611816, 9.011876106262207, 9.458930969238281, 9.905986785888672, 10.353042602539062, 10.800098419189453, 11.247153282165527, 11.694209098815918, 12.141264915466309, 12.5883207321167, 13.03537654876709, 13.48243236541748, 13.929488182067871, 14.376543045043945, 14.823598861694336, 15.270654678344727, 15.717710494995117, 16.164766311645508, 16.6118221282959]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 5.0, 7.0, 14.0, 15.0, 18.0, 19.0, 23.0, 32.0, 60.0, 85.0, 140.0, 214.0, 375.0, 734.0, 1512.0, 3488.0, 9937.0, 44049.0, 511502.0, 3170597.0, 396129.0, 39615.0, 9478.0, 3206.0, 1428.0, 689.0, 344.0, 192.0, 97.0, 65.0, 66.0, 30.0, 25.0, 23.0, 18.0, 17.0, 8.0, 7.0, 5.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.89453125, -6.65228271484375, -6.4100341796875, -6.16778564453125, -5.925537109375, -5.68328857421875, -5.4410400390625, -5.19879150390625, -4.95654296875, -4.71429443359375, -4.4720458984375, -4.22979736328125, -3.987548828125, -3.74530029296875, -3.5030517578125, -3.26080322265625, -3.0185546875, -2.77630615234375, -2.5340576171875, -2.29180908203125, -2.049560546875, -1.80731201171875, -1.5650634765625, -1.32281494140625, -1.08056640625, -0.83831787109375, -0.5960693359375, -0.35382080078125, -0.111572265625, 0.13067626953125, 0.3729248046875, 0.61517333984375, 0.857421875, 1.09967041015625, 1.3419189453125, 1.58416748046875, 1.826416015625, 2.06866455078125, 2.3109130859375, 2.55316162109375, 2.79541015625, 3.03765869140625, 3.2799072265625, 3.52215576171875, 3.764404296875, 4.00665283203125, 4.2489013671875, 4.49114990234375, 4.7333984375, 4.97564697265625, 5.2178955078125, 5.46014404296875, 5.702392578125, 5.94464111328125, 6.1868896484375, 6.42913818359375, 6.67138671875, 6.91363525390625, 7.1558837890625, 7.39813232421875, 7.640380859375, 7.88262939453125, 8.1248779296875, 8.36712646484375, 8.609375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 7.0, 0.0, 7.0, 9.0, 5.0, 9.0, 10.0, 11.0, 18.0, 22.0, 22.0, 27.0, 40.0, 39.0, 34.0, 68.0, 58.0, 55.0, 55.0, 52.0, 51.0, 49.0, 58.0, 43.0, 33.0, 41.0, 36.0, 20.0, 25.0, 24.0, 19.0, 9.0, 12.0, 11.0, 6.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-5.28515625, -5.14691162109375, -5.0086669921875, -4.87042236328125, -4.732177734375, -4.59393310546875, -4.4556884765625, -4.31744384765625, -4.17919921875, -4.04095458984375, -3.9027099609375, -3.76446533203125, -3.626220703125, -3.48797607421875, -3.3497314453125, -3.21148681640625, -3.0732421875, -2.93499755859375, -2.7967529296875, -2.65850830078125, -2.520263671875, -2.38201904296875, -2.2437744140625, -2.10552978515625, -1.96728515625, -1.82904052734375, -1.6907958984375, -1.55255126953125, -1.414306640625, -1.27606201171875, -1.1378173828125, -0.99957275390625, -0.861328125, -0.72308349609375, -0.5848388671875, -0.44659423828125, -0.308349609375, -0.17010498046875, -0.0318603515625, 0.10638427734375, 0.24462890625, 0.38287353515625, 0.5211181640625, 0.65936279296875, 0.797607421875, 0.93585205078125, 1.0740966796875, 1.21234130859375, 1.3505859375, 1.48883056640625, 1.6270751953125, 1.76531982421875, 1.903564453125, 2.04180908203125, 2.1800537109375, 2.31829833984375, 2.45654296875, 2.59478759765625, 2.7330322265625, 2.87127685546875, 3.009521484375, 3.14776611328125, 3.2860107421875, 3.42425537109375, 3.5625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 3.0, 4.0, 7.0, 5.0, 11.0, 16.0, 19.0, 34.0, 39.0, 81.0, 124.0, 267.0, 607.0, 1794.0, 7210.0, 54861.0, 2579635.0, 1499699.0, 41487.0, 5807.0, 1455.0, 522.0, 261.0, 105.0, 79.0, 42.0, 32.0, 20.0, 17.0, 9.0, 8.0, 2.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.3828125, -12.047607421875, -11.71240234375, -11.377197265625, -11.0419921875, -10.706787109375, -10.37158203125, -10.036376953125, -9.701171875, -9.365966796875, -9.03076171875, -8.695556640625, -8.3603515625, -8.025146484375, -7.68994140625, -7.354736328125, -7.01953125, -6.684326171875, -6.34912109375, -6.013916015625, -5.6787109375, -5.343505859375, -5.00830078125, -4.673095703125, -4.337890625, -4.002685546875, -3.66748046875, -3.332275390625, -2.9970703125, -2.661865234375, -2.32666015625, -1.991455078125, -1.65625, -1.321044921875, -0.98583984375, -0.650634765625, -0.3154296875, 0.019775390625, 0.35498046875, 0.690185546875, 1.025390625, 1.360595703125, 1.69580078125, 2.031005859375, 2.3662109375, 2.701416015625, 3.03662109375, 3.371826171875, 3.70703125, 4.042236328125, 4.37744140625, 4.712646484375, 5.0478515625, 5.383056640625, 5.71826171875, 6.053466796875, 6.388671875, 6.723876953125, 7.05908203125, 7.394287109375, 7.7294921875, 8.064697265625, 8.39990234375, 8.735107421875, 9.0703125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 10.0, 9.0, 10.0, 10.0, 21.0, 18.0, 43.0, 55.0, 73.0, 84.0, 125.0, 170.0, 277.0, 434.0, 544.0, 576.0, 451.0, 345.0, 232.0, 170.0, 119.0, 69.0, 63.0, 41.0, 26.0, 17.0, 14.0, 11.0, 11.0, 14.0, 6.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.572265625, -1.516815185546875, -1.46136474609375, -1.405914306640625, -1.3504638671875, -1.295013427734375, -1.23956298828125, -1.184112548828125, -1.128662109375, -1.073211669921875, -1.01776123046875, -0.962310791015625, -0.9068603515625, -0.851409912109375, -0.79595947265625, -0.740509033203125, -0.68505859375, -0.629608154296875, -0.57415771484375, -0.518707275390625, -0.4632568359375, -0.407806396484375, -0.35235595703125, -0.296905517578125, -0.241455078125, -0.186004638671875, -0.13055419921875, -0.075103759765625, -0.0196533203125, 0.035797119140625, 0.09124755859375, 0.146697998046875, 0.2021484375, 0.257598876953125, 0.31304931640625, 0.368499755859375, 0.4239501953125, 0.479400634765625, 0.53485107421875, 0.590301513671875, 0.645751953125, 0.701202392578125, 0.75665283203125, 0.812103271484375, 0.8675537109375, 0.923004150390625, 0.97845458984375, 1.033905029296875, 1.08935546875, 1.144805908203125, 1.20025634765625, 1.255706787109375, 1.3111572265625, 1.366607666015625, 1.42205810546875, 1.477508544921875, 1.532958984375, 1.588409423828125, 1.64385986328125, 1.699310302734375, 1.7547607421875, 1.810211181640625, 1.86566162109375, 1.921112060546875, 1.9765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 30.0, 64.0, 80.0, 123.0, 160.0, 140.0, 149.0, 105.0, 57.0, 37.0, 23.0, 11.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.593779563903809, -15.174943923950195, -14.756108283996582, -14.337272644042969, -13.918437004089355, -13.499601364135742, -13.080765724182129, -12.661930084228516, -12.243094444274902, -11.824258804321289, -11.405423164367676, -10.986587524414062, -10.56775188446045, -10.148916244506836, -9.730080604553223, -9.31124496459961, -8.892409324645996, -8.473573684692383, -8.05473804473877, -7.635902404785156, -7.217066764831543, -6.79823112487793, -6.379395484924316, -5.960559844970703, -5.54172420501709, -5.122888565063477, -4.704052925109863, -4.28521728515625, -3.8663816452026367, -3.4475460052490234, -3.02871036529541, -2.609874725341797, -2.191038131713867, -1.772202491760254, -1.3533668518066406, -0.9345312118530273, -0.5156955718994141, -0.09685993194580078, 0.3219757080078125, 0.7408113479614258, 1.159646987915039, 1.5784826278686523, 1.9973182678222656, 2.416153907775879, 2.834989547729492, 3.2538251876831055, 3.6726608276367188, 4.091496467590332, 4.510332107543945, 4.929167747497559, 5.348003387451172, 5.766839027404785, 6.185674667358398, 6.604510307312012, 7.023345947265625, 7.442181587219238, 7.861017227172852, 8.279852867126465, 8.698688507080078, 9.117524147033691, 9.536359786987305, 9.955195426940918, 10.374031066894531, 10.792866706848145, 11.211702346801758]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 13.0, 9.0, 14.0, 10.0, 18.0, 16.0, 28.0, 28.0, 31.0, 32.0, 38.0, 46.0, 48.0, 42.0, 44.0, 49.0, 46.0, 41.0, 50.0, 42.0, 52.0, 41.0, 35.0, 42.0, 32.0, 28.0, 22.0, 18.0, 15.0, 14.0, 19.0, 5.0, 8.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.917880535125732, -5.757607936859131, -5.597335338592529, -5.437063217163086, -5.276790618896484, -5.116518020629883, -4.956245422363281, -4.79597282409668, -4.635700225830078, -4.475427627563477, -4.315155029296875, -4.154882907867432, -3.99461030960083, -3.8343377113342285, -3.674065113067627, -3.5137925148010254, -3.353520393371582, -3.1932477951049805, -3.032975435256958, -2.8727028369903564, -2.712430477142334, -2.5521578788757324, -2.391885280609131, -2.2316126823425293, -2.071340322494507, -1.9110678434371948, -1.7507953643798828, -1.5905227661132812, -1.4302502870559692, -1.2699778079986572, -1.1097052097320557, -0.9494327306747437, -0.7891602516174316, -0.6288877725601196, -0.46861523389816284, -0.30834272503852844, -0.14807021617889404, 0.012202262878417969, 0.17247480154037476, 0.33274734020233154, 0.49301981925964355, 0.6532922983169556, 0.8135648369789124, 0.9738373756408691, 1.1341098546981812, 1.2943823337554932, 1.4546549320220947, 1.6149274110794067, 1.7751998901367188, 1.9354723691940308, 2.0957448482513428, 2.2560174465179443, 2.416289806365967, 2.5765624046325684, 2.73683500289917, 2.8971076011657715, 3.057379961013794, 3.2176525592803955, 3.377924919128418, 3.5381975173950195, 3.698470115661621, 3.8587424755096436, 4.019014835357666, 4.179287433624268, 4.339560031890869]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 9.0, 9.0, 15.0, 25.0, 43.0, 61.0, 106.0, 149.0, 287.0, 481.0, 876.0, 1628.0, 3129.0, 7250.0, 19942.0, 87792.0, 553265.0, 304023.0, 45966.0, 12812.0, 5183.0, 2478.0, 1318.0, 696.0, 411.0, 246.0, 129.0, 84.0, 38.0, 43.0, 19.0, 10.0, 7.0, 9.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-3.072265625, -2.995086669921875, -2.91790771484375, -2.840728759765625, -2.7635498046875, -2.686370849609375, -2.60919189453125, -2.532012939453125, -2.454833984375, -2.377655029296875, -2.30047607421875, -2.223297119140625, -2.1461181640625, -2.068939208984375, -1.99176025390625, -1.914581298828125, -1.83740234375, -1.760223388671875, -1.68304443359375, -1.605865478515625, -1.5286865234375, -1.451507568359375, -1.37432861328125, -1.297149658203125, -1.219970703125, -1.142791748046875, -1.06561279296875, -0.988433837890625, -0.9112548828125, -0.834075927734375, -0.75689697265625, -0.679718017578125, -0.6025390625, -0.525360107421875, -0.44818115234375, -0.371002197265625, -0.2938232421875, -0.216644287109375, -0.13946533203125, -0.062286376953125, 0.014892578125, 0.092071533203125, 0.16925048828125, 0.246429443359375, 0.3236083984375, 0.400787353515625, 0.47796630859375, 0.555145263671875, 0.63232421875, 0.709503173828125, 0.78668212890625, 0.863861083984375, 0.9410400390625, 1.018218994140625, 1.09539794921875, 1.172576904296875, 1.249755859375, 1.326934814453125, 1.40411376953125, 1.481292724609375, 1.5584716796875, 1.635650634765625, 1.71282958984375, 1.790008544921875, 1.8671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 4.0, 4.0, 11.0, 7.0, 15.0, 12.0, 19.0, 36.0, 29.0, 30.0, 30.0, 44.0, 54.0, 47.0, 45.0, 46.0, 62.0, 39.0, 46.0, 63.0, 44.0, 43.0, 56.0, 42.0, 25.0, 25.0, 25.0, 17.0, 18.0, 12.0, 12.0, 13.0, 8.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.8125, -4.6890869140625, -4.565673828125, -4.4422607421875, -4.31884765625, -4.1954345703125, -4.072021484375, -3.9486083984375, -3.8251953125, -3.7017822265625, -3.578369140625, -3.4549560546875, -3.33154296875, -3.2081298828125, -3.084716796875, -2.9613037109375, -2.837890625, -2.7144775390625, -2.591064453125, -2.4676513671875, -2.34423828125, -2.2208251953125, -2.097412109375, -1.9739990234375, -1.8505859375, -1.7271728515625, -1.603759765625, -1.4803466796875, -1.35693359375, -1.2335205078125, -1.110107421875, -0.9866943359375, -0.86328125, -0.7398681640625, -0.616455078125, -0.4930419921875, -0.36962890625, -0.2462158203125, -0.122802734375, 0.0006103515625, 0.1240234375, 0.2474365234375, 0.370849609375, 0.4942626953125, 0.61767578125, 0.7410888671875, 0.864501953125, 0.9879150390625, 1.111328125, 1.2347412109375, 1.358154296875, 1.4815673828125, 1.60498046875, 1.7283935546875, 1.851806640625, 1.9752197265625, 2.0986328125, 2.2220458984375, 2.345458984375, 2.4688720703125, 2.59228515625, 2.7156982421875, 2.839111328125, 2.9625244140625, 3.0859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 7.0, 6.0, 12.0, 20.0, 13.0, 23.0, 27.0, 37.0, 78.0, 152.0, 301.0, 602.0, 1298.0, 3292.0, 9940.0, 51734.0, 598591.0, 339676.0, 30976.0, 7110.0, 2531.0, 1069.0, 501.0, 224.0, 122.0, 72.0, 42.0, 29.0, 17.0, 12.0, 15.0, 6.0, 11.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.505859375, -2.41595458984375, -2.3260498046875, -2.23614501953125, -2.146240234375, -2.05633544921875, -1.9664306640625, -1.87652587890625, -1.78662109375, -1.69671630859375, -1.6068115234375, -1.51690673828125, -1.427001953125, -1.33709716796875, -1.2471923828125, -1.15728759765625, -1.0673828125, -0.97747802734375, -0.8875732421875, -0.79766845703125, -0.707763671875, -0.61785888671875, -0.5279541015625, -0.43804931640625, -0.34814453125, -0.25823974609375, -0.1683349609375, -0.07843017578125, 0.011474609375, 0.10137939453125, 0.1912841796875, 0.28118896484375, 0.37109375, 0.46099853515625, 0.5509033203125, 0.64080810546875, 0.730712890625, 0.82061767578125, 0.9105224609375, 1.00042724609375, 1.09033203125, 1.18023681640625, 1.2701416015625, 1.36004638671875, 1.449951171875, 1.53985595703125, 1.6297607421875, 1.71966552734375, 1.8095703125, 1.89947509765625, 1.9893798828125, 2.07928466796875, 2.169189453125, 2.25909423828125, 2.3489990234375, 2.43890380859375, 2.52880859375, 2.61871337890625, 2.7086181640625, 2.79852294921875, 2.888427734375, 2.97833251953125, 3.0682373046875, 3.15814208984375, 3.248046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 13.0, 10.0, 13.0, 14.0, 11.0, 23.0, 39.0, 21.0, 31.0, 36.0, 35.0, 41.0, 40.0, 45.0, 59.0, 47.0, 54.0, 52.0, 55.0, 44.0, 50.0, 39.0, 35.0, 22.0, 29.0, 20.0, 17.0, 19.0, 19.0, 16.0, 7.0, 13.0, 5.0, 8.0, 6.0, 4.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.6953125, -9.42193603515625, -9.1485595703125, -8.87518310546875, -8.601806640625, -8.32843017578125, -8.0550537109375, -7.78167724609375, -7.50830078125, -7.23492431640625, -6.9615478515625, -6.68817138671875, -6.414794921875, -6.14141845703125, -5.8680419921875, -5.59466552734375, -5.3212890625, -5.04791259765625, -4.7745361328125, -4.50115966796875, -4.227783203125, -3.95440673828125, -3.6810302734375, -3.40765380859375, -3.13427734375, -2.86090087890625, -2.5875244140625, -2.31414794921875, -2.040771484375, -1.76739501953125, -1.4940185546875, -1.22064208984375, -0.947265625, -0.67388916015625, -0.4005126953125, -0.12713623046875, 0.146240234375, 0.41961669921875, 0.6929931640625, 0.96636962890625, 1.23974609375, 1.51312255859375, 1.7864990234375, 2.05987548828125, 2.333251953125, 2.60662841796875, 2.8800048828125, 3.15338134765625, 3.4267578125, 3.70013427734375, 3.9735107421875, 4.24688720703125, 4.520263671875, 4.79364013671875, 5.0670166015625, 5.34039306640625, 5.61376953125, 5.88714599609375, 6.1605224609375, 6.43389892578125, 6.707275390625, 6.98065185546875, 7.2540283203125, 7.52740478515625, 7.80078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 7.0, 5.0, 10.0, 8.0, 16.0, 20.0, 38.0, 54.0, 82.0, 161.0, 250.0, 431.0, 776.0, 1545.0, 3437.0, 8976.0, 35313.0, 448002.0, 494638.0, 38388.0, 9319.0, 3613.0, 1615.0, 747.0, 465.0, 244.0, 132.0, 74.0, 62.0, 35.0, 30.0, 17.0, 12.0, 9.0, 6.0, 4.0, 8.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0654296875, -1.0260009765625, -0.986572265625, -0.9471435546875, -0.90771484375, -0.8682861328125, -0.828857421875, -0.7894287109375, -0.75, -0.7105712890625, -0.671142578125, -0.6317138671875, -0.59228515625, -0.5528564453125, -0.513427734375, -0.4739990234375, -0.4345703125, -0.3951416015625, -0.355712890625, -0.3162841796875, -0.27685546875, -0.2374267578125, -0.197998046875, -0.1585693359375, -0.119140625, -0.0797119140625, -0.040283203125, -0.0008544921875, 0.03857421875, 0.0780029296875, 0.117431640625, 0.1568603515625, 0.1962890625, 0.2357177734375, 0.275146484375, 0.3145751953125, 0.35400390625, 0.3934326171875, 0.432861328125, 0.4722900390625, 0.51171875, 0.5511474609375, 0.590576171875, 0.6300048828125, 0.66943359375, 0.7088623046875, 0.748291015625, 0.7877197265625, 0.8271484375, 0.8665771484375, 0.906005859375, 0.9454345703125, 0.98486328125, 1.0242919921875, 1.063720703125, 1.1031494140625, 1.142578125, 1.1820068359375, 1.221435546875, 1.2608642578125, 1.30029296875, 1.3397216796875, 1.379150390625, 1.4185791015625, 1.4580078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 7.0, 3.0, 4.0, 14.0, 11.0, 20.0, 32.0, 48.0, 63.0, 107.0, 136.0, 137.0, 136.0, 86.0, 61.0, 41.0, 25.0, 23.0, 11.0, 5.0, 7.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0], "bins": [-0.0004639625549316406, -0.00045040249824523926, -0.0004368424415588379, -0.0004232823848724365, -0.00040972232818603516, -0.0003961622714996338, -0.0003826022148132324, -0.00036904215812683105, -0.0003554821014404297, -0.0003419220447540283, -0.00032836198806762695, -0.0003148019313812256, -0.0003012418746948242, -0.00028768181800842285, -0.0002741217613220215, -0.0002605617046356201, -0.00024700164794921875, -0.00023344159126281738, -0.00021988153457641602, -0.00020632147789001465, -0.00019276142120361328, -0.00017920136451721191, -0.00016564130783081055, -0.00015208125114440918, -0.0001385211944580078, -0.00012496113777160645, -0.00011140108108520508, -9.784102439880371e-05, -8.428096771240234e-05, -7.072091102600098e-05, -5.716085433959961e-05, -4.360079765319824e-05, -3.0040740966796875e-05, -1.6480684280395508e-05, -2.9206275939941406e-06, 1.0639429092407227e-05, 2.4199485778808594e-05, 3.775954246520996e-05, 5.131959915161133e-05, 6.48796558380127e-05, 7.843971252441406e-05, 9.199976921081543e-05, 0.0001055598258972168, 0.00011911988258361816, 0.00013267993927001953, 0.0001462399959564209, 0.00015980005264282227, 0.00017336010932922363, 0.000186920166015625, 0.00020048022270202637, 0.00021404027938842773, 0.0002276003360748291, 0.00024116039276123047, 0.00025472044944763184, 0.0002682805061340332, 0.00028184056282043457, 0.00029540061950683594, 0.0003089606761932373, 0.00032252073287963867, 0.00033608078956604004, 0.0003496408462524414, 0.0003632009029388428, 0.00037676095962524414, 0.0003903210163116455, 0.0004038810729980469]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 5.0, 10.0, 9.0, 39.0, 33.0, 55.0, 91.0, 181.0, 392.0, 702.0, 1486.0, 3435.0, 9392.0, 42333.0, 538857.0, 404805.0, 32765.0, 8101.0, 3014.0, 1409.0, 675.0, 324.0, 174.0, 109.0, 47.0, 24.0, 21.0, 16.0, 11.0, 8.0, 7.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.462890625, -1.4184722900390625, -1.374053955078125, -1.3296356201171875, -1.28521728515625, -1.2407989501953125, -1.196380615234375, -1.1519622802734375, -1.1075439453125, -1.0631256103515625, -1.018707275390625, -0.9742889404296875, -0.92987060546875, -0.8854522705078125, -0.841033935546875, -0.7966156005859375, -0.752197265625, -0.7077789306640625, -0.663360595703125, -0.6189422607421875, -0.57452392578125, -0.5301055908203125, -0.485687255859375, -0.4412689208984375, -0.3968505859375, -0.3524322509765625, -0.308013916015625, -0.2635955810546875, -0.21917724609375, -0.1747589111328125, -0.130340576171875, -0.0859222412109375, -0.04150390625, 0.0029144287109375, 0.047332763671875, 0.0917510986328125, 0.13616943359375, 0.1805877685546875, 0.225006103515625, 0.2694244384765625, 0.3138427734375, 0.3582611083984375, 0.402679443359375, 0.4470977783203125, 0.49151611328125, 0.5359344482421875, 0.580352783203125, 0.6247711181640625, 0.669189453125, 0.7136077880859375, 0.758026123046875, 0.8024444580078125, 0.84686279296875, 0.8912811279296875, 0.935699462890625, 0.9801177978515625, 1.0245361328125, 1.0689544677734375, 1.113372802734375, 1.1577911376953125, 1.20220947265625, 1.2466278076171875, 1.291046142578125, 1.3354644775390625, 1.3798828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 5.0, 6.0, 7.0, 5.0, 7.0, 11.0, 24.0, 26.0, 35.0, 74.0, 123.0, 145.0, 179.0, 124.0, 76.0, 54.0, 26.0, 11.0, 11.0, 15.0, 9.0, 7.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33056640625, -0.31682586669921875, -0.3030853271484375, -0.28934478759765625, -0.275604248046875, -0.26186370849609375, -0.2481231689453125, -0.23438262939453125, -0.22064208984375, -0.20690155029296875, -0.1931610107421875, -0.17942047119140625, -0.165679931640625, -0.15193939208984375, -0.1381988525390625, -0.12445831298828125, -0.1107177734375, -0.09697723388671875, -0.0832366943359375, -0.06949615478515625, -0.055755615234375, -0.04201507568359375, -0.0282745361328125, -0.01453399658203125, -0.00079345703125, 0.01294708251953125, 0.0266876220703125, 0.04042816162109375, 0.054168701171875, 0.06790924072265625, 0.0816497802734375, 0.09539031982421875, 0.109130859375, 0.12287139892578125, 0.1366119384765625, 0.15035247802734375, 0.164093017578125, 0.17783355712890625, 0.1915740966796875, 0.20531463623046875, 0.21905517578125, 0.23279571533203125, 0.2465362548828125, 0.26027679443359375, 0.274017333984375, 0.28775787353515625, 0.3014984130859375, 0.31523895263671875, 0.3289794921875, 0.34272003173828125, 0.3564605712890625, 0.37020111083984375, 0.383941650390625, 0.39768218994140625, 0.4114227294921875, 0.42516326904296875, 0.43890380859375, 0.45264434814453125, 0.4663848876953125, 0.48012542724609375, 0.493865966796875, 0.5076065063476562, 0.5213470458984375, 0.5350875854492188, 0.548828125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 6.0, 7.0, 13.0, 19.0, 41.0, 58.0, 90.0, 97.0, 111.0, 116.0, 121.0, 77.0, 80.0, 48.0, 43.0, 29.0, 16.0, 10.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.447192668914795, -7.242934226989746, -7.038675308227539, -6.834416389465332, -6.630157947540283, -6.425899505615234, -6.221640586853027, -6.01738166809082, -5.8131232261657715, -5.608864784240723, -5.404605865478516, -5.200346946716309, -4.99608850479126, -4.791830062866211, -4.587571144104004, -4.383312225341797, -4.179053783416748, -3.97479510307312, -3.770536422729492, -3.5662777423858643, -3.3620190620422363, -3.1577603816986084, -2.9535017013549805, -2.7492430210113525, -2.5449843406677246, -2.3407256603240967, -2.1364669799804688, -1.9322082996368408, -1.727949619293213, -1.523690938949585, -1.319432258605957, -1.115173578262329, -0.9109153747558594, -0.7066566944122314, -0.5023980140686035, -0.2981393337249756, -0.09388065338134766, 0.11037802696228027, 0.3146367073059082, 0.5188953876495361, 0.7231540679931641, 0.927412748336792, 1.13167142868042, 1.3359301090240479, 1.5401887893676758, 1.7444474697113037, 1.9487061500549316, 2.1529648303985596, 2.3572235107421875, 2.5614821910858154, 2.7657408714294434, 2.9699995517730713, 3.174258232116699, 3.378516912460327, 3.582775592803955, 3.787034273147583, 3.991292953491211, 4.195551872253418, 4.399810314178467, 4.604068756103516, 4.808327674865723, 5.01258659362793, 5.2168450355529785, 5.421103477478027, 5.625362396240234]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 2.0, 5.0, 8.0, 11.0, 12.0, 21.0, 19.0, 23.0, 29.0, 41.0, 40.0, 43.0, 44.0, 55.0, 59.0, 51.0, 56.0, 40.0, 57.0, 52.0, 56.0, 45.0, 49.0, 36.0, 23.0, 28.0, 20.0, 17.0, 17.0, 15.0, 6.0, 10.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.80606746673584, -4.6785712242126465, -4.551074504852295, -4.423578262329102, -4.29608154296875, -4.168585300445557, -4.041089057922363, -3.9135923385620117, -3.7860960960388184, -3.658599615097046, -3.5311031341552734, -3.40360689163208, -3.2761104106903076, -3.148613929748535, -3.0211174488067627, -2.8936209678649902, -2.7661244869232178, -2.6386280059814453, -2.511131525039673, -2.3836350440979004, -2.256138801574707, -2.1286423206329346, -2.001145839691162, -1.8736493587493896, -1.7461529970169067, -1.6186565160751343, -1.4911601543426514, -1.363663673400879, -1.2361671924591064, -1.1086708307266235, -0.9811743497848511, -0.8536779284477234, -0.7261812686920166, -0.5986848473548889, -0.47118839621543884, -0.34369194507598877, -0.21619552373886108, -0.0886991024017334, 0.03879737854003906, 0.16629379987716675, 0.29379022121429443, 0.4212866425514221, 0.5487830638885498, 0.6762795448303223, 0.80377596616745, 0.9312723875045776, 1.05876886844635, 1.186265230178833, 1.3137617111206055, 1.441258192062378, 1.5687545537948608, 1.6962510347366333, 1.8237473964691162, 1.9512438774108887, 2.078740358352661, 2.2062368392944336, 2.333733081817627, 2.4612295627593994, 2.588726043701172, 2.7162222862243652, 2.8437187671661377, 2.97121524810791, 3.0987117290496826, 3.226208209991455, 3.3537046909332275]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 9.0, 6.0, 13.0, 12.0, 29.0, 30.0, 74.0, 112.0, 167.0, 367.0, 776.0, 1688.0, 4113.0, 12607.0, 50239.0, 331474.0, 543146.0, 76809.0, 17518.0, 5442.0, 1991.0, 892.0, 456.0, 248.0, 133.0, 74.0, 37.0, 38.0, 17.0, 12.0, 8.0, 4.0, 3.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.29296875, -6.11383056640625, -5.9346923828125, -5.75555419921875, -5.576416015625, -5.39727783203125, -5.2181396484375, -5.03900146484375, -4.85986328125, -4.68072509765625, -4.5015869140625, -4.32244873046875, -4.143310546875, -3.96417236328125, -3.7850341796875, -3.60589599609375, -3.4267578125, -3.24761962890625, -3.0684814453125, -2.88934326171875, -2.710205078125, -2.53106689453125, -2.3519287109375, -2.17279052734375, -1.99365234375, -1.81451416015625, -1.6353759765625, -1.45623779296875, -1.277099609375, -1.09796142578125, -0.9188232421875, -0.73968505859375, -0.560546875, -0.38140869140625, -0.2022705078125, -0.02313232421875, 0.156005859375, 0.33514404296875, 0.5142822265625, 0.69342041015625, 0.87255859375, 1.05169677734375, 1.2308349609375, 1.40997314453125, 1.589111328125, 1.76824951171875, 1.9473876953125, 2.12652587890625, 2.3056640625, 2.48480224609375, 2.6639404296875, 2.84307861328125, 3.022216796875, 3.20135498046875, 3.3804931640625, 3.55963134765625, 3.73876953125, 3.91790771484375, 4.0970458984375, 4.27618408203125, 4.455322265625, 4.63446044921875, 4.8135986328125, 4.99273681640625, 5.171875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 5.0, 7.0, 2.0, 7.0, 9.0, 15.0, 11.0, 22.0, 25.0, 39.0, 32.0, 55.0, 49.0, 53.0, 54.0, 60.0, 68.0, 59.0, 67.0, 51.0, 60.0, 46.0, 46.0, 29.0, 24.0, 32.0, 24.0, 21.0, 12.0, 11.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.015625, -8.748779296875, -8.48193359375, -8.215087890625, -7.9482421875, -7.681396484375, -7.41455078125, -7.147705078125, -6.880859375, -6.614013671875, -6.34716796875, -6.080322265625, -5.8134765625, -5.546630859375, -5.27978515625, -5.012939453125, -4.74609375, -4.479248046875, -4.21240234375, -3.945556640625, -3.6787109375, -3.411865234375, -3.14501953125, -2.878173828125, -2.611328125, -2.344482421875, -2.07763671875, -1.810791015625, -1.5439453125, -1.277099609375, -1.01025390625, -0.743408203125, -0.4765625, -0.209716796875, 0.05712890625, 0.323974609375, 0.5908203125, 0.857666015625, 1.12451171875, 1.391357421875, 1.658203125, 1.925048828125, 2.19189453125, 2.458740234375, 2.7255859375, 2.992431640625, 3.25927734375, 3.526123046875, 3.79296875, 4.059814453125, 4.32666015625, 4.593505859375, 4.8603515625, 5.127197265625, 5.39404296875, 5.660888671875, 5.927734375, 6.194580078125, 6.46142578125, 6.728271484375, 6.9951171875, 7.261962890625, 7.52880859375, 7.795654296875, 8.0625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 0.0, 5.0, 2.0, 4.0, 5.0, 8.0, 8.0, 12.0, 17.0, 14.0, 23.0, 20.0, 31.0, 40.0, 74.0, 102.0, 159.0, 361.0, 1497.0, 19697.0, 932538.0, 89405.0, 3276.0, 589.0, 217.0, 134.0, 79.0, 54.0, 39.0, 30.0, 19.0, 22.0, 16.0, 12.0, 10.0, 2.0, 10.0, 4.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.9765625, -13.4893798828125, -13.002197265625, -12.5150146484375, -12.02783203125, -11.5406494140625, -11.053466796875, -10.5662841796875, -10.0791015625, -9.5919189453125, -9.104736328125, -8.6175537109375, -8.13037109375, -7.6431884765625, -7.156005859375, -6.6688232421875, -6.181640625, -5.6944580078125, -5.207275390625, -4.7200927734375, -4.23291015625, -3.7457275390625, -3.258544921875, -2.7713623046875, -2.2841796875, -1.7969970703125, -1.309814453125, -0.8226318359375, -0.33544921875, 0.1517333984375, 0.638916015625, 1.1260986328125, 1.61328125, 2.1004638671875, 2.587646484375, 3.0748291015625, 3.56201171875, 4.0491943359375, 4.536376953125, 5.0235595703125, 5.5107421875, 5.9979248046875, 6.485107421875, 6.9722900390625, 7.45947265625, 7.9466552734375, 8.433837890625, 8.9210205078125, 9.408203125, 9.8953857421875, 10.382568359375, 10.8697509765625, 11.35693359375, 11.8441162109375, 12.331298828125, 12.8184814453125, 13.3056640625, 13.7928466796875, 14.280029296875, 14.7672119140625, 15.25439453125, 15.7415771484375, 16.228759765625, 16.7159423828125, 17.203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 2.0, 9.0, 12.0, 10.0, 17.0, 20.0, 18.0, 21.0, 24.0, 33.0, 27.0, 47.0, 47.0, 55.0, 53.0, 52.0, 70.0, 65.0, 41.0, 59.0, 46.0, 39.0, 32.0, 37.0, 33.0, 24.0, 17.0, 17.0, 11.0, 12.0, 8.0, 9.0, 7.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-9.0703125, -8.763916015625, -8.45751953125, -8.151123046875, -7.8447265625, -7.538330078125, -7.23193359375, -6.925537109375, -6.619140625, -6.312744140625, -6.00634765625, -5.699951171875, -5.3935546875, -5.087158203125, -4.78076171875, -4.474365234375, -4.16796875, -3.861572265625, -3.55517578125, -3.248779296875, -2.9423828125, -2.635986328125, -2.32958984375, -2.023193359375, -1.716796875, -1.410400390625, -1.10400390625, -0.797607421875, -0.4912109375, -0.184814453125, 0.12158203125, 0.427978515625, 0.734375, 1.040771484375, 1.34716796875, 1.653564453125, 1.9599609375, 2.266357421875, 2.57275390625, 2.879150390625, 3.185546875, 3.491943359375, 3.79833984375, 4.104736328125, 4.4111328125, 4.717529296875, 5.02392578125, 5.330322265625, 5.63671875, 5.943115234375, 6.24951171875, 6.555908203125, 6.8623046875, 7.168701171875, 7.47509765625, 7.781494140625, 8.087890625, 8.394287109375, 8.70068359375, 9.007080078125, 9.3134765625, 9.619873046875, 9.92626953125, 10.232666015625, 10.5390625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 12.0, 11.0, 22.0, 35.0, 70.0, 165.0, 441.0, 1575.0, 10968.0, 262884.0, 740125.0, 28381.0, 2753.0, 653.0, 220.0, 101.0, 46.0, 26.0, 15.0, 16.0, 12.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.1484375, -3.056304931640625, -2.96417236328125, -2.872039794921875, -2.7799072265625, -2.687774658203125, -2.59564208984375, -2.503509521484375, -2.411376953125, -2.319244384765625, -2.22711181640625, -2.134979248046875, -2.0428466796875, -1.950714111328125, -1.85858154296875, -1.766448974609375, -1.67431640625, -1.582183837890625, -1.49005126953125, -1.397918701171875, -1.3057861328125, -1.213653564453125, -1.12152099609375, -1.029388427734375, -0.937255859375, -0.845123291015625, -0.75299072265625, -0.660858154296875, -0.5687255859375, -0.476593017578125, -0.38446044921875, -0.292327880859375, -0.2001953125, -0.108062744140625, -0.01593017578125, 0.076202392578125, 0.1683349609375, 0.260467529296875, 0.35260009765625, 0.444732666015625, 0.536865234375, 0.628997802734375, 0.72113037109375, 0.813262939453125, 0.9053955078125, 0.997528076171875, 1.08966064453125, 1.181793212890625, 1.27392578125, 1.366058349609375, 1.45819091796875, 1.550323486328125, 1.6424560546875, 1.734588623046875, 1.82672119140625, 1.918853759765625, 2.010986328125, 2.103118896484375, 2.19525146484375, 2.287384033203125, 2.3795166015625, 2.471649169921875, 2.56378173828125, 2.655914306640625, 2.748046875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 5.0, 14.0, 10.0, 22.0, 35.0, 39.0, 46.0, 58.0, 76.0, 94.0, 114.0, 112.0, 82.0, 57.0, 58.0, 52.0, 27.0, 22.0, 16.0, 12.0, 14.0, 4.0, 9.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00019621849060058594, -0.00018961355090141296, -0.00018300861120224, -0.00017640367150306702, -0.00016979873180389404, -0.00016319379210472107, -0.0001565888524055481, -0.00014998391270637512, -0.00014337897300720215, -0.00013677403330802917, -0.0001301690936088562, -0.00012356415390968323, -0.00011695921421051025, -0.00011035427451133728, -0.0001037493348121643, -9.714439511299133e-05, -9.053945541381836e-05, -8.393451571464539e-05, -7.732957601547241e-05, -7.072463631629944e-05, -6.411969661712646e-05, -5.751475691795349e-05, -5.090981721878052e-05, -4.4304877519607544e-05, -3.769993782043457e-05, -3.10949981212616e-05, -2.4490058422088623e-05, -1.788511872291565e-05, -1.1280179023742676e-05, -4.675239324569702e-06, 1.9297003746032715e-06, 8.534640073776245e-06, 1.5139579772949219e-05, 2.1744519472122192e-05, 2.8349459171295166e-05, 3.495439887046814e-05, 4.155933856964111e-05, 4.816427826881409e-05, 5.476921796798706e-05, 6.137415766716003e-05, 6.797909736633301e-05, 7.458403706550598e-05, 8.118897676467896e-05, 8.779391646385193e-05, 9.43988561630249e-05, 0.00010100379586219788, 0.00010760873556137085, 0.00011421367526054382, 0.0001208186149597168, 0.00012742355465888977, 0.00013402849435806274, 0.00014063343405723572, 0.0001472383737564087, 0.00015384331345558167, 0.00016044825315475464, 0.0001670531928539276, 0.00017365813255310059, 0.00018026307225227356, 0.00018686801195144653, 0.0001934729516506195, 0.00020007789134979248, 0.00020668283104896545, 0.00021328777074813843, 0.0002198927104473114, 0.00022649765014648438]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 17.0, 6.0, 23.0, 40.0, 106.0, 313.0, 1569.0, 13386.0, 430934.0, 583660.0, 16259.0, 1665.0, 351.0, 110.0, 56.0, 29.0, 6.0, 5.0, 8.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.046875, -4.929595947265625, -4.81231689453125, -4.695037841796875, -4.5777587890625, -4.460479736328125, -4.34320068359375, -4.225921630859375, -4.108642578125, -3.991363525390625, -3.87408447265625, -3.756805419921875, -3.6395263671875, -3.522247314453125, -3.40496826171875, -3.287689208984375, -3.17041015625, -3.053131103515625, -2.93585205078125, -2.818572998046875, -2.7012939453125, -2.584014892578125, -2.46673583984375, -2.349456787109375, -2.232177734375, -2.114898681640625, -1.99761962890625, -1.880340576171875, -1.7630615234375, -1.645782470703125, -1.52850341796875, -1.411224365234375, -1.2939453125, -1.176666259765625, -1.05938720703125, -0.942108154296875, -0.8248291015625, -0.707550048828125, -0.59027099609375, -0.472991943359375, -0.355712890625, -0.238433837890625, -0.12115478515625, -0.003875732421875, 0.1134033203125, 0.230682373046875, 0.34796142578125, 0.465240478515625, 0.58251953125, 0.699798583984375, 0.81707763671875, 0.934356689453125, 1.0516357421875, 1.168914794921875, 1.28619384765625, 1.403472900390625, 1.520751953125, 1.638031005859375, 1.75531005859375, 1.872589111328125, 1.9898681640625, 2.107147216796875, 2.22442626953125, 2.341705322265625, 2.458984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 3.0, 9.0, 12.0, 15.0, 29.0, 37.0, 50.0, 47.0, 60.0, 66.0, 92.0, 146.0, 87.0, 75.0, 62.0, 47.0, 43.0, 31.0, 26.0, 18.0, 17.0, 7.0, 6.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.98876953125, -0.9616165161132812, -0.9344635009765625, -0.9073104858398438, -0.880157470703125, -0.8530044555664062, -0.8258514404296875, -0.7986984252929688, -0.77154541015625, -0.7443923950195312, -0.7172393798828125, -0.6900863647460938, -0.662933349609375, -0.6357803344726562, -0.6086273193359375, -0.5814743041992188, -0.5543212890625, -0.5271682739257812, -0.5000152587890625, -0.47286224365234375, -0.445709228515625, -0.41855621337890625, -0.3914031982421875, -0.36425018310546875, -0.33709716796875, -0.30994415283203125, -0.2827911376953125, -0.25563812255859375, -0.228485107421875, -0.20133209228515625, -0.1741790771484375, -0.14702606201171875, -0.119873046875, -0.09272003173828125, -0.0655670166015625, -0.03841400146484375, -0.011260986328125, 0.01589202880859375, 0.0430450439453125, 0.07019805908203125, 0.09735107421875, 0.12450408935546875, 0.1516571044921875, 0.17881011962890625, 0.205963134765625, 0.23311614990234375, 0.2602691650390625, 0.28742218017578125, 0.3145751953125, 0.34172821044921875, 0.3688812255859375, 0.39603424072265625, 0.423187255859375, 0.45034027099609375, 0.4774932861328125, 0.5046463012695312, 0.53179931640625, 0.5589523315429688, 0.5861053466796875, 0.6132583618164062, 0.640411376953125, 0.6675643920898438, 0.6947174072265625, 0.7218704223632812, 0.7490234375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 11.0, 34.0, 116.0, 280.0, 307.0, 157.0, 68.0, 26.0, 8.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.430699348449707, -10.315457344055176, -9.200215339660645, -8.084973335266113, -6.969731330871582, -5.854489326477051, -4.7392473220825195, -3.6240053176879883, -2.508763313293457, -1.3935213088989258, -0.27827930450439453, 0.8369626998901367, 1.952204704284668, 3.067446708679199, 4.1826887130737305, 5.297930717468262, 6.413172721862793, 7.528414726257324, 8.643656730651855, 9.758898735046387, 10.874140739440918, 11.98938274383545, 13.10462474822998, 14.219866752624512, 15.335108757019043, 16.45035171508789, 17.565593719482422, 18.680835723876953, 19.796077728271484, 20.911319732666016, 22.026561737060547, 23.141803741455078, 24.25704574584961, 25.37228775024414, 26.487529754638672, 27.602771759033203, 28.718013763427734, 29.833255767822266, 30.948497772216797, 32.06373977661133, 33.17898178100586, 34.29422378540039, 35.40946578979492, 36.52470779418945, 37.639949798583984, 38.755191802978516, 39.87043380737305, 40.98567581176758, 42.10091781616211, 43.21615982055664, 44.33140182495117, 45.4466438293457, 46.561885833740234, 47.677127838134766, 48.7923698425293, 49.90761184692383, 51.02285385131836, 52.13809585571289, 53.25333786010742, 54.36857986450195, 55.483821868896484, 56.599063873291016, 57.71430587768555, 58.82954788208008, 59.94478988647461]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 4.0, 3.0, 7.0, 5.0, 5.0, 5.0, 11.0, 13.0, 14.0, 11.0, 18.0, 24.0, 20.0, 19.0, 18.0, 24.0, 40.0, 36.0, 35.0, 35.0, 32.0, 29.0, 46.0, 43.0, 33.0, 24.0, 37.0, 31.0, 48.0, 37.0, 32.0, 35.0, 24.0, 24.0, 28.0, 16.0, 19.0, 15.0, 15.0, 18.0, 9.0, 10.0, 14.0, 4.0, 4.0, 5.0, 9.0, 0.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-11.756836891174316, -11.40581226348877, -11.054786682128906, -10.70376205444336, -10.352737426757812, -10.001712799072266, -9.650687217712402, -9.299662590026855, -8.948637962341309, -8.597613334655762, -8.246587753295898, -7.895563125610352, -7.544538497924805, -7.1935133934021, -6.8424882888793945, -6.491463661193848, -6.140438556671143, -5.7894134521484375, -5.438388824462891, -5.0873637199401855, -4.736339092254639, -4.385313987731934, -4.034289360046387, -3.6832642555236816, -3.3322393894195557, -2.9812145233154297, -2.6301896572113037, -2.2791647911071777, -1.9281398057937622, -1.5771149396896362, -1.2260899543762207, -0.8750650882720947, -0.5240402221679688, -0.17301532626152039, 0.17800956964492798, 0.5290344953536987, 0.8800593614578247, 1.2310842275619507, 1.5821092128753662, 1.9331340789794922, 2.284158945083618, 2.635183811187744, 2.98620867729187, 3.337233543395996, 3.688258647918701, 4.039283275604248, 4.390308380126953, 4.7413330078125, 5.092358112335205, 5.44338321685791, 5.794407844543457, 6.145432949066162, 6.496457576751709, 6.847482681274414, 7.198507308959961, 7.549532413482666, 7.900557518005371, 8.251582145690918, 8.602607727050781, 8.953632354736328, 9.304656982421875, 9.655681610107422, 10.006707191467285, 10.357731819152832, 10.708756446838379]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 1.0, 0.0, 8.0, 14.0, 13.0, 20.0, 16.0, 27.0, 27.0, 55.0, 69.0, 88.0, 113.0, 169.0, 226.0, 395.0, 567.0, 974.0, 1782.0, 3578.0, 9053.0, 29444.0, 187915.0, 2130096.0, 1634637.0, 150826.0, 28009.0, 8553.0, 3489.0, 1669.0, 919.0, 509.0, 333.0, 197.0, 117.0, 91.0, 66.0, 71.0, 44.0, 34.0, 23.0, 8.0, 12.0, 8.0, 4.0, 8.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.96484375, -6.7655029296875, -6.566162109375, -6.3668212890625, -6.16748046875, -5.9681396484375, -5.768798828125, -5.5694580078125, -5.3701171875, -5.1707763671875, -4.971435546875, -4.7720947265625, -4.57275390625, -4.3734130859375, -4.174072265625, -3.9747314453125, -3.775390625, -3.5760498046875, -3.376708984375, -3.1773681640625, -2.97802734375, -2.7786865234375, -2.579345703125, -2.3800048828125, -2.1806640625, -1.9813232421875, -1.781982421875, -1.5826416015625, -1.38330078125, -1.1839599609375, -0.984619140625, -0.7852783203125, -0.5859375, -0.3865966796875, -0.187255859375, 0.0120849609375, 0.21142578125, 0.4107666015625, 0.610107421875, 0.8094482421875, 1.0087890625, 1.2081298828125, 1.407470703125, 1.6068115234375, 1.80615234375, 2.0054931640625, 2.204833984375, 2.4041748046875, 2.603515625, 2.8028564453125, 3.002197265625, 3.2015380859375, 3.40087890625, 3.6002197265625, 3.799560546875, 3.9989013671875, 4.1982421875, 4.3975830078125, 4.596923828125, 4.7962646484375, 4.99560546875, 5.1949462890625, 5.394287109375, 5.5936279296875, 5.79296875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 8.0, 2.0, 3.0, 7.0, 4.0, 7.0, 20.0, 16.0, 14.0, 26.0, 27.0, 27.0, 38.0, 39.0, 42.0, 40.0, 51.0, 60.0, 48.0, 48.0, 53.0, 63.0, 55.0, 47.0, 40.0, 36.0, 40.0, 37.0, 19.0, 23.0, 15.0, 13.0, 14.0, 5.0, 7.0, 4.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.0625, -4.925933837890625, -4.78936767578125, -4.652801513671875, -4.5162353515625, -4.379669189453125, -4.24310302734375, -4.106536865234375, -3.969970703125, -3.833404541015625, -3.69683837890625, -3.560272216796875, -3.4237060546875, -3.287139892578125, -3.15057373046875, -3.014007568359375, -2.87744140625, -2.740875244140625, -2.60430908203125, -2.467742919921875, -2.3311767578125, -2.194610595703125, -2.05804443359375, -1.921478271484375, -1.784912109375, -1.648345947265625, -1.51177978515625, -1.375213623046875, -1.2386474609375, -1.102081298828125, -0.96551513671875, -0.828948974609375, -0.6923828125, -0.555816650390625, -0.41925048828125, -0.282684326171875, -0.1461181640625, -0.009552001953125, 0.12701416015625, 0.263580322265625, 0.400146484375, 0.536712646484375, 0.67327880859375, 0.809844970703125, 0.9464111328125, 1.082977294921875, 1.21954345703125, 1.356109619140625, 1.49267578125, 1.629241943359375, 1.76580810546875, 1.902374267578125, 2.0389404296875, 2.175506591796875, 2.31207275390625, 2.448638916015625, 2.585205078125, 2.721771240234375, 2.85833740234375, 2.994903564453125, 3.1314697265625, 3.268035888671875, 3.40460205078125, 3.541168212890625, 3.677734375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 2.0, 6.0, 10.0, 7.0, 9.0, 12.0, 27.0, 46.0, 56.0, 140.0, 345.0, 1227.0, 7971.0, 289124.0, 3856777.0, 34604.0, 2853.0, 615.0, 214.0, 91.0, 59.0, 22.0, 17.0, 16.0, 4.0, 6.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.328125, -15.77001953125, -15.2119140625, -14.65380859375, -14.095703125, -13.53759765625, -12.9794921875, -12.42138671875, -11.86328125, -11.30517578125, -10.7470703125, -10.18896484375, -9.630859375, -9.07275390625, -8.5146484375, -7.95654296875, -7.3984375, -6.84033203125, -6.2822265625, -5.72412109375, -5.166015625, -4.60791015625, -4.0498046875, -3.49169921875, -2.93359375, -2.37548828125, -1.8173828125, -1.25927734375, -0.701171875, -0.14306640625, 0.4150390625, 0.97314453125, 1.53125, 2.08935546875, 2.6474609375, 3.20556640625, 3.763671875, 4.32177734375, 4.8798828125, 5.43798828125, 5.99609375, 6.55419921875, 7.1123046875, 7.67041015625, 8.228515625, 8.78662109375, 9.3447265625, 9.90283203125, 10.4609375, 11.01904296875, 11.5771484375, 12.13525390625, 12.693359375, 13.25146484375, 13.8095703125, 14.36767578125, 14.92578125, 15.48388671875, 16.0419921875, 16.60009765625, 17.158203125, 17.71630859375, 18.2744140625, 18.83251953125, 19.390625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 6.0, 11.0, 19.0, 24.0, 24.0, 36.0, 49.0, 77.0, 120.0, 172.0, 311.0, 453.0, 636.0, 673.0, 512.0, 341.0, 196.0, 104.0, 79.0, 63.0, 48.0, 27.0, 26.0, 8.0, 12.0, 7.0, 6.0, 7.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.5703125, -2.5010528564453125, -2.431793212890625, -2.3625335693359375, -2.29327392578125, -2.2240142822265625, -2.154754638671875, -2.0854949951171875, -2.0162353515625, -1.9469757080078125, -1.877716064453125, -1.8084564208984375, -1.73919677734375, -1.6699371337890625, -1.600677490234375, -1.5314178466796875, -1.462158203125, -1.3928985595703125, -1.323638916015625, -1.2543792724609375, -1.18511962890625, -1.1158599853515625, -1.046600341796875, -0.9773406982421875, -0.9080810546875, -0.8388214111328125, -0.769561767578125, -0.7003021240234375, -0.63104248046875, -0.5617828369140625, -0.492523193359375, -0.4232635498046875, -0.35400390625, -0.2847442626953125, -0.215484619140625, -0.1462249755859375, -0.07696533203125, -0.0077056884765625, 0.061553955078125, 0.1308135986328125, 0.2000732421875, 0.2693328857421875, 0.338592529296875, 0.4078521728515625, 0.47711181640625, 0.5463714599609375, 0.615631103515625, 0.6848907470703125, 0.754150390625, 0.8234100341796875, 0.892669677734375, 0.9619293212890625, 1.03118896484375, 1.1004486083984375, 1.169708251953125, 1.2389678955078125, 1.3082275390625, 1.3774871826171875, 1.446746826171875, 1.5160064697265625, 1.58526611328125, 1.6545257568359375, 1.723785400390625, 1.7930450439453125, 1.8623046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 7.0, 4.0, 8.0, 8.0, 17.0, 17.0, 24.0, 29.0, 35.0, 43.0, 55.0, 45.0, 71.0, 61.0, 68.0, 70.0, 69.0, 61.0, 57.0, 47.0, 43.0, 37.0, 32.0, 16.0, 15.0, 15.0, 15.0, 9.0, 11.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.285839557647705, -7.111353397369385, -6.9368672370910645, -6.762381076812744, -6.587894916534424, -6.4134087562561035, -6.238922595977783, -6.064436435699463, -5.889950275421143, -5.715464115142822, -5.540977954864502, -5.366491794586182, -5.192005634307861, -5.017519474029541, -4.843033313751221, -4.6685471534729, -4.49406099319458, -4.31957483291626, -4.1450886726379395, -3.970602512359619, -3.796116352081299, -3.6216301918029785, -3.447144031524658, -3.272657871246338, -3.0981717109680176, -2.9236855506896973, -2.749199390411377, -2.5747132301330566, -2.4002270698547363, -2.225740909576416, -2.0512547492980957, -1.8767685890197754, -1.7022829055786133, -1.527796745300293, -1.3533105850219727, -1.1788244247436523, -1.004338264465332, -0.8298521041870117, -0.6553659439086914, -0.4808797836303711, -0.3063936233520508, -0.13190746307373047, 0.042578697204589844, 0.21706485748291016, 0.39155101776123047, 0.5660371780395508, 0.7405233383178711, 0.9150094985961914, 1.0894956588745117, 1.263981819152832, 1.4384679794311523, 1.6129541397094727, 1.787440299987793, 1.9619264602661133, 2.1364126205444336, 2.310898780822754, 2.485384941101074, 2.6598711013793945, 2.834357261657715, 3.008843421936035, 3.1833295822143555, 3.357815742492676, 3.532301902770996, 3.7067880630493164, 3.8812742233276367]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 8.0, 6.0, 10.0, 12.0, 15.0, 12.0, 16.0, 19.0, 18.0, 19.0, 24.0, 20.0, 28.0, 22.0, 30.0, 31.0, 31.0, 38.0, 30.0, 48.0, 33.0, 36.0, 41.0, 37.0, 23.0, 29.0, 29.0, 32.0, 26.0, 40.0, 32.0, 19.0, 28.0, 27.0, 15.0, 11.0, 16.0, 16.0, 12.0, 13.0, 14.0, 3.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0], "bins": [-4.038170337677002, -3.920558452606201, -3.8029465675354004, -3.6853346824645996, -3.567722797393799, -3.450110912322998, -3.3324990272521973, -3.2148871421813965, -3.0972752571105957, -2.979663372039795, -2.862051486968994, -2.7444396018981934, -2.6268277168273926, -2.509215831756592, -2.391603946685791, -2.2739920616149902, -2.1563799381256104, -2.0387680530548096, -1.9211561679840088, -1.803544282913208, -1.6859323978424072, -1.5683205127716064, -1.4507085084915161, -1.3330966234207153, -1.2154847383499146, -1.0978728532791138, -0.980260968208313, -0.8626490235328674, -0.7450371384620667, -0.6274252533912659, -0.5098133087158203, -0.39220142364501953, -0.27458930015563965, -0.15697740018367767, -0.0393655002117157, 0.07824641466140747, 0.19585829973220825, 0.31347018480300903, 0.4310821294784546, 0.5486940145492554, 0.6663058996200562, 0.7839177846908569, 0.9015296697616577, 1.019141674041748, 1.1367535591125488, 1.2543654441833496, 1.3719773292541504, 1.4895892143249512, 1.607201099395752, 1.7248129844665527, 1.8424248695373535, 1.9600367546081543, 2.077648639678955, 2.195260524749756, 2.3128724098205566, 2.4304842948913574, 2.548096179962158, 2.665708065032959, 2.7833199501037598, 2.9009318351745605, 3.0185437202453613, 3.136155605316162, 3.253767490386963, 3.3713793754577637, 3.4889914989471436]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 5.0, 16.0, 20.0, 30.0, 61.0, 85.0, 155.0, 219.0, 407.0, 765.0, 1393.0, 2575.0, 5744.0, 12930.0, 32379.0, 95355.0, 299825.0, 380406.0, 139647.0, 45156.0, 17083.0, 7253.0, 3223.0, 1705.0, 905.0, 493.0, 261.0, 174.0, 92.0, 69.0, 41.0, 28.0, 15.0, 18.0, 5.0, 7.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.224609375, -1.1795196533203125, -1.134429931640625, -1.0893402099609375, -1.04425048828125, -0.9991607666015625, -0.954071044921875, -0.9089813232421875, -0.8638916015625, -0.8188018798828125, -0.773712158203125, -0.7286224365234375, -0.68353271484375, -0.6384429931640625, -0.593353271484375, -0.5482635498046875, -0.503173828125, -0.4580841064453125, -0.412994384765625, -0.3679046630859375, -0.32281494140625, -0.2777252197265625, -0.232635498046875, -0.1875457763671875, -0.1424560546875, -0.0973663330078125, -0.052276611328125, -0.0071868896484375, 0.03790283203125, 0.0829925537109375, 0.128082275390625, 0.1731719970703125, 0.21826171875, 0.2633514404296875, 0.308441162109375, 0.3535308837890625, 0.39862060546875, 0.4437103271484375, 0.488800048828125, 0.5338897705078125, 0.5789794921875, 0.6240692138671875, 0.669158935546875, 0.7142486572265625, 0.75933837890625, 0.8044281005859375, 0.849517822265625, 0.8946075439453125, 0.939697265625, 0.9847869873046875, 1.029876708984375, 1.0749664306640625, 1.12005615234375, 1.1651458740234375, 1.210235595703125, 1.2553253173828125, 1.3004150390625, 1.3455047607421875, 1.390594482421875, 1.4356842041015625, 1.48077392578125, 1.5258636474609375, 1.570953369140625, 1.6160430908203125, 1.6611328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 11.0, 8.0, 19.0, 16.0, 24.0, 22.0, 29.0, 20.0, 17.0, 36.0, 44.0, 45.0, 43.0, 56.0, 57.0, 53.0, 48.0, 30.0, 55.0, 49.0, 32.0, 40.0, 38.0, 41.0, 27.0, 24.0, 15.0, 18.0, 19.0, 11.0, 12.0, 13.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.59375, -2.50115966796875, -2.4085693359375, -2.31597900390625, -2.223388671875, -2.13079833984375, -2.0382080078125, -1.94561767578125, -1.85302734375, -1.76043701171875, -1.6678466796875, -1.57525634765625, -1.482666015625, -1.39007568359375, -1.2974853515625, -1.20489501953125, -1.1123046875, -1.01971435546875, -0.9271240234375, -0.83453369140625, -0.741943359375, -0.64935302734375, -0.5567626953125, -0.46417236328125, -0.37158203125, -0.27899169921875, -0.1864013671875, -0.09381103515625, -0.001220703125, 0.09136962890625, 0.1839599609375, 0.27655029296875, 0.369140625, 0.46173095703125, 0.5543212890625, 0.64691162109375, 0.739501953125, 0.83209228515625, 0.9246826171875, 1.01727294921875, 1.10986328125, 1.20245361328125, 1.2950439453125, 1.38763427734375, 1.480224609375, 1.57281494140625, 1.6654052734375, 1.75799560546875, 1.8505859375, 1.94317626953125, 2.0357666015625, 2.12835693359375, 2.220947265625, 2.31353759765625, 2.4061279296875, 2.49871826171875, 2.59130859375, 2.68389892578125, 2.7764892578125, 2.86907958984375, 2.961669921875, 3.05426025390625, 3.1468505859375, 3.23944091796875, 3.33203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 12.0, 8.0, 14.0, 16.0, 16.0, 23.0, 30.0, 51.0, 69.0, 115.0, 163.0, 280.0, 502.0, 896.0, 1961.0, 4569.0, 12281.0, 41022.0, 182834.0, 536296.0, 200844.0, 44167.0, 13169.0, 4800.0, 2114.0, 985.0, 506.0, 276.0, 166.0, 90.0, 83.0, 52.0, 34.0, 26.0, 23.0, 16.0, 17.0, 13.0, 4.0, 7.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8759765625, -1.8216400146484375, -1.767303466796875, -1.7129669189453125, -1.65863037109375, -1.6042938232421875, -1.549957275390625, -1.4956207275390625, -1.4412841796875, -1.3869476318359375, -1.332611083984375, -1.2782745361328125, -1.22393798828125, -1.1696014404296875, -1.115264892578125, -1.0609283447265625, -1.006591796875, -0.9522552490234375, -0.897918701171875, -0.8435821533203125, -0.78924560546875, -0.7349090576171875, -0.680572509765625, -0.6262359619140625, -0.5718994140625, -0.5175628662109375, -0.463226318359375, -0.4088897705078125, -0.35455322265625, -0.3002166748046875, -0.245880126953125, -0.1915435791015625, -0.13720703125, -0.0828704833984375, -0.028533935546875, 0.0258026123046875, 0.08013916015625, 0.1344757080078125, 0.188812255859375, 0.2431488037109375, 0.2974853515625, 0.3518218994140625, 0.406158447265625, 0.4604949951171875, 0.51483154296875, 0.5691680908203125, 0.623504638671875, 0.6778411865234375, 0.732177734375, 0.7865142822265625, 0.840850830078125, 0.8951873779296875, 0.94952392578125, 1.0038604736328125, 1.058197021484375, 1.1125335693359375, 1.1668701171875, 1.2212066650390625, 1.275543212890625, 1.3298797607421875, 1.38421630859375, 1.4385528564453125, 1.492889404296875, 1.5472259521484375, 1.6015625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 0.0, 0.0, 5.0, 5.0, 6.0, 7.0, 6.0, 10.0, 20.0, 15.0, 18.0, 16.0, 19.0, 22.0, 31.0, 22.0, 41.0, 39.0, 40.0, 52.0, 51.0, 35.0, 51.0, 45.0, 49.0, 48.0, 48.0, 39.0, 40.0, 37.0, 30.0, 17.0, 21.0, 18.0, 22.0, 13.0, 18.0, 5.0, 9.0, 7.0, 6.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.78515625, -6.57073974609375, -6.3563232421875, -6.14190673828125, -5.927490234375, -5.71307373046875, -5.4986572265625, -5.28424072265625, -5.06982421875, -4.85540771484375, -4.6409912109375, -4.42657470703125, -4.212158203125, -3.99774169921875, -3.7833251953125, -3.56890869140625, -3.3544921875, -3.14007568359375, -2.9256591796875, -2.71124267578125, -2.496826171875, -2.28240966796875, -2.0679931640625, -1.85357666015625, -1.63916015625, -1.42474365234375, -1.2103271484375, -0.99591064453125, -0.781494140625, -0.56707763671875, -0.3526611328125, -0.13824462890625, 0.076171875, 0.29058837890625, 0.5050048828125, 0.71942138671875, 0.933837890625, 1.14825439453125, 1.3626708984375, 1.57708740234375, 1.79150390625, 2.00592041015625, 2.2203369140625, 2.43475341796875, 2.649169921875, 2.86358642578125, 3.0780029296875, 3.29241943359375, 3.5068359375, 3.72125244140625, 3.9356689453125, 4.15008544921875, 4.364501953125, 4.57891845703125, 4.7933349609375, 5.00775146484375, 5.22216796875, 5.43658447265625, 5.6510009765625, 5.86541748046875, 6.079833984375, 6.29425048828125, 6.5086669921875, 6.72308349609375, 6.9375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 14.0, 9.0, 27.0, 42.0, 81.0, 107.0, 238.0, 505.0, 1223.0, 3418.0, 13980.0, 112173.0, 811504.0, 87988.0, 12059.0, 3162.0, 1074.0, 440.0, 210.0, 112.0, 71.0, 37.0, 22.0, 10.0, 11.0, 7.0, 5.0, 7.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4375, -1.37872314453125, -1.3199462890625, -1.26116943359375, -1.202392578125, -1.14361572265625, -1.0848388671875, -1.02606201171875, -0.96728515625, -0.90850830078125, -0.8497314453125, -0.79095458984375, -0.732177734375, -0.67340087890625, -0.6146240234375, -0.55584716796875, -0.4970703125, -0.43829345703125, -0.3795166015625, -0.32073974609375, -0.261962890625, -0.20318603515625, -0.1444091796875, -0.08563232421875, -0.02685546875, 0.03192138671875, 0.0906982421875, 0.14947509765625, 0.208251953125, 0.26702880859375, 0.3258056640625, 0.38458251953125, 0.443359375, 0.50213623046875, 0.5609130859375, 0.61968994140625, 0.678466796875, 0.73724365234375, 0.7960205078125, 0.85479736328125, 0.91357421875, 0.97235107421875, 1.0311279296875, 1.08990478515625, 1.148681640625, 1.20745849609375, 1.2662353515625, 1.32501220703125, 1.3837890625, 1.44256591796875, 1.5013427734375, 1.56011962890625, 1.618896484375, 1.67767333984375, 1.7364501953125, 1.79522705078125, 1.85400390625, 1.91278076171875, 1.9715576171875, 2.03033447265625, 2.089111328125, 2.14788818359375, 2.2066650390625, 2.26544189453125, 2.32421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 3.0, 5.0, 4.0, 6.0, 7.0, 10.0, 18.0, 20.0, 40.0, 71.0, 113.0, 154.0, 124.0, 116.0, 90.0, 68.0, 32.0, 35.0, 26.0, 17.0, 8.0, 8.0, 11.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006036758422851562, -0.0005866661667823792, -0.000569656491279602, -0.000552646815776825, -0.0005356371402740479, -0.0005186274647712708, -0.0005016177892684937, -0.00048460811376571655, -0.00046759843826293945, -0.00045058876276016235, -0.00043357908725738525, -0.00041656941175460815, -0.00039955973625183105, -0.00038255006074905396, -0.00036554038524627686, -0.00034853070974349976, -0.00033152103424072266, -0.00031451135873794556, -0.00029750168323516846, -0.00028049200773239136, -0.00026348233222961426, -0.00024647265672683716, -0.00022946298122406006, -0.00021245330572128296, -0.00019544363021850586, -0.00017843395471572876, -0.00016142427921295166, -0.00014441460371017456, -0.00012740492820739746, -0.00011039525270462036, -9.338557720184326e-05, -7.637590169906616e-05, -5.936622619628906e-05, -4.235655069351196e-05, -2.5346875190734863e-05, -8.337199687957764e-06, 8.672475814819336e-06, 2.5682151317596436e-05, 4.2691826820373535e-05, 5.9701502323150635e-05, 7.671117782592773e-05, 9.372085332870483e-05, 0.00011073052883148193, 0.00012774020433425903, 0.00014474987983703613, 0.00016175955533981323, 0.00017876923084259033, 0.00019577890634536743, 0.00021278858184814453, 0.00022979825735092163, 0.00024680793285369873, 0.00026381760835647583, 0.00028082728385925293, 0.00029783695936203003, 0.00031484663486480713, 0.00033185631036758423, 0.00034886598587036133, 0.00036587566137313843, 0.00038288533687591553, 0.0003998950123786926, 0.0004169046878814697, 0.0004339143633842468, 0.0004509240388870239, 0.000467933714389801, 0.0004849433898925781]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 7.0, 3.0, 4.0, 8.0, 16.0, 10.0, 14.0, 15.0, 37.0, 75.0, 108.0, 216.0, 468.0, 1176.0, 3027.0, 8658.0, 28501.0, 153889.0, 634469.0, 172464.0, 30778.0, 9129.0, 3270.0, 1239.0, 466.0, 203.0, 104.0, 61.0, 32.0, 29.0, 19.0, 13.0, 12.0, 4.0, 8.0, 4.0, 4.0, 5.0, 2.0, 1.0, 4.0, 1.0, 3.0], "bins": [-1.7666015625, -1.7219085693359375, -1.677215576171875, -1.6325225830078125, -1.58782958984375, -1.5431365966796875, -1.498443603515625, -1.4537506103515625, -1.4090576171875, -1.3643646240234375, -1.319671630859375, -1.2749786376953125, -1.23028564453125, -1.1855926513671875, -1.140899658203125, -1.0962066650390625, -1.051513671875, -1.0068206787109375, -0.962127685546875, -0.9174346923828125, -0.87274169921875, -0.8280487060546875, -0.783355712890625, -0.7386627197265625, -0.6939697265625, -0.6492767333984375, -0.604583740234375, -0.5598907470703125, -0.51519775390625, -0.4705047607421875, -0.425811767578125, -0.3811187744140625, -0.33642578125, -0.2917327880859375, -0.247039794921875, -0.2023468017578125, -0.15765380859375, -0.1129608154296875, -0.068267822265625, -0.0235748291015625, 0.0211181640625, 0.0658111572265625, 0.110504150390625, 0.1551971435546875, 0.19989013671875, 0.2445831298828125, 0.289276123046875, 0.3339691162109375, 0.378662109375, 0.4233551025390625, 0.468048095703125, 0.5127410888671875, 0.55743408203125, 0.6021270751953125, 0.646820068359375, 0.6915130615234375, 0.7362060546875, 0.7808990478515625, 0.825592041015625, 0.8702850341796875, 0.91497802734375, 0.9596710205078125, 1.004364013671875, 1.0490570068359375, 1.09375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 7.0, 5.0, 7.0, 4.0, 9.0, 11.0, 16.0, 15.0, 40.0, 50.0, 60.0, 117.0, 142.0, 123.0, 119.0, 76.0, 60.0, 33.0, 26.0, 18.0, 17.0, 6.0, 7.0, 4.0, 2.0, 2.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.332275390625, -0.3185462951660156, -0.30481719970703125, -0.2910881042480469, -0.2773590087890625, -0.2636299133300781, -0.24990081787109375, -0.23617172241210938, -0.222442626953125, -0.20871353149414062, -0.19498443603515625, -0.18125534057617188, -0.1675262451171875, -0.15379714965820312, -0.14006805419921875, -0.12633895874023438, -0.11260986328125, -0.09888076782226562, -0.08515167236328125, -0.07142257690429688, -0.0576934814453125, -0.043964385986328125, -0.03023529052734375, -0.016506195068359375, -0.002777099609375, 0.010951995849609375, 0.02468109130859375, 0.038410186767578125, 0.0521392822265625, 0.06586837768554688, 0.07959747314453125, 0.09332656860351562, 0.1070556640625, 0.12078475952148438, 0.13451385498046875, 0.14824295043945312, 0.1619720458984375, 0.17570114135742188, 0.18943023681640625, 0.20315933227539062, 0.216888427734375, 0.23061752319335938, 0.24434661865234375, 0.2580757141113281, 0.2718048095703125, 0.2855339050292969, 0.29926300048828125, 0.3129920959472656, 0.32672119140625, 0.3404502868652344, 0.35417938232421875, 0.3679084777832031, 0.3816375732421875, 0.3953666687011719, 0.40909576416015625, 0.4228248596191406, 0.436553955078125, 0.4502830505371094, 0.46401214599609375, 0.4777412414550781, 0.4914703369140625, 0.5051994323730469, 0.5189285278320312, 0.5326576232910156, 0.54638671875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 0.0, 4.0, 4.0, 10.0, 10.0, 16.0, 21.0, 20.0, 28.0, 47.0, 65.0, 58.0, 62.0, 90.0, 83.0, 77.0, 79.0, 68.0, 64.0, 40.0, 41.0, 32.0, 25.0, 13.0, 15.0, 7.0, 8.0, 9.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.798011779785156, -4.679961204528809, -4.561911106109619, -4.4438605308532715, -4.325810432434082, -4.207759857177734, -4.089709281921387, -3.971658945083618, -3.8536086082458496, -3.735558271408081, -3.6175079345703125, -3.499457359313965, -3.3814070224761963, -3.2633566856384277, -3.14530611038208, -3.0272557735443115, -2.909205436706543, -2.7911550998687744, -2.673104763031006, -2.555054187774658, -2.4370038509368896, -2.318953514099121, -2.2009029388427734, -2.082852602005005, -1.9648022651672363, -1.8467519283294678, -1.7287014722824097, -1.6106510162353516, -1.492600679397583, -1.3745503425598145, -1.2564998865127563, -1.1384494304656982, -1.0203993320465088, -0.9023489356040955, -0.7842985391616821, -0.6662481427192688, -0.5481977462768555, -0.43014734983444214, -0.3120969533920288, -0.19404655694961548, -0.07599616050720215, 0.04205423593521118, 0.1601046323776245, 0.27815502882003784, 0.39620542526245117, 0.5142558217048645, 0.6323062181472778, 0.7503566145896912, 0.8684070110321045, 0.9864574074745178, 1.1045078039169312, 1.2225582599639893, 1.3406085968017578, 1.4586589336395264, 1.5767093896865845, 1.6947598457336426, 1.8128101825714111, 1.9308605194091797, 2.0489110946655273, 2.166961431503296, 2.2850117683410645, 2.403062105178833, 2.5211124420166016, 2.639163017272949, 2.7572133541107178]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 5.0, 5.0, 11.0, 13.0, 11.0, 12.0, 12.0, 18.0, 24.0, 26.0, 26.0, 32.0, 36.0, 36.0, 40.0, 46.0, 42.0, 30.0, 36.0, 45.0, 50.0, 51.0, 32.0, 48.0, 30.0, 24.0, 38.0, 27.0, 29.0, 19.0, 27.0, 18.0, 22.0, 15.0, 12.0, 13.0, 9.0, 11.0, 6.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-2.553150177001953, -2.4733266830444336, -2.393503189086914, -2.3136796951293945, -2.233856201171875, -2.1540329456329346, -2.074209451675415, -1.9943859577178955, -1.914562463760376, -1.8347389698028564, -1.754915475845337, -1.675092101097107, -1.5952686071395874, -1.5154451131820679, -1.435621738433838, -1.3557982444763184, -1.2759747505187988, -1.1961512565612793, -1.1163277626037598, -1.0365043878555298, -0.9566808938980103, -0.8768573999404907, -0.797033965587616, -0.7172105312347412, -0.6373870372772217, -0.5575635433197021, -0.4777401089668274, -0.39791664481163025, -0.3180931806564331, -0.23826971650123596, -0.15844625234603882, -0.07862281799316406, 0.0012004375457763672, 0.08102390170097351, 0.16084736585617065, 0.2406708300113678, 0.32049429416656494, 0.4003177583217621, 0.48014122247695923, 0.559964656829834, 0.6397881507873535, 0.719611644744873, 0.7994350790977478, 0.8792585134506226, 0.9590820074081421, 1.0389055013656616, 1.1187288761138916, 1.1985523700714111, 1.2783758640289307, 1.3581993579864502, 1.4380228519439697, 1.5178462266921997, 1.5976697206497192, 1.6774932146072388, 1.7573165893554688, 1.8371400833129883, 1.9169635772705078, 1.9967870712280273, 2.076610565185547, 2.1564340591430664, 2.236257553100586, 2.3160808086395264, 2.395904302597046, 2.4757277965545654, 2.555551290512085]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 3.0, 8.0, 10.0, 14.0, 26.0, 21.0, 37.0, 56.0, 116.0, 198.0, 325.0, 726.0, 1426.0, 3608.0, 9836.0, 33182.0, 150954.0, 589352.0, 198547.0, 40861.0, 11794.0, 4106.0, 1648.0, 799.0, 363.0, 210.0, 109.0, 73.0, 41.0, 30.0, 25.0, 8.0, 18.0, 9.0, 4.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0546875, -5.87957763671875, -5.7044677734375, -5.52935791015625, -5.354248046875, -5.17913818359375, -5.0040283203125, -4.82891845703125, -4.65380859375, -4.47869873046875, -4.3035888671875, -4.12847900390625, -3.953369140625, -3.77825927734375, -3.6031494140625, -3.42803955078125, -3.2529296875, -3.07781982421875, -2.9027099609375, -2.72760009765625, -2.552490234375, -2.37738037109375, -2.2022705078125, -2.02716064453125, -1.85205078125, -1.67694091796875, -1.5018310546875, -1.32672119140625, -1.151611328125, -0.97650146484375, -0.8013916015625, -0.62628173828125, -0.451171875, -0.27606201171875, -0.1009521484375, 0.07415771484375, 0.249267578125, 0.42437744140625, 0.5994873046875, 0.77459716796875, 0.94970703125, 1.12481689453125, 1.2999267578125, 1.47503662109375, 1.650146484375, 1.82525634765625, 2.0003662109375, 2.17547607421875, 2.3505859375, 2.52569580078125, 2.7008056640625, 2.87591552734375, 3.051025390625, 3.22613525390625, 3.4012451171875, 3.57635498046875, 3.75146484375, 3.92657470703125, 4.1016845703125, 4.27679443359375, 4.451904296875, 4.62701416015625, 4.8021240234375, 4.97723388671875, 5.15234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 11.0, 8.0, 21.0, 10.0, 16.0, 21.0, 28.0, 30.0, 40.0, 33.0, 28.0, 38.0, 49.0, 37.0, 61.0, 50.0, 56.0, 61.0, 45.0, 45.0, 40.0, 31.0, 40.0, 26.0, 29.0, 31.0, 19.0, 14.0, 19.0, 14.0, 12.0, 6.0, 10.0, 8.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78515625, -5.5869140625, -5.388671875, -5.1904296875, -4.9921875, -4.7939453125, -4.595703125, -4.3974609375, -4.19921875, -4.0009765625, -3.802734375, -3.6044921875, -3.40625, -3.2080078125, -3.009765625, -2.8115234375, -2.61328125, -2.4150390625, -2.216796875, -2.0185546875, -1.8203125, -1.6220703125, -1.423828125, -1.2255859375, -1.02734375, -0.8291015625, -0.630859375, -0.4326171875, -0.234375, -0.0361328125, 0.162109375, 0.3603515625, 0.55859375, 0.7568359375, 0.955078125, 1.1533203125, 1.3515625, 1.5498046875, 1.748046875, 1.9462890625, 2.14453125, 2.3427734375, 2.541015625, 2.7392578125, 2.9375, 3.1357421875, 3.333984375, 3.5322265625, 3.73046875, 3.9287109375, 4.126953125, 4.3251953125, 4.5234375, 4.7216796875, 4.919921875, 5.1181640625, 5.31640625, 5.5146484375, 5.712890625, 5.9111328125, 6.109375, 6.3076171875, 6.505859375, 6.7041015625, 6.90234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 8.0, 8.0, 16.0, 17.0, 36.0, 41.0, 93.0, 173.0, 421.0, 1205.0, 4567.0, 26457.0, 342480.0, 617824.0, 45834.0, 6785.0, 1590.0, 507.0, 211.0, 117.0, 53.0, 33.0, 14.0, 14.0, 7.0, 5.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.1875, -8.91015625, -8.6328125, -8.35546875, -8.078125, -7.80078125, -7.5234375, -7.24609375, -6.96875, -6.69140625, -6.4140625, -6.13671875, -5.859375, -5.58203125, -5.3046875, -5.02734375, -4.75, -4.47265625, -4.1953125, -3.91796875, -3.640625, -3.36328125, -3.0859375, -2.80859375, -2.53125, -2.25390625, -1.9765625, -1.69921875, -1.421875, -1.14453125, -0.8671875, -0.58984375, -0.3125, -0.03515625, 0.2421875, 0.51953125, 0.796875, 1.07421875, 1.3515625, 1.62890625, 1.90625, 2.18359375, 2.4609375, 2.73828125, 3.015625, 3.29296875, 3.5703125, 3.84765625, 4.125, 4.40234375, 4.6796875, 4.95703125, 5.234375, 5.51171875, 5.7890625, 6.06640625, 6.34375, 6.62109375, 6.8984375, 7.17578125, 7.453125, 7.73046875, 8.0078125, 8.28515625, 8.5625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 5.0, 4.0, 15.0, 19.0, 15.0, 17.0, 31.0, 48.0, 33.0, 47.0, 48.0, 57.0, 67.0, 59.0, 55.0, 53.0, 60.0, 60.0, 37.0, 55.0, 48.0, 44.0, 20.0, 24.0, 15.0, 15.0, 12.0, 8.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0546875, -8.7734375, -8.4921875, -8.2109375, -7.9296875, -7.6484375, -7.3671875, -7.0859375, -6.8046875, -6.5234375, -6.2421875, -5.9609375, -5.6796875, -5.3984375, -5.1171875, -4.8359375, -4.5546875, -4.2734375, -3.9921875, -3.7109375, -3.4296875, -3.1484375, -2.8671875, -2.5859375, -2.3046875, -2.0234375, -1.7421875, -1.4609375, -1.1796875, -0.8984375, -0.6171875, -0.3359375, -0.0546875, 0.2265625, 0.5078125, 0.7890625, 1.0703125, 1.3515625, 1.6328125, 1.9140625, 2.1953125, 2.4765625, 2.7578125, 3.0390625, 3.3203125, 3.6015625, 3.8828125, 4.1640625, 4.4453125, 4.7265625, 5.0078125, 5.2890625, 5.5703125, 5.8515625, 6.1328125, 6.4140625, 6.6953125, 6.9765625, 7.2578125, 7.5390625, 7.8203125, 8.1015625, 8.3828125, 8.6640625, 8.9453125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 6.0, 10.0, 12.0, 30.0, 25.0, 49.0, 101.0, 252.0, 792.0, 3538.0, 27164.0, 378746.0, 589465.0, 41845.0, 4910.0, 978.0, 311.0, 107.0, 61.0, 42.0, 20.0, 17.0, 8.0, 12.0, 7.0, 7.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.26171875, -2.186553955078125, -2.11138916015625, -2.036224365234375, -1.9610595703125, -1.885894775390625, -1.81072998046875, -1.735565185546875, -1.660400390625, -1.585235595703125, -1.51007080078125, -1.434906005859375, -1.3597412109375, -1.284576416015625, -1.20941162109375, -1.134246826171875, -1.05908203125, -0.983917236328125, -0.90875244140625, -0.833587646484375, -0.7584228515625, -0.683258056640625, -0.60809326171875, -0.532928466796875, -0.457763671875, -0.382598876953125, -0.30743408203125, -0.232269287109375, -0.1571044921875, -0.081939697265625, -0.00677490234375, 0.068389892578125, 0.1435546875, 0.218719482421875, 0.29388427734375, 0.369049072265625, 0.4442138671875, 0.519378662109375, 0.59454345703125, 0.669708251953125, 0.744873046875, 0.820037841796875, 0.89520263671875, 0.970367431640625, 1.0455322265625, 1.120697021484375, 1.19586181640625, 1.271026611328125, 1.34619140625, 1.421356201171875, 1.49652099609375, 1.571685791015625, 1.6468505859375, 1.722015380859375, 1.79718017578125, 1.872344970703125, 1.947509765625, 2.022674560546875, 2.09783935546875, 2.173004150390625, 2.2481689453125, 2.323333740234375, 2.39849853515625, 2.473663330078125, 2.548828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 7.0, 15.0, 16.0, 18.0, 14.0, 19.0, 35.0, 44.0, 59.0, 72.0, 113.0, 140.0, 111.0, 97.0, 69.0, 39.0, 34.0, 20.0, 21.0, 12.0, 11.0, 10.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002815723419189453, -0.00027325376868247986, -0.0002649351954460144, -0.00025661662220954895, -0.0002482980489730835, -0.00023997947573661804, -0.0002316609025001526, -0.00022334232926368713, -0.00021502375602722168, -0.00020670518279075623, -0.00019838660955429077, -0.00019006803631782532, -0.00018174946308135986, -0.0001734308898448944, -0.00016511231660842896, -0.0001567937433719635, -0.00014847517013549805, -0.0001401565968990326, -0.00013183802366256714, -0.00012351945042610168, -0.00011520087718963623, -0.00010688230395317078, -9.856373071670532e-05, -9.024515748023987e-05, -8.192658424377441e-05, -7.360801100730896e-05, -6.52894377708435e-05, -5.697086453437805e-05, -4.86522912979126e-05, -4.0333718061447144e-05, -3.201514482498169e-05, -2.3696571588516235e-05, -1.537799835205078e-05, -7.059425115585327e-06, 1.259148120880127e-06, 9.577721357345581e-06, 1.7896294593811035e-05, 2.621486783027649e-05, 3.453344106674194e-05, 4.28520143032074e-05, 5.117058753967285e-05, 5.9489160776138306e-05, 6.780773401260376e-05, 7.612630724906921e-05, 8.444488048553467e-05, 9.276345372200012e-05, 0.00010108202695846558, 0.00010940060019493103, 0.00011771917343139648, 0.00012603774666786194, 0.0001343563199043274, 0.00014267489314079285, 0.0001509934663772583, 0.00015931203961372375, 0.0001676306128501892, 0.00017594918608665466, 0.00018426775932312012, 0.00019258633255958557, 0.00020090490579605103, 0.00020922347903251648, 0.00021754205226898193, 0.0002258606255054474, 0.00023417919874191284, 0.0002424977719783783, 0.00025081634521484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 4.0, 8.0, 8.0, 19.0, 28.0, 61.0, 138.0, 336.0, 1023.0, 4081.0, 26817.0, 328569.0, 625053.0, 53369.0, 6631.0, 1579.0, 477.0, 186.0, 64.0, 35.0, 26.0, 12.0, 4.0, 5.0, 4.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.27734375, -3.191436767578125, -3.10552978515625, -3.019622802734375, -2.9337158203125, -2.847808837890625, -2.76190185546875, -2.675994873046875, -2.590087890625, -2.504180908203125, -2.41827392578125, -2.332366943359375, -2.2464599609375, -2.160552978515625, -2.07464599609375, -1.988739013671875, -1.90283203125, -1.816925048828125, -1.73101806640625, -1.645111083984375, -1.5592041015625, -1.473297119140625, -1.38739013671875, -1.301483154296875, -1.215576171875, -1.129669189453125, -1.04376220703125, -0.957855224609375, -0.8719482421875, -0.786041259765625, -0.70013427734375, -0.614227294921875, -0.5283203125, -0.442413330078125, -0.35650634765625, -0.270599365234375, -0.1846923828125, -0.098785400390625, -0.01287841796875, 0.073028564453125, 0.158935546875, 0.244842529296875, 0.33074951171875, 0.416656494140625, 0.5025634765625, 0.588470458984375, 0.67437744140625, 0.760284423828125, 0.84619140625, 0.932098388671875, 1.01800537109375, 1.103912353515625, 1.1898193359375, 1.275726318359375, 1.36163330078125, 1.447540283203125, 1.533447265625, 1.619354248046875, 1.70526123046875, 1.791168212890625, 1.8770751953125, 1.962982177734375, 2.04888916015625, 2.134796142578125, 2.220703125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 13.0, 6.0, 12.0, 25.0, 21.0, 38.0, 46.0, 50.0, 94.0, 112.0, 119.0, 106.0, 85.0, 59.0, 50.0, 41.0, 42.0, 23.0, 12.0, 14.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.91259765625, -0.8838882446289062, -0.8551788330078125, -0.8264694213867188, -0.797760009765625, -0.7690505981445312, -0.7403411865234375, -0.7116317749023438, -0.68292236328125, -0.6542129516601562, -0.6255035400390625, -0.5967941284179688, -0.568084716796875, -0.5393753051757812, -0.5106658935546875, -0.48195648193359375, -0.4532470703125, -0.42453765869140625, -0.3958282470703125, -0.36711883544921875, -0.338409423828125, -0.30970001220703125, -0.2809906005859375, -0.25228118896484375, -0.22357177734375, -0.19486236572265625, -0.1661529541015625, -0.13744354248046875, -0.108734130859375, -0.08002471923828125, -0.0513153076171875, -0.02260589599609375, 0.006103515625, 0.03481292724609375, 0.0635223388671875, 0.09223175048828125, 0.120941162109375, 0.14965057373046875, 0.1783599853515625, 0.20706939697265625, 0.23577880859375, 0.26448822021484375, 0.2931976318359375, 0.32190704345703125, 0.350616455078125, 0.37932586669921875, 0.4080352783203125, 0.43674468994140625, 0.4654541015625, 0.49416351318359375, 0.5228729248046875, 0.5515823364257812, 0.580291748046875, 0.6090011596679688, 0.6377105712890625, 0.6664199829101562, 0.69512939453125, 0.7238388061523438, 0.7525482177734375, 0.7812576293945312, 0.809967041015625, 0.8386764526367188, 0.8673858642578125, 0.8960952758789062, 0.9248046875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 6.0, 20.0, 37.0, 68.0, 98.0, 138.0, 148.0, 155.0, 125.0, 90.0, 48.0, 36.0, 18.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.142560005187988, -7.656235218048096, -7.169909954071045, -6.683585166931152, -6.197259902954102, -5.710935115814209, -5.224610328674316, -4.738285064697266, -4.251960277557373, -3.7656352519989014, -3.2793102264404297, -2.792985439300537, -2.3066604137420654, -1.8203353881835938, -1.3340106010437012, -0.8476855754852295, -0.3613605499267578, 0.12496441602706909, 0.611289381980896, 1.0976142883300781, 1.5839393138885498, 2.0702643394470215, 2.556589126586914, 3.0429141521453857, 3.5292391777038574, 4.01556396484375, 4.501889228820801, 4.988214015960693, 5.474538803100586, 5.960864067077637, 6.447188854217529, 6.933513641357422, 7.419837951660156, 7.906162738800049, 8.392487525939941, 8.878812789916992, 9.365138053894043, 9.851463317871094, 10.337787628173828, 10.824112892150879, 11.31043815612793, 11.79676342010498, 12.283087730407715, 12.769412994384766, 13.255738258361816, 13.742063522338867, 14.228387832641602, 14.714713096618652, 15.201037406921387, 15.687362670898438, 16.173686981201172, 16.660011291503906, 17.146337509155273, 17.632661819458008, 18.118988037109375, 18.60531234741211, 19.091636657714844, 19.577960968017578, 20.064287185668945, 20.55061149597168, 21.036935806274414, 21.52326202392578, 22.009586334228516, 22.49591064453125, 22.982236862182617]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 3.0, 1.0, 4.0, 9.0, 7.0, 4.0, 5.0, 11.0, 10.0, 7.0, 18.0, 29.0, 24.0, 31.0, 24.0, 37.0, 30.0, 39.0, 38.0, 38.0, 38.0, 44.0, 43.0, 36.0, 49.0, 46.0, 43.0, 37.0, 37.0, 30.0, 28.0, 25.0, 37.0, 34.0, 17.0, 29.0, 14.0, 16.0, 9.0, 9.0, 3.0, 4.0, 5.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.328472137451172, -8.972537994384766, -8.61660385131836, -8.260669708251953, -7.904735565185547, -7.548801422119141, -7.192867279052734, -6.836933135986328, -6.480998992919922, -6.125064849853516, -5.769130706787109, -5.413196563720703, -5.057262420654297, -4.701328277587891, -4.345394134521484, -3.989459753036499, -3.6335253715515137, -3.2775912284851074, -2.921657085418701, -2.565722942352295, -2.2097887992858887, -1.8538545370101929, -1.497920274734497, -1.1419861316680908, -0.7860519886016846, -0.43011781573295593, -0.0741836428642273, 0.28175055980682373, 0.63768470287323, 0.9936188459396362, 1.349553108215332, 1.7054872512817383, 2.0614213943481445, 2.417355537414551, 2.773289680480957, 3.1292238235473633, 3.4851579666137695, 3.841092109680176, 4.197026252746582, 4.552960395812988, 4.9088945388793945, 5.264828681945801, 5.620762825012207, 5.976696968078613, 6.3326311111450195, 6.688565254211426, 7.044499397277832, 7.400433540344238, 7.756368160247803, 8.112302780151367, 8.468236923217773, 8.82417106628418, 9.180105209350586, 9.536039352416992, 9.891973495483398, 10.247907638549805, 10.603841781616211, 10.959775924682617, 11.315710067749023, 11.67164421081543, 12.027578353881836, 12.383512496948242, 12.739446640014648, 13.095380783081055, 13.451314926147461]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 7.0, 14.0, 9.0, 22.0, 16.0, 24.0, 37.0, 58.0, 64.0, 98.0, 199.0, 320.0, 706.0, 1392.0, 3299.0, 8778.0, 34301.0, 418948.0, 3259120.0, 414707.0, 36311.0, 9333.0, 3411.0, 1456.0, 695.0, 364.0, 220.0, 113.0, 76.0, 42.0, 35.0, 35.0, 16.0, 7.0, 6.0, 11.0, 11.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.53125, -7.299560546875, -7.06787109375, -6.836181640625, -6.6044921875, -6.372802734375, -6.14111328125, -5.909423828125, -5.677734375, -5.446044921875, -5.21435546875, -4.982666015625, -4.7509765625, -4.519287109375, -4.28759765625, -4.055908203125, -3.82421875, -3.592529296875, -3.36083984375, -3.129150390625, -2.8974609375, -2.665771484375, -2.43408203125, -2.202392578125, -1.970703125, -1.739013671875, -1.50732421875, -1.275634765625, -1.0439453125, -0.812255859375, -0.58056640625, -0.348876953125, -0.1171875, 0.114501953125, 0.34619140625, 0.577880859375, 0.8095703125, 1.041259765625, 1.27294921875, 1.504638671875, 1.736328125, 1.968017578125, 2.19970703125, 2.431396484375, 2.6630859375, 2.894775390625, 3.12646484375, 3.358154296875, 3.58984375, 3.821533203125, 4.05322265625, 4.284912109375, 4.5166015625, 4.748291015625, 4.97998046875, 5.211669921875, 5.443359375, 5.675048828125, 5.90673828125, 6.138427734375, 6.3701171875, 6.601806640625, 6.83349609375, 7.065185546875, 7.296875]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 10.0, 10.0, 15.0, 21.0, 29.0, 25.0, 32.0, 36.0, 46.0, 54.0, 52.0, 54.0, 61.0, 51.0, 57.0, 57.0, 46.0, 48.0, 45.0, 38.0, 47.0, 35.0, 25.0, 14.0, 27.0, 11.0, 12.0, 11.0, 10.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.265625, -4.146575927734375, -4.02752685546875, -3.908477783203125, -3.7894287109375, -3.670379638671875, -3.55133056640625, -3.432281494140625, -3.313232421875, -3.194183349609375, -3.07513427734375, -2.956085205078125, -2.8370361328125, -2.717987060546875, -2.59893798828125, -2.479888916015625, -2.36083984375, -2.241790771484375, -2.12274169921875, -2.003692626953125, -1.8846435546875, -1.765594482421875, -1.64654541015625, -1.527496337890625, -1.408447265625, -1.289398193359375, -1.17034912109375, -1.051300048828125, -0.9322509765625, -0.813201904296875, -0.69415283203125, -0.575103759765625, -0.4560546875, -0.337005615234375, -0.21795654296875, -0.098907470703125, 0.0201416015625, 0.139190673828125, 0.25823974609375, 0.377288818359375, 0.496337890625, 0.615386962890625, 0.73443603515625, 0.853485107421875, 0.9725341796875, 1.091583251953125, 1.21063232421875, 1.329681396484375, 1.44873046875, 1.567779541015625, 1.68682861328125, 1.805877685546875, 1.9249267578125, 2.043975830078125, 2.16302490234375, 2.282073974609375, 2.401123046875, 2.520172119140625, 2.63922119140625, 2.758270263671875, 2.8773193359375, 2.996368408203125, 3.11541748046875, 3.234466552734375, 3.353515625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 5.0, 2.0, 12.0, 16.0, 22.0, 28.0, 34.0, 54.0, 107.0, 283.0, 1077.0, 6404.0, 109712.0, 4008078.0, 62229.0, 4809.0, 880.0, 258.0, 96.0, 68.0, 29.0, 22.0, 18.0, 14.0, 10.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.796875, -18.2808837890625, -17.764892578125, -17.2489013671875, -16.73291015625, -16.2169189453125, -15.700927734375, -15.1849365234375, -14.6689453125, -14.1529541015625, -13.636962890625, -13.1209716796875, -12.60498046875, -12.0889892578125, -11.572998046875, -11.0570068359375, -10.541015625, -10.0250244140625, -9.509033203125, -8.9930419921875, -8.47705078125, -7.9610595703125, -7.445068359375, -6.9290771484375, -6.4130859375, -5.8970947265625, -5.381103515625, -4.8651123046875, -4.34912109375, -3.8331298828125, -3.317138671875, -2.8011474609375, -2.28515625, -1.7691650390625, -1.253173828125, -0.7371826171875, -0.22119140625, 0.2947998046875, 0.810791015625, 1.3267822265625, 1.8427734375, 2.3587646484375, 2.874755859375, 3.3907470703125, 3.90673828125, 4.4227294921875, 4.938720703125, 5.4547119140625, 5.970703125, 6.4866943359375, 7.002685546875, 7.5186767578125, 8.03466796875, 8.5506591796875, 9.066650390625, 9.5826416015625, 10.0986328125, 10.6146240234375, 11.130615234375, 11.6466064453125, 12.16259765625, 12.6785888671875, 13.194580078125, 13.7105712890625, 14.2265625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 10.0, 6.0, 7.0, 10.0, 11.0, 20.0, 18.0, 34.0, 58.0, 73.0, 150.0, 257.0, 422.0, 662.0, 744.0, 604.0, 391.0, 223.0, 124.0, 73.0, 46.0, 27.0, 18.0, 17.0, 14.0, 12.0, 12.0, 5.0, 7.0, 4.0, 1.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6943359375, -1.6221160888671875, -1.549896240234375, -1.4776763916015625, -1.40545654296875, -1.3332366943359375, -1.261016845703125, -1.1887969970703125, -1.1165771484375, -1.0443572998046875, -0.972137451171875, -0.8999176025390625, -0.82769775390625, -0.7554779052734375, -0.683258056640625, -0.6110382080078125, -0.538818359375, -0.4665985107421875, -0.394378662109375, -0.3221588134765625, -0.24993896484375, -0.1777191162109375, -0.105499267578125, -0.0332794189453125, 0.0389404296875, 0.1111602783203125, 0.183380126953125, 0.2555999755859375, 0.32781982421875, 0.4000396728515625, 0.472259521484375, 0.5444793701171875, 0.61669921875, 0.6889190673828125, 0.761138916015625, 0.8333587646484375, 0.90557861328125, 0.9777984619140625, 1.050018310546875, 1.1222381591796875, 1.1944580078125, 1.2666778564453125, 1.338897705078125, 1.4111175537109375, 1.48333740234375, 1.5555572509765625, 1.627777099609375, 1.6999969482421875, 1.772216796875, 1.8444366455078125, 1.916656494140625, 1.9888763427734375, 2.06109619140625, 2.1333160400390625, 2.205535888671875, 2.2777557373046875, 2.3499755859375, 2.4221954345703125, 2.494415283203125, 2.5666351318359375, 2.63885498046875, 2.7110748291015625, 2.783294677734375, 2.8555145263671875, 2.927734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 2.0, 6.0, 16.0, 14.0, 23.0, 25.0, 38.0, 48.0, 49.0, 48.0, 57.0, 71.0, 66.0, 69.0, 77.0, 67.0, 63.0, 53.0, 44.0, 40.0, 28.0, 20.0, 16.0, 13.0, 11.0, 10.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.329634189605713, -6.166843414306641, -6.004053115844727, -5.841262340545654, -5.678471565246582, -5.515681266784668, -5.352890491485596, -5.190099716186523, -5.027309417724609, -4.864518642425537, -4.701728343963623, -4.538937568664551, -4.3761467933654785, -4.213356018066406, -4.050565719604492, -3.88777494430542, -3.7249841690063477, -3.5621936321258545, -3.3994028568267822, -3.236612319946289, -3.073821544647217, -2.9110310077667236, -2.7482404708862305, -2.585449695587158, -2.422659158706665, -2.259868621826172, -2.0970778465270996, -1.9342873096466064, -1.7714966535568237, -1.608705997467041, -1.4459154605865479, -1.2831248044967651, -1.1203336715698242, -0.9575430154800415, -0.7947524189949036, -0.6319618225097656, -0.4691711664199829, -0.3063805103302002, -0.14358991384506226, 0.019200682640075684, 0.1819913387298584, 0.3447819650173187, 0.507572591304779, 0.670363187789917, 0.8331538438796997, 0.9959444999694824, 1.1587350368499756, 1.3215256929397583, 1.484316349029541, 1.6471070051193237, 1.8098976612091064, 1.9726881980895996, 2.135478973388672, 2.298269510269165, 2.461060047149658, 2.6238508224487305, 2.7866413593292236, 2.949431896209717, 3.112222671508789, 3.2750132083892822, 3.4378037452697754, 3.6005945205688477, 3.763385057449341, 3.926175594329834, 4.088966369628906]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 11.0, 13.0, 12.0, 16.0, 17.0, 21.0, 27.0, 29.0, 33.0, 37.0, 28.0, 47.0, 34.0, 54.0, 39.0, 51.0, 40.0, 56.0, 40.0, 51.0, 55.0, 39.0, 27.0, 31.0, 32.0, 18.0, 24.0, 22.0, 17.0, 10.0, 18.0, 10.0, 7.0, 5.0, 5.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.208187103271484, -4.072391033172607, -3.9365949630737305, -3.8007988929748535, -3.6650028228759766, -3.5292067527770996, -3.3934106826782227, -3.2576146125793457, -3.1218185424804688, -2.986022472381592, -2.850226402282715, -2.714430332183838, -2.578634262084961, -2.442838191986084, -2.307042121887207, -2.17124605178833, -2.035449981689453, -1.8996539115905762, -1.7638578414916992, -1.6280617713928223, -1.4922657012939453, -1.3564696311950684, -1.2206735610961914, -1.0848774909973145, -0.9490814208984375, -0.8132853507995605, -0.6774892807006836, -0.5416932106018066, -0.4058971405029297, -0.27010107040405273, -0.13430500030517578, 0.0014910697937011719, 0.13728761672973633, 0.2730836868286133, 0.40887975692749023, 0.5446758270263672, 0.6804718971252441, 0.8162679672241211, 0.952064037322998, 1.087860107421875, 1.223656177520752, 1.359452247619629, 1.4952483177185059, 1.6310443878173828, 1.7668404579162598, 1.9026365280151367, 2.0384325981140137, 2.1742286682128906, 2.3100247383117676, 2.4458208084106445, 2.5816168785095215, 2.7174129486083984, 2.8532090187072754, 2.9890050888061523, 3.1248011589050293, 3.2605972290039062, 3.396393299102783, 3.53218936920166, 3.667985439300537, 3.803781509399414, 3.939577579498291, 4.075373649597168, 4.211169719696045, 4.346965789794922, 4.482761859893799]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 8.0, 12.0, 11.0, 14.0, 19.0, 24.0, 34.0, 51.0, 79.0, 123.0, 170.0, 290.0, 439.0, 729.0, 1233.0, 2352.0, 4353.0, 10329.0, 41251.0, 375201.0, 526954.0, 61032.0, 12500.0, 5144.0, 2599.0, 1436.0, 837.0, 473.0, 295.0, 181.0, 110.0, 74.0, 64.0, 42.0, 32.0, 16.0, 15.0, 10.0, 5.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.7197265625, -1.6707305908203125, -1.621734619140625, -1.5727386474609375, -1.52374267578125, -1.4747467041015625, -1.425750732421875, -1.3767547607421875, -1.3277587890625, -1.2787628173828125, -1.229766845703125, -1.1807708740234375, -1.13177490234375, -1.0827789306640625, -1.033782958984375, -0.9847869873046875, -0.935791015625, -0.8867950439453125, -0.837799072265625, -0.7888031005859375, -0.73980712890625, -0.6908111572265625, -0.641815185546875, -0.5928192138671875, -0.5438232421875, -0.4948272705078125, -0.445831298828125, -0.3968353271484375, -0.34783935546875, -0.2988433837890625, -0.249847412109375, -0.2008514404296875, -0.15185546875, -0.1028594970703125, -0.053863525390625, -0.0048675537109375, 0.04412841796875, 0.0931243896484375, 0.142120361328125, 0.1911163330078125, 0.2401123046875, 0.2891082763671875, 0.338104248046875, 0.3871002197265625, 0.43609619140625, 0.4850921630859375, 0.534088134765625, 0.5830841064453125, 0.632080078125, 0.6810760498046875, 0.730072021484375, 0.7790679931640625, 0.82806396484375, 0.8770599365234375, 0.926055908203125, 0.9750518798828125, 1.0240478515625, 1.0730438232421875, 1.122039794921875, 1.1710357666015625, 1.22003173828125, 1.2690277099609375, 1.318023681640625, 1.3670196533203125, 1.416015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 0.0, 5.0, 5.0, 9.0, 13.0, 16.0, 23.0, 13.0, 20.0, 16.0, 21.0, 22.0, 26.0, 46.0, 43.0, 50.0, 42.0, 49.0, 56.0, 54.0, 48.0, 53.0, 43.0, 32.0, 47.0, 38.0, 33.0, 33.0, 26.0, 17.0, 22.0, 15.0, 14.0, 9.0, 9.0, 10.0, 5.0, 5.0, 9.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.609375, -2.520111083984375, -2.43084716796875, -2.341583251953125, -2.2523193359375, -2.163055419921875, -2.07379150390625, -1.984527587890625, -1.895263671875, -1.805999755859375, -1.71673583984375, -1.627471923828125, -1.5382080078125, -1.448944091796875, -1.35968017578125, -1.270416259765625, -1.18115234375, -1.091888427734375, -1.00262451171875, -0.913360595703125, -0.8240966796875, -0.734832763671875, -0.64556884765625, -0.556304931640625, -0.467041015625, -0.377777099609375, -0.28851318359375, -0.199249267578125, -0.1099853515625, -0.020721435546875, 0.06854248046875, 0.157806396484375, 0.2470703125, 0.336334228515625, 0.42559814453125, 0.514862060546875, 0.6041259765625, 0.693389892578125, 0.78265380859375, 0.871917724609375, 0.961181640625, 1.050445556640625, 1.13970947265625, 1.228973388671875, 1.3182373046875, 1.407501220703125, 1.49676513671875, 1.586029052734375, 1.67529296875, 1.764556884765625, 1.85382080078125, 1.943084716796875, 2.0323486328125, 2.121612548828125, 2.21087646484375, 2.300140380859375, 2.389404296875, 2.478668212890625, 2.56793212890625, 2.657196044921875, 2.7464599609375, 2.835723876953125, 2.92498779296875, 3.014251708984375, 3.103515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 8.0, 5.0, 7.0, 4.0, 8.0, 23.0, 23.0, 45.0, 79.0, 119.0, 223.0, 440.0, 940.0, 2055.0, 5543.0, 21928.0, 280679.0, 674250.0, 47889.0, 8797.0, 2991.0, 1275.0, 550.0, 253.0, 162.0, 89.0, 56.0, 40.0, 18.0, 20.0, 9.0, 11.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8212890625, -1.7609710693359375, -1.700653076171875, -1.6403350830078125, -1.58001708984375, -1.5196990966796875, -1.459381103515625, -1.3990631103515625, -1.3387451171875, -1.2784271240234375, -1.218109130859375, -1.1577911376953125, -1.09747314453125, -1.0371551513671875, -0.976837158203125, -0.9165191650390625, -0.856201171875, -0.7958831787109375, -0.735565185546875, -0.6752471923828125, -0.61492919921875, -0.5546112060546875, -0.494293212890625, -0.4339752197265625, -0.3736572265625, -0.3133392333984375, -0.253021240234375, -0.1927032470703125, -0.13238525390625, -0.0720672607421875, -0.011749267578125, 0.0485687255859375, 0.10888671875, 0.1692047119140625, 0.229522705078125, 0.2898406982421875, 0.35015869140625, 0.4104766845703125, 0.470794677734375, 0.5311126708984375, 0.5914306640625, 0.6517486572265625, 0.712066650390625, 0.7723846435546875, 0.83270263671875, 0.8930206298828125, 0.953338623046875, 1.0136566162109375, 1.073974609375, 1.1342926025390625, 1.194610595703125, 1.2549285888671875, 1.31524658203125, 1.3755645751953125, 1.435882568359375, 1.4962005615234375, 1.5565185546875, 1.6168365478515625, 1.677154541015625, 1.7374725341796875, 1.79779052734375, 1.8581085205078125, 1.918426513671875, 1.9787445068359375, 2.0390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 7.0, 5.0, 8.0, 12.0, 9.0, 13.0, 19.0, 15.0, 16.0, 22.0, 29.0, 33.0, 27.0, 33.0, 39.0, 37.0, 35.0, 33.0, 39.0, 43.0, 45.0, 55.0, 35.0, 36.0, 30.0, 34.0, 32.0, 33.0, 33.0, 23.0, 32.0, 17.0, 25.0, 18.0, 14.0, 8.0, 8.0, 5.0, 5.0, 5.0, 1.0, 5.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.875, -6.67205810546875, -6.4691162109375, -6.26617431640625, -6.063232421875, -5.86029052734375, -5.6573486328125, -5.45440673828125, -5.25146484375, -5.04852294921875, -4.8455810546875, -4.64263916015625, -4.439697265625, -4.23675537109375, -4.0338134765625, -3.83087158203125, -3.6279296875, -3.42498779296875, -3.2220458984375, -3.01910400390625, -2.816162109375, -2.61322021484375, -2.4102783203125, -2.20733642578125, -2.00439453125, -1.80145263671875, -1.5985107421875, -1.39556884765625, -1.192626953125, -0.98968505859375, -0.7867431640625, -0.58380126953125, -0.380859375, -0.17791748046875, 0.0250244140625, 0.22796630859375, 0.430908203125, 0.63385009765625, 0.8367919921875, 1.03973388671875, 1.24267578125, 1.44561767578125, 1.6485595703125, 1.85150146484375, 2.054443359375, 2.25738525390625, 2.4603271484375, 2.66326904296875, 2.8662109375, 3.06915283203125, 3.2720947265625, 3.47503662109375, 3.677978515625, 3.88092041015625, 4.0838623046875, 4.28680419921875, 4.48974609375, 4.69268798828125, 4.8956298828125, 5.09857177734375, 5.301513671875, 5.50445556640625, 5.7073974609375, 5.91033935546875, 6.11328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 11.0, 8.0, 11.0, 23.0, 24.0, 55.0, 67.0, 130.0, 213.0, 361.0, 775.0, 1722.0, 4197.0, 12803.0, 108008.0, 856917.0, 47940.0, 9240.0, 3296.0, 1340.0, 630.0, 319.0, 189.0, 96.0, 55.0, 38.0, 23.0, 15.0, 12.0, 8.0, 7.0, 5.0, 8.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2060546875, -1.1565704345703125, -1.107086181640625, -1.0576019287109375, -1.00811767578125, -0.9586334228515625, -0.909149169921875, -0.8596649169921875, -0.8101806640625, -0.7606964111328125, -0.711212158203125, -0.6617279052734375, -0.61224365234375, -0.5627593994140625, -0.513275146484375, -0.4637908935546875, -0.414306640625, -0.3648223876953125, -0.315338134765625, -0.2658538818359375, -0.21636962890625, -0.1668853759765625, -0.117401123046875, -0.0679168701171875, -0.0184326171875, 0.0310516357421875, 0.080535888671875, 0.1300201416015625, 0.17950439453125, 0.2289886474609375, 0.278472900390625, 0.3279571533203125, 0.37744140625, 0.4269256591796875, 0.476409912109375, 0.5258941650390625, 0.57537841796875, 0.6248626708984375, 0.674346923828125, 0.7238311767578125, 0.7733154296875, 0.8227996826171875, 0.872283935546875, 0.9217681884765625, 0.97125244140625, 1.0207366943359375, 1.070220947265625, 1.1197052001953125, 1.169189453125, 1.2186737060546875, 1.268157958984375, 1.3176422119140625, 1.36712646484375, 1.4166107177734375, 1.466094970703125, 1.5155792236328125, 1.5650634765625, 1.6145477294921875, 1.664031982421875, 1.7135162353515625, 1.76300048828125, 1.8124847412109375, 1.861968994140625, 1.9114532470703125, 1.9609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 2.0, 4.0, 6.0, 11.0, 6.0, 18.0, 41.0, 63.0, 94.0, 164.0, 192.0, 154.0, 94.0, 69.0, 26.0, 16.0, 12.0, 6.0, 7.0, 6.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005822181701660156, -0.000565260648727417, -0.0005483031272888184, -0.0005313456058502197, -0.0005143880844116211, -0.0004974305629730225, -0.00048047304153442383, -0.0004635155200958252, -0.00044655799865722656, -0.00042960047721862793, -0.0004126429557800293, -0.00039568543434143066, -0.00037872791290283203, -0.0003617703914642334, -0.00034481287002563477, -0.00032785534858703613, -0.0003108978271484375, -0.00029394030570983887, -0.00027698278427124023, -0.0002600252628326416, -0.00024306774139404297, -0.00022611021995544434, -0.0002091526985168457, -0.00019219517707824707, -0.00017523765563964844, -0.0001582801342010498, -0.00014132261276245117, -0.00012436509132385254, -0.0001074075698852539, -9.045004844665527e-05, -7.349252700805664e-05, -5.653500556945801e-05, -3.9577484130859375e-05, -2.2619962692260742e-05, -5.662441253662109e-06, 1.1295080184936523e-05, 2.8252601623535156e-05, 4.521012306213379e-05, 6.216764450073242e-05, 7.912516593933105e-05, 9.608268737792969e-05, 0.00011304020881652832, 0.00012999773025512695, 0.00014695525169372559, 0.00016391277313232422, 0.00018087029457092285, 0.00019782781600952148, 0.00021478533744812012, 0.00023174285888671875, 0.0002487003803253174, 0.000265657901763916, 0.00028261542320251465, 0.0002995729446411133, 0.0003165304660797119, 0.00033348798751831055, 0.0003504455089569092, 0.0003674030303955078, 0.00038436055183410645, 0.0004013180732727051, 0.0004182755947113037, 0.00043523311614990234, 0.000452190637588501, 0.0004691481590270996, 0.00048610568046569824, 0.0005030632019042969]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 7.0, 22.0, 26.0, 54.0, 77.0, 130.0, 172.0, 307.0, 474.0, 786.0, 1311.0, 2227.0, 3950.0, 7784.0, 19161.0, 82103.0, 476630.0, 365116.0, 57681.0, 15178.0, 6663.0, 3366.0, 1997.0, 1243.0, 727.0, 489.0, 318.0, 196.0, 109.0, 95.0, 50.0, 39.0, 29.0, 10.0, 7.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7705078125, -0.745574951171875, -0.72064208984375, -0.695709228515625, -0.6707763671875, -0.645843505859375, -0.62091064453125, -0.595977783203125, -0.571044921875, -0.546112060546875, -0.52117919921875, -0.496246337890625, -0.4713134765625, -0.446380615234375, -0.42144775390625, -0.396514892578125, -0.37158203125, -0.346649169921875, -0.32171630859375, -0.296783447265625, -0.2718505859375, -0.246917724609375, -0.22198486328125, -0.197052001953125, -0.172119140625, -0.147186279296875, -0.12225341796875, -0.097320556640625, -0.0723876953125, -0.047454833984375, -0.02252197265625, 0.002410888671875, 0.02734375, 0.052276611328125, 0.07720947265625, 0.102142333984375, 0.1270751953125, 0.152008056640625, 0.17694091796875, 0.201873779296875, 0.226806640625, 0.251739501953125, 0.27667236328125, 0.301605224609375, 0.3265380859375, 0.351470947265625, 0.37640380859375, 0.401336669921875, 0.42626953125, 0.451202392578125, 0.47613525390625, 0.501068115234375, 0.5260009765625, 0.550933837890625, 0.57586669921875, 0.600799560546875, 0.625732421875, 0.650665283203125, 0.67559814453125, 0.700531005859375, 0.7254638671875, 0.750396728515625, 0.77532958984375, 0.800262451171875, 0.8251953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 6.0, 9.0, 7.0, 13.0, 29.0, 52.0, 72.0, 127.0, 194.0, 175.0, 129.0, 73.0, 50.0, 14.0, 15.0, 11.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.38330078125, -0.37166595458984375, -0.3600311279296875, -0.34839630126953125, -0.336761474609375, -0.32512664794921875, -0.3134918212890625, -0.30185699462890625, -0.29022216796875, -0.27858734130859375, -0.2669525146484375, -0.25531768798828125, -0.243682861328125, -0.23204803466796875, -0.2204132080078125, -0.20877838134765625, -0.1971435546875, -0.18550872802734375, -0.1738739013671875, -0.16223907470703125, -0.150604248046875, -0.13896942138671875, -0.1273345947265625, -0.11569976806640625, -0.10406494140625, -0.09243011474609375, -0.0807952880859375, -0.06916046142578125, -0.057525634765625, -0.04589080810546875, -0.0342559814453125, -0.02262115478515625, -0.010986328125, 0.00064849853515625, 0.0122833251953125, 0.02391815185546875, 0.035552978515625, 0.04718780517578125, 0.0588226318359375, 0.07045745849609375, 0.08209228515625, 0.09372711181640625, 0.1053619384765625, 0.11699676513671875, 0.128631591796875, 0.14026641845703125, 0.1519012451171875, 0.16353607177734375, 0.1751708984375, 0.18680572509765625, 0.1984405517578125, 0.21007537841796875, 0.221710205078125, 0.23334503173828125, 0.2449798583984375, 0.25661468505859375, 0.26824951171875, 0.27988433837890625, 0.2915191650390625, 0.30315399169921875, 0.314788818359375, 0.32642364501953125, 0.3380584716796875, 0.34969329833984375, 0.361328125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 6.0, 16.0, 25.0, 21.0, 25.0, 32.0, 45.0, 47.0, 61.0, 72.0, 60.0, 69.0, 75.0, 85.0, 66.0, 58.0, 53.0, 35.0, 30.0, 25.0, 23.0, 16.0, 8.0, 11.0, 9.0, 2.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.216189384460449, -4.112933158874512, -4.009677410125732, -3.906421184539795, -3.8031649589538574, -3.699908971786499, -3.5966529846191406, -3.493396759033203, -3.3901405334472656, -3.2868845462799072, -3.1836283206939697, -3.0803723335266113, -2.977116107940674, -2.8738601207733154, -2.770604133605957, -2.6673479080200195, -2.564091920852661, -2.4608359336853027, -2.3575797080993652, -2.254323720932007, -2.1510674953460693, -2.047811508178711, -1.944555401802063, -1.841299295425415, -1.738043189048767, -1.6347870826721191, -1.5315309762954712, -1.4282748699188232, -1.3250188827514648, -1.2217626571655273, -1.118506669998169, -1.015250563621521, -0.911994218826294, -0.808738112449646, -0.705482006072998, -0.6022259593009949, -0.4989698529243469, -0.395713746547699, -0.2924576997756958, -0.18920159339904785, -0.0859454870223999, 0.017310604453086853, 0.12056669592857361, 0.22382277250289917, 0.3270788788795471, 0.43033498525619507, 0.5335910320281982, 0.6368471384048462, 0.7401032447814941, 0.8433593511581421, 0.94661545753479, 1.0498714447021484, 1.153127670288086, 1.2563836574554443, 1.3596397638320923, 1.4628958702087402, 1.5661519765853882, 1.6694080829620361, 1.772664189338684, 1.875920295715332, 1.9791762828826904, 2.082432508468628, 2.1856884956359863, 2.288944721221924, 2.3922007083892822]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 8.0, 11.0, 6.0, 13.0, 12.0, 12.0, 26.0, 16.0, 31.0, 26.0, 39.0, 31.0, 41.0, 42.0, 43.0, 38.0, 61.0, 57.0, 50.0, 51.0, 49.0, 49.0, 26.0, 40.0, 38.0, 24.0, 30.0, 29.0, 17.0, 10.0, 12.0, 14.0, 10.0, 7.0, 9.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.465258836746216, -2.377323627471924, -2.289388656616211, -2.201453447341919, -2.113518238067627, -2.025583267211914, -1.937648057937622, -1.84971284866333, -1.7617777585983276, -1.6738426685333252, -1.5859074592590332, -1.4979723691940308, -1.4100372791290283, -1.3221020698547363, -1.2341669797897339, -1.1462318897247314, -1.0582966804504395, -0.9703615307807922, -0.882426381111145, -0.7944912910461426, -0.7065561413764954, -0.6186209917068481, -0.5306859016418457, -0.4427507519721985, -0.35481560230255127, -0.26688045263290405, -0.17894533276557922, -0.0910102128982544, -0.0030750632286071777, 0.08486008644104004, 0.17279517650604248, 0.2607303261756897, 0.3486652374267578, 0.43660038709640503, 0.5245355367660522, 0.6124706268310547, 0.7004057765007019, 0.7883409261703491, 0.8762760162353516, 0.9642111659049988, 1.052146315574646, 1.1400814056396484, 1.2280166149139404, 1.3159517049789429, 1.4038867950439453, 1.4918220043182373, 1.5797570943832397, 1.6676921844482422, 1.7556273937225342, 1.8435624837875366, 1.9314976930618286, 2.019432783126831, 2.107367992401123, 2.195302963256836, 2.283238172531128, 2.37117338180542, 2.459108352661133, 2.547043561935425, 2.6349785327911377, 2.7229137420654297, 2.8108489513397217, 2.8987841606140137, 2.9867191314697266, 3.0746543407440186, 3.1625895500183105]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 6.0, 8.0, 2.0, 4.0, 11.0, 13.0, 22.0, 34.0, 37.0, 64.0, 93.0, 128.0, 189.0, 292.0, 457.0, 840.0, 1381.0, 2579.0, 5356.0, 12239.0, 29863.0, 77947.0, 236650.0, 431748.0, 154942.0, 54381.0, 21155.0, 8965.0, 4091.0, 2080.0, 1132.0, 637.0, 388.0, 260.0, 171.0, 120.0, 75.0, 64.0, 49.0, 27.0, 18.0, 13.0, 8.0, 6.0, 2.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.37890625, -5.21746826171875, -5.0560302734375, -4.89459228515625, -4.733154296875, -4.57171630859375, -4.4102783203125, -4.24884033203125, -4.08740234375, -3.92596435546875, -3.7645263671875, -3.60308837890625, -3.441650390625, -3.28021240234375, -3.1187744140625, -2.95733642578125, -2.7958984375, -2.63446044921875, -2.4730224609375, -2.31158447265625, -2.150146484375, -1.98870849609375, -1.8272705078125, -1.66583251953125, -1.50439453125, -1.34295654296875, -1.1815185546875, -1.02008056640625, -0.858642578125, -0.69720458984375, -0.5357666015625, -0.37432861328125, -0.212890625, -0.05145263671875, 0.1099853515625, 0.27142333984375, 0.432861328125, 0.59429931640625, 0.7557373046875, 0.91717529296875, 1.07861328125, 1.24005126953125, 1.4014892578125, 1.56292724609375, 1.724365234375, 1.88580322265625, 2.0472412109375, 2.20867919921875, 2.3701171875, 2.53155517578125, 2.6929931640625, 2.85443115234375, 3.015869140625, 3.17730712890625, 3.3387451171875, 3.50018310546875, 3.66162109375, 3.82305908203125, 3.9844970703125, 4.14593505859375, 4.307373046875, 4.46881103515625, 4.6302490234375, 4.79168701171875, 4.953125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 8.0, 0.0, 6.0, 3.0, 9.0, 8.0, 11.0, 10.0, 22.0, 16.0, 21.0, 32.0, 42.0, 37.0, 45.0, 36.0, 48.0, 49.0, 57.0, 67.0, 54.0, 65.0, 56.0, 44.0, 40.0, 44.0, 30.0, 26.0, 30.0, 19.0, 18.0, 10.0, 15.0, 8.0, 6.0, 8.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.4913330078125, -4.322509765625, -4.1536865234375, -3.98486328125, -3.8160400390625, -3.647216796875, -3.4783935546875, -3.3095703125, -3.1407470703125, -2.971923828125, -2.8031005859375, -2.63427734375, -2.4654541015625, -2.296630859375, -2.1278076171875, -1.958984375, -1.7901611328125, -1.621337890625, -1.4525146484375, -1.28369140625, -1.1148681640625, -0.946044921875, -0.7772216796875, -0.6083984375, -0.4395751953125, -0.270751953125, -0.1019287109375, 0.06689453125, 0.2357177734375, 0.404541015625, 0.5733642578125, 0.7421875, 0.9110107421875, 1.079833984375, 1.2486572265625, 1.41748046875, 1.5863037109375, 1.755126953125, 1.9239501953125, 2.0927734375, 2.2615966796875, 2.430419921875, 2.5992431640625, 2.76806640625, 2.9368896484375, 3.105712890625, 3.2745361328125, 3.443359375, 3.6121826171875, 3.781005859375, 3.9498291015625, 4.11865234375, 4.2874755859375, 4.456298828125, 4.6251220703125, 4.7939453125, 4.9627685546875, 5.131591796875, 5.3004150390625, 5.46923828125, 5.6380615234375, 5.806884765625, 5.9757080078125, 6.14453125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 5.0, 10.0, 10.0, 10.0, 9.0, 18.0, 35.0, 37.0, 52.0, 73.0, 104.0, 107.0, 160.0, 291.0, 416.0, 660.0, 1117.0, 2002.0, 3712.0, 7393.0, 14617.0, 31118.0, 67935.0, 163220.0, 357906.0, 226794.0, 91094.0, 40296.0, 19038.0, 9293.0, 4771.0, 2548.0, 1376.0, 825.0, 461.0, 302.0, 204.0, 131.0, 100.0, 75.0, 56.0, 52.0, 25.0, 30.0, 24.0, 13.0, 8.0, 8.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0], "bins": [-4.25, -4.11993408203125, -3.9898681640625, -3.85980224609375, -3.729736328125, -3.59967041015625, -3.4696044921875, -3.33953857421875, -3.20947265625, -3.07940673828125, -2.9493408203125, -2.81927490234375, -2.689208984375, -2.55914306640625, -2.4290771484375, -2.29901123046875, -2.1689453125, -2.03887939453125, -1.9088134765625, -1.77874755859375, -1.648681640625, -1.51861572265625, -1.3885498046875, -1.25848388671875, -1.12841796875, -0.99835205078125, -0.8682861328125, -0.73822021484375, -0.608154296875, -0.47808837890625, -0.3480224609375, -0.21795654296875, -0.087890625, 0.04217529296875, 0.1722412109375, 0.30230712890625, 0.432373046875, 0.56243896484375, 0.6925048828125, 0.82257080078125, 0.95263671875, 1.08270263671875, 1.2127685546875, 1.34283447265625, 1.472900390625, 1.60296630859375, 1.7330322265625, 1.86309814453125, 1.9931640625, 2.12322998046875, 2.2532958984375, 2.38336181640625, 2.513427734375, 2.64349365234375, 2.7735595703125, 2.90362548828125, 3.03369140625, 3.16375732421875, 3.2938232421875, 3.42388916015625, 3.553955078125, 3.68402099609375, 3.8140869140625, 3.94415283203125, 4.07421875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 2.0, 11.0, 13.0, 12.0, 17.0, 20.0, 22.0, 37.0, 37.0, 53.0, 37.0, 39.0, 63.0, 58.0, 67.0, 70.0, 62.0, 69.0, 41.0, 51.0, 31.0, 30.0, 28.0, 31.0, 27.0, 12.0, 14.0, 6.0, 5.0, 7.0, 6.0, 5.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.1484375, -7.9278564453125, -7.707275390625, -7.4866943359375, -7.26611328125, -7.0455322265625, -6.824951171875, -6.6043701171875, -6.3837890625, -6.1632080078125, -5.942626953125, -5.7220458984375, -5.50146484375, -5.2808837890625, -5.060302734375, -4.8397216796875, -4.619140625, -4.3985595703125, -4.177978515625, -3.9573974609375, -3.73681640625, -3.5162353515625, -3.295654296875, -3.0750732421875, -2.8544921875, -2.6339111328125, -2.413330078125, -2.1927490234375, -1.97216796875, -1.7515869140625, -1.531005859375, -1.3104248046875, -1.08984375, -0.8692626953125, -0.648681640625, -0.4281005859375, -0.20751953125, 0.0130615234375, 0.233642578125, 0.4542236328125, 0.6748046875, 0.8953857421875, 1.115966796875, 1.3365478515625, 1.55712890625, 1.7777099609375, 1.998291015625, 2.2188720703125, 2.439453125, 2.6600341796875, 2.880615234375, 3.1011962890625, 3.32177734375, 3.5423583984375, 3.762939453125, 3.9835205078125, 4.2041015625, 4.4246826171875, 4.645263671875, 4.8658447265625, 5.08642578125, 5.3070068359375, 5.527587890625, 5.7481689453125, 5.96875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 15.0, 12.0, 17.0, 19.0, 28.0, 44.0, 57.0, 83.0, 92.0, 142.0, 204.0, 315.0, 425.0, 635.0, 1000.0, 1739.0, 3556.0, 7302.0, 17376.0, 44367.0, 115876.0, 364266.0, 304736.0, 111948.0, 42262.0, 16643.0, 7160.0, 3380.0, 1742.0, 992.0, 625.0, 403.0, 321.0, 202.0, 161.0, 111.0, 74.0, 60.0, 50.0, 27.0, 34.0, 12.0, 7.0, 7.0, 5.0, 5.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0], "bins": [-1.2021484375, -1.1656951904296875, -1.129241943359375, -1.0927886962890625, -1.05633544921875, -1.0198822021484375, -0.983428955078125, -0.9469757080078125, -0.9105224609375, -0.8740692138671875, -0.837615966796875, -0.8011627197265625, -0.76470947265625, -0.7282562255859375, -0.691802978515625, -0.6553497314453125, -0.618896484375, -0.5824432373046875, -0.545989990234375, -0.5095367431640625, -0.47308349609375, -0.4366302490234375, -0.400177001953125, -0.3637237548828125, -0.3272705078125, -0.2908172607421875, -0.254364013671875, -0.2179107666015625, -0.18145751953125, -0.1450042724609375, -0.108551025390625, -0.0720977783203125, -0.03564453125, 0.0008087158203125, 0.037261962890625, 0.0737152099609375, 0.11016845703125, 0.1466217041015625, 0.183074951171875, 0.2195281982421875, 0.2559814453125, 0.2924346923828125, 0.328887939453125, 0.3653411865234375, 0.40179443359375, 0.4382476806640625, 0.474700927734375, 0.5111541748046875, 0.547607421875, 0.5840606689453125, 0.620513916015625, 0.6569671630859375, 0.69342041015625, 0.7298736572265625, 0.766326904296875, 0.8027801513671875, 0.8392333984375, 0.8756866455078125, 0.912139892578125, 0.9485931396484375, 0.98504638671875, 1.0214996337890625, 1.057952880859375, 1.0944061279296875, 1.130859375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 10.0, 12.0, 7.0, 22.0, 20.0, 20.0, 29.0, 49.0, 65.0, 84.0, 139.0, 167.0, 91.0, 75.0, 62.0, 43.0, 35.0, 17.0, 12.0, 9.0, 9.0, 6.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00028896331787109375, -0.0002779066562652588, -0.00026684999465942383, -0.00025579333305358887, -0.0002447366714477539, -0.00023368000984191895, -0.00022262334823608398, -0.00021156668663024902, -0.00020051002502441406, -0.0001894533634185791, -0.00017839670181274414, -0.00016734004020690918, -0.00015628337860107422, -0.00014522671699523926, -0.0001341700553894043, -0.00012311339378356934, -0.00011205673217773438, -0.00010100007057189941, -8.994340896606445e-05, -7.888674736022949e-05, -6.783008575439453e-05, -5.677342414855957e-05, -4.571676254272461e-05, -3.466010093688965e-05, -2.3603439331054688e-05, -1.2546777725219727e-05, -1.4901161193847656e-06, 9.566545486450195e-06, 2.0623207092285156e-05, 3.167986869812012e-05, 4.273653030395508e-05, 5.379319190979004e-05, 6.4849853515625e-05, 7.590651512145996e-05, 8.696317672729492e-05, 9.801983833312988e-05, 0.00010907649993896484, 0.0001201331615447998, 0.00013118982315063477, 0.00014224648475646973, 0.0001533031463623047, 0.00016435980796813965, 0.0001754164695739746, 0.00018647313117980957, 0.00019752979278564453, 0.0002085864543914795, 0.00021964311599731445, 0.00023069977760314941, 0.00024175643920898438, 0.00025281310081481934, 0.0002638697624206543, 0.00027492642402648926, 0.0002859830856323242, 0.0002970397472381592, 0.00030809640884399414, 0.0003191530704498291, 0.00033020973205566406, 0.000341266393661499, 0.000352323055267334, 0.00036337971687316895, 0.0003744363784790039, 0.00038549304008483887, 0.00039654970169067383, 0.0004076063632965088, 0.00041866302490234375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 3.0, 9.0, 11.0, 9.0, 21.0, 21.0, 12.0, 30.0, 26.0, 49.0, 48.0, 66.0, 59.0, 95.0, 151.0, 170.0, 251.0, 514.0, 885.0, 1693.0, 3683.0, 10172.0, 41381.0, 255722.0, 607598.0, 95383.0, 19109.0, 5753.0, 2513.0, 1193.0, 654.0, 361.0, 207.0, 155.0, 108.0, 95.0, 66.0, 56.0, 45.0, 32.0, 36.0, 24.0, 20.0, 13.0, 13.0, 14.0, 6.0, 8.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.7421875, -2.659698486328125, -2.57720947265625, -2.494720458984375, -2.4122314453125, -2.329742431640625, -2.24725341796875, -2.164764404296875, -2.082275390625, -1.999786376953125, -1.91729736328125, -1.834808349609375, -1.7523193359375, -1.669830322265625, -1.58734130859375, -1.504852294921875, -1.42236328125, -1.339874267578125, -1.25738525390625, -1.174896240234375, -1.0924072265625, -1.009918212890625, -0.92742919921875, -0.844940185546875, -0.762451171875, -0.679962158203125, -0.59747314453125, -0.514984130859375, -0.4324951171875, -0.350006103515625, -0.26751708984375, -0.185028076171875, -0.1025390625, -0.020050048828125, 0.06243896484375, 0.144927978515625, 0.2274169921875, 0.309906005859375, 0.39239501953125, 0.474884033203125, 0.557373046875, 0.639862060546875, 0.72235107421875, 0.804840087890625, 0.8873291015625, 0.969818115234375, 1.05230712890625, 1.134796142578125, 1.21728515625, 1.299774169921875, 1.38226318359375, 1.464752197265625, 1.5472412109375, 1.629730224609375, 1.71221923828125, 1.794708251953125, 1.877197265625, 1.959686279296875, 2.04217529296875, 2.124664306640625, 2.2071533203125, 2.289642333984375, 2.37213134765625, 2.454620361328125, 2.537109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 11.0, 21.0, 46.0, 71.0, 88.0, 131.0, 219.0, 139.0, 78.0, 70.0, 44.0, 24.0, 14.0, 12.0, 6.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.783203125, -2.7247543334960938, -2.6663055419921875, -2.6078567504882812, -2.549407958984375, -2.4909591674804688, -2.4325103759765625, -2.3740615844726562, -2.31561279296875, -2.2571640014648438, -2.1987152099609375, -2.1402664184570312, -2.081817626953125, -2.0233688354492188, -1.9649200439453125, -1.9064712524414062, -1.8480224609375, -1.7895736694335938, -1.7311248779296875, -1.6726760864257812, -1.614227294921875, -1.5557785034179688, -1.4973297119140625, -1.4388809204101562, -1.38043212890625, -1.3219833374023438, -1.2635345458984375, -1.2050857543945312, -1.146636962890625, -1.0881881713867188, -1.0297393798828125, -0.9712905883789062, -0.912841796875, -0.8543930053710938, -0.7959442138671875, -0.7374954223632812, -0.679046630859375, -0.6205978393554688, -0.5621490478515625, -0.5037002563476562, -0.44525146484375, -0.38680267333984375, -0.3283538818359375, -0.26990509033203125, -0.211456298828125, -0.15300750732421875, -0.0945587158203125, -0.03610992431640625, 0.0223388671875, 0.08078765869140625, 0.1392364501953125, 0.19768524169921875, 0.256134033203125, 0.31458282470703125, 0.3730316162109375, 0.43148040771484375, 0.48992919921875, 0.5483779907226562, 0.6068267822265625, 0.6652755737304688, 0.723724365234375, 0.7821731567382812, 0.8406219482421875, 0.8990707397460938, 0.95751953125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 10.0, 17.0, 27.0, 64.0, 118.0, 147.0, 208.0, 140.0, 110.0, 78.0, 37.0, 16.0, 6.0, 7.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-24.312450408935547, -23.788429260253906, -23.2644100189209, -22.740388870239258, -22.216367721557617, -21.69234848022461, -21.16832733154297, -20.644306182861328, -20.12028694152832, -19.59626579284668, -19.072246551513672, -18.54822540283203, -18.02420425415039, -17.500185012817383, -16.976163864135742, -16.4521427154541, -15.928122520446777, -15.404102325439453, -14.880081176757812, -14.356060981750488, -13.832040786743164, -13.308019638061523, -12.7839994430542, -12.259979248046875, -11.735958099365234, -11.21193790435791, -10.68791675567627, -10.163896560668945, -9.639876365661621, -9.115856170654297, -8.591835021972656, -8.067814826965332, -7.543794631958008, -7.019773960113525, -6.495753765106201, -5.971733093261719, -5.4477128982543945, -4.923692226409912, -4.39967155456543, -3.8756511211395264, -3.351630687713623, -2.8276102542877197, -2.3035898208618164, -1.779569149017334, -1.2555487155914307, -0.7315282821655273, -0.20750761032104492, 0.3165128231048584, 0.8405332565307617, 1.364553689956665, 1.888574242591858, 2.412594795227051, 2.936615228652954, 3.4606356620788574, 3.98465633392334, 4.508676528930664, 5.0326972007751465, 5.556717872619629, 6.080738067626953, 6.6047587394714355, 7.128779411315918, 7.652799606323242, 8.176820755004883, 8.700840950012207, 9.224861145019531]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 6.0, 3.0, 9.0, 12.0, 13.0, 20.0, 23.0, 24.0, 28.0, 28.0, 28.0, 35.0, 41.0, 45.0, 37.0, 43.0, 46.0, 49.0, 48.0, 50.0, 53.0, 48.0, 33.0, 37.0, 40.0, 28.0, 23.0, 21.0, 28.0, 12.0, 21.0, 14.0, 16.0, 15.0, 11.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.9367036819458, -9.620892524719238, -9.30508041381836, -8.989269256591797, -8.673458099365234, -8.357645988464355, -8.041834831237793, -7.726023197174072, -7.410211563110352, -7.094399929046631, -6.778588771820068, -6.462777137756348, -6.146965503692627, -5.831153869628906, -5.515342712402344, -5.199531078338623, -4.8837199211120605, -4.56790828704834, -4.252097129821777, -3.9362854957580566, -3.620473861694336, -3.3046624660491943, -2.9888510704040527, -2.673039436340332, -2.3572280406951904, -2.041416645050049, -1.7256050109863281, -1.4097936153411865, -1.0939821004867554, -0.7781705856323242, -0.4623591899871826, -0.14654755592346191, 0.1692638397216797, 0.48507532477378845, 0.8008868098258972, 1.1166982650756836, 1.4325097799301147, 1.748321294784546, 2.0641326904296875, 2.379944324493408, 2.69575572013855, 3.0115671157836914, 3.327378749847412, 3.6431901454925537, 3.9590015411376953, 4.274813175201416, 4.590624809265137, 4.906435966491699, 5.22224760055542, 5.538059234619141, 5.853870391845703, 6.169682025909424, 6.4854936599731445, 6.801304817199707, 7.117116451263428, 7.432928085327148, 7.748739242553711, 8.064550399780273, 8.380362510681152, 8.696173667907715, 9.011984825134277, 9.327796936035156, 9.643608093261719, 9.959419250488281, 10.27523136138916]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 8.0, 10.0, 15.0, 14.0, 33.0, 30.0, 27.0, 47.0, 60.0, 72.0, 90.0, 140.0, 174.0, 259.0, 322.0, 467.0, 688.0, 948.0, 1433.0, 2712.0, 1034491.0, 3237.0, 1604.0, 1057.0, 729.0, 503.0, 359.0, 301.0, 205.0, 123.0, 104.0, 70.0, 65.0, 50.0, 40.0, 31.0, 19.0, 16.0, 9.0, 7.0, 8.0, 6.0, 7.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.840611457824707, -12.446940422058105, -12.053269386291504, -11.659598350524902, -11.265926361083984, -10.872255325317383, -10.478584289550781, -10.08491325378418, -9.691242218017578, -9.297571182250977, -8.903900146484375, -8.510229110717773, -8.116558074951172, -7.722886562347412, -7.329215049743652, -6.935544013977051, -6.541872978210449, -6.148201942443848, -5.754530906677246, -5.360859394073486, -4.967188358306885, -4.573517322540283, -4.179845809936523, -3.786174774169922, -3.3925037384033203, -2.9988327026367188, -2.605161428451538, -2.2114901542663574, -1.8178191184997559, -1.4241479635238647, -1.0304768085479736, -0.636805534362793, -0.2431344985961914, 0.1505366563796997, 0.5442078113555908, 0.9378789663314819, 1.331550121307373, 1.7252212762832642, 2.1188924312591553, 2.512563705444336, 2.9062347412109375, 3.299905776977539, 3.6935770511627197, 4.0872483253479, 4.480919361114502, 4.8745903968811035, 5.268261909484863, 5.661932945251465, 6.055603981018066, 6.449275016784668, 6.8429460525512695, 7.236617565155029, 7.630288600921631, 8.02396011352539, 8.417631149291992, 8.811302185058594, 9.204973220825195, 9.598644256591797, 9.992315292358398, 10.385986328125, 10.779657363891602, 11.17332935333252, 11.567000389099121, 11.960671424865723, 12.354342460632324]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 12.0, 16.0, 21.0, 25.0, 52.0, 93.0, 189.0, 417.0, 1104.0, 2778.0, 6683.0, 18227.0, 51405384.0, 22178.0, 8001.0, 3522.0, 1408.0, 673.0, 264.0, 123.0, 59.0, 25.0, 27.0, 18.0, 11.0, 5.0, 5.0, 9.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.0942268371582, -43.5697021484375, -42.04517364501953, -40.52064895629883, -38.996124267578125, -37.471595764160156, -35.94707107543945, -34.42254638671875, -32.89801788330078, -31.373491287231445, -29.848966598510742, -28.324440002441406, -26.799915313720703, -25.275388717651367, -23.75086212158203, -22.226337432861328, -20.701812744140625, -19.17728614807129, -17.652761459350586, -16.12823486328125, -14.60370922088623, -13.079183578491211, -11.554656982421875, -10.030131340026855, -8.505605697631836, -6.981080055236816, -5.456553936004639, -3.932027816772461, -2.4075021743774414, -0.8829765319824219, 0.6415500640869141, 2.1660757064819336, 3.690601348876953, 5.215126991271973, 6.73965311050415, 8.264179229736328, 9.788704872131348, 11.313230514526367, 12.837757110595703, 14.362282752990723, 15.886808395385742, 17.411334991455078, 18.93585968017578, 20.460386276245117, 21.984912872314453, 23.509437561035156, 25.033964157104492, 26.558490753173828, 28.08301544189453, 29.607542037963867, 31.13206672668457, 32.656593322753906, 34.18111801147461, 35.70564270019531, 37.23017120361328, 38.754695892333984, 40.27922058105469, 41.80374526977539, 43.32827377319336, 44.85279846191406, 46.377323150634766, 47.90184783935547, 49.42637634277344, 50.95090103149414, 52.47542953491211]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 11.0, 17.0, 20.0, 31.0, 57.0, 93.0, 113.0, 170.0, 269.0, 451.0, 754.0, 1273.0, 2099.0, 3459.0, 6036.0, 10327.0, 18521.0, 33054.0, 61313.0, 110673.0, 192848.0, 316899.0, 535697.0, 2740188.0, 1247054.0, 409761.0, 257401.0, 152026.0, 84738.0, 46393.0, 25626.0, 14136.0, 8181.0, 4723.0, 2772.0, 1644.0, 1027.0, 589.0, 372.0, 209.0, 136.0, 89.0, 74.0, 32.0, 26.0, 15.0, 12.0, 6.0, 10.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.03515625, -4.876708984375, -4.71826171875, -4.559814453125, -4.4013671875, -4.242919921875, -4.08447265625, -3.926025390625, -3.767578125, -3.609130859375, -3.45068359375, -3.292236328125, -3.1337890625, -2.975341796875, -2.81689453125, -2.658447265625, -2.5, -2.341552734375, -2.18310546875, -2.024658203125, -1.8662109375, -1.707763671875, -1.54931640625, -1.390869140625, -1.232421875, -1.073974609375, -0.91552734375, -0.757080078125, -0.5986328125, -0.440185546875, -0.28173828125, -0.123291015625, 0.03515625, 0.193603515625, 0.35205078125, 0.510498046875, 0.6689453125, 0.827392578125, 0.98583984375, 1.144287109375, 1.302734375, 1.461181640625, 1.61962890625, 1.778076171875, 1.9365234375, 2.094970703125, 2.25341796875, 2.411865234375, 2.5703125, 2.728759765625, 2.88720703125, 3.045654296875, 3.2041015625, 3.362548828125, 3.52099609375, 3.679443359375, 3.837890625, 3.996337890625, 4.15478515625, 4.313232421875, 4.4716796875, 4.630126953125, 4.78857421875, 4.947021484375, 5.10546875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 3.0, 6.0, 4.0, 7.0, 9.0, 9.0, 13.0, 17.0, 14.0, 24.0, 19.0, 27.0, 32.0, 42.0, 28.0, 38.0, 38.0, 38.0, 41.0, 66.0, 188.0, 787.0, 138.0, 57.0, 48.0, 51.0, 39.0, 34.0, 24.0, 36.0, 25.0, 16.0, 12.0, 15.0, 14.0, 15.0, 15.0, 6.0, 7.0, 6.0, 10.0, 5.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-40.0625, -38.865234375, -37.66796875, -36.470703125, -35.2734375, -34.076171875, -32.87890625, -31.681640625, -30.484375, -29.287109375, -28.08984375, -26.892578125, -25.6953125, -24.498046875, -23.30078125, -22.103515625, -20.90625, -19.708984375, -18.51171875, -17.314453125, -16.1171875, -14.919921875, -13.72265625, -12.525390625, -11.328125, -10.130859375, -8.93359375, -7.736328125, -6.5390625, -5.341796875, -4.14453125, -2.947265625, -1.75, -0.552734375, 0.64453125, 1.841796875, 3.0390625, 4.236328125, 5.43359375, 6.630859375, 7.828125, 9.025390625, 10.22265625, 11.419921875, 12.6171875, 13.814453125, 15.01171875, 16.208984375, 17.40625, 18.603515625, 19.80078125, 20.998046875, 22.1953125, 23.392578125, 24.58984375, 25.787109375, 26.984375, 28.181640625, 29.37890625, 30.576171875, 31.7734375, 32.970703125, 34.16796875, 35.365234375, 36.5625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 5.0, 8.0, 31.0, 39.0, 75.0, 147.0, 158.0, 274.0, 472.0, 790.0, 1284.0, 1924.0, 3175.0, 5049.0, 7746.0, 11834.0, 17976.0, 27646.0, 39880.0, 57122.0, 80146.0, 108067.0, 142503.0, 178908.0, 215620.0, 262751.0, 670730.0, 2323483.0, 909784.0, 282719.0, 221997.0, 185094.0, 147608.0, 114068.0, 84318.0, 60934.0, 42857.0, 28696.0, 19503.0, 12956.0, 8440.0, 5266.0, 3429.0, 2193.0, 1461.0, 904.0, 540.0, 327.0, 210.0, 119.0, 73.0, 48.0, 19.0, 15.0, 14.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9794921875, -1.9147796630859375, -1.850067138671875, -1.7853546142578125, -1.72064208984375, -1.6559295654296875, -1.591217041015625, -1.5265045166015625, -1.4617919921875, -1.3970794677734375, -1.332366943359375, -1.2676544189453125, -1.20294189453125, -1.1382293701171875, -1.073516845703125, -1.0088043212890625, -0.944091796875, -0.8793792724609375, -0.814666748046875, -0.7499542236328125, -0.68524169921875, -0.6205291748046875, -0.555816650390625, -0.4911041259765625, -0.4263916015625, -0.3616790771484375, -0.296966552734375, -0.2322540283203125, -0.16754150390625, -0.1028289794921875, -0.038116455078125, 0.0265960693359375, 0.09130859375, 0.1560211181640625, 0.220733642578125, 0.2854461669921875, 0.35015869140625, 0.4148712158203125, 0.479583740234375, 0.5442962646484375, 0.6090087890625, 0.6737213134765625, 0.738433837890625, 0.8031463623046875, 0.86785888671875, 0.9325714111328125, 0.997283935546875, 1.0619964599609375, 1.126708984375, 1.1914215087890625, 1.256134033203125, 1.3208465576171875, 1.38555908203125, 1.4502716064453125, 1.514984130859375, 1.5796966552734375, 1.6444091796875, 1.7091217041015625, 1.773834228515625, 1.8385467529296875, 1.90325927734375, 1.9679718017578125, 2.032684326171875, 2.0973968505859375, 2.162109375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 4.0, 10.0, 7.0, 5.0, 9.0, 6.0, 7.0, 11.0, 19.0, 23.0, 32.0, 27.0, 35.0, 25.0, 36.0, 36.0, 41.0, 29.0, 47.0, 46.0, 399.0, 684.0, 74.0, 34.0, 40.0, 31.0, 35.0, 43.0, 29.0, 30.0, 24.0, 19.0, 22.0, 13.0, 21.0, 11.0, 12.0, 3.0, 11.0, 10.0, 7.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.8125, -27.917724609375, -27.02294921875, -26.128173828125, -25.2333984375, -24.338623046875, -23.44384765625, -22.549072265625, -21.654296875, -20.759521484375, -19.86474609375, -18.969970703125, -18.0751953125, -17.180419921875, -16.28564453125, -15.390869140625, -14.49609375, -13.601318359375, -12.70654296875, -11.811767578125, -10.9169921875, -10.022216796875, -9.12744140625, -8.232666015625, -7.337890625, -6.443115234375, -5.54833984375, -4.653564453125, -3.7587890625, -2.864013671875, -1.96923828125, -1.074462890625, -0.1796875, 0.715087890625, 1.60986328125, 2.504638671875, 3.3994140625, 4.294189453125, 5.18896484375, 6.083740234375, 6.978515625, 7.873291015625, 8.76806640625, 9.662841796875, 10.5576171875, 11.452392578125, 12.34716796875, 13.241943359375, 14.13671875, 15.031494140625, 15.92626953125, 16.821044921875, 17.7158203125, 18.610595703125, 19.50537109375, 20.400146484375, 21.294921875, 22.189697265625, 23.08447265625, 23.979248046875, 24.8740234375, 25.768798828125, 26.66357421875, 27.558349609375, 28.453125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 4.0, 3.0, 7.0, 9.0, 11.0, 13.0, 22.0, 31.0, 34.0, 47.0, 65.0, 80.0, 116.0, 147.0, 223.0, 256.0, 376.0, 599.0, 813.0, 1106.0, 1585.0, 2594.0, 4613.0, 8727.0, 18955.0, 42533.0, 95293.0, 202425.0, 381495.0, 754639.0, 3593429.0, 553763.0, 322069.0, 163330.0, 74834.0, 33309.0, 15174.0, 7450.0, 3932.0, 2293.0, 1523.0, 969.0, 680.0, 486.0, 352.0, 246.0, 221.0, 159.0, 120.0, 83.0, 60.0, 53.0, 25.0, 19.0, 14.0, 7.0, 6.0, 7.0, 6.0, 4.0, 2.0], "bins": [-4.625, -4.486328125, -4.34765625, -4.208984375, -4.0703125, -3.931640625, -3.79296875, -3.654296875, -3.515625, -3.376953125, -3.23828125, -3.099609375, -2.9609375, -2.822265625, -2.68359375, -2.544921875, -2.40625, -2.267578125, -2.12890625, -1.990234375, -1.8515625, -1.712890625, -1.57421875, -1.435546875, -1.296875, -1.158203125, -1.01953125, -0.880859375, -0.7421875, -0.603515625, -0.46484375, -0.326171875, -0.1875, -0.048828125, 0.08984375, 0.228515625, 0.3671875, 0.505859375, 0.64453125, 0.783203125, 0.921875, 1.060546875, 1.19921875, 1.337890625, 1.4765625, 1.615234375, 1.75390625, 1.892578125, 2.03125, 2.169921875, 2.30859375, 2.447265625, 2.5859375, 2.724609375, 2.86328125, 3.001953125, 3.140625, 3.279296875, 3.41796875, 3.556640625, 3.6953125, 3.833984375, 3.97265625, 4.111328125, 4.25]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 4.0, 7.0, 3.0, 10.0, 12.0, 19.0, 17.0, 16.0, 21.0, 19.0, 21.0, 28.0, 31.0, 25.0, 31.0, 40.0, 43.0, 37.0, 47.0, 42.0, 560.0, 527.0, 51.0, 37.0, 35.0, 39.0, 32.0, 34.0, 36.0, 33.0, 22.0, 27.0, 26.0, 19.0, 7.0, 11.0, 15.0, 7.0, 7.0, 5.0, 11.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.8125, -24.9228515625, -24.033203125, -23.1435546875, -22.25390625, -21.3642578125, -20.474609375, -19.5849609375, -18.6953125, -17.8056640625, -16.916015625, -16.0263671875, -15.13671875, -14.2470703125, -13.357421875, -12.4677734375, -11.578125, -10.6884765625, -9.798828125, -8.9091796875, -8.01953125, -7.1298828125, -6.240234375, -5.3505859375, -4.4609375, -3.5712890625, -2.681640625, -1.7919921875, -0.90234375, -0.0126953125, 0.876953125, 1.7666015625, 2.65625, 3.5458984375, 4.435546875, 5.3251953125, 6.21484375, 7.1044921875, 7.994140625, 8.8837890625, 9.7734375, 10.6630859375, 11.552734375, 12.4423828125, 13.33203125, 14.2216796875, 15.111328125, 16.0009765625, 16.890625, 17.7802734375, 18.669921875, 19.5595703125, 20.44921875, 21.3388671875, 22.228515625, 23.1181640625, 24.0078125, 24.8974609375, 25.787109375, 26.6767578125, 27.56640625, 28.4560546875, 29.345703125, 30.2353515625, 31.125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 13.0, 17.0, 50.0, 197.0, 417.0, 225.0, 60.0, 17.0, 5.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.47903442382812, -109.41681671142578, -104.35459899902344, -99.29238891601562, -94.23017120361328, -89.16795349121094, -84.10574340820312, -79.04352569580078, -73.98130798339844, -68.9190902709961, -63.856876373291016, -58.79466247558594, -53.732444763183594, -48.67022705078125, -43.60801315307617, -38.545799255371094, -33.48358154296875, -28.42136573791504, -23.359149932861328, -18.296934127807617, -13.234718322753906, -8.172502517700195, -3.1102867126464844, 1.9519271850585938, 7.0141448974609375, 12.076360702514648, 17.13857650756836, 22.20079231262207, 27.26300811767578, 32.325225830078125, 37.3874397277832, 42.44965362548828, 47.511871337890625, 52.57408905029297, 57.63630294799805, 62.698516845703125, 67.76073455810547, 72.82295227050781, 77.88516235351562, 82.94738006591797, 88.00959777832031, 93.07181549072266, 98.134033203125, 103.19624328613281, 108.25846099853516, 113.3206787109375, 118.38288879394531, 123.44510650634766, 128.50732421875, 133.5695343017578, 138.6317596435547, 143.6939697265625, 148.75619506835938, 153.8184051513672, 158.880615234375, 163.94284057617188, 169.0050506591797, 174.0672607421875, 179.12948608398438, 184.1916961669922, 189.25390625, 194.31613159179688, 199.3783416748047, 204.4405517578125, 209.50277709960938]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 5.0, 2.0, 7.0, 6.0, 5.0, 2.0, 13.0, 10.0, 18.0, 14.0, 16.0, 23.0, 32.0, 44.0, 31.0, 32.0, 45.0, 42.0, 40.0, 47.0, 45.0, 47.0, 50.0, 47.0, 46.0, 38.0, 46.0, 34.0, 31.0, 39.0, 16.0, 22.0, 21.0, 18.0, 16.0, 11.0, 12.0, 8.0, 5.0, 10.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-68.62208557128906, -66.3858413696289, -64.14958953857422, -61.91334533691406, -59.67709732055664, -57.44084930419922, -55.2046012878418, -52.968353271484375, -50.73210906982422, -48.4958610534668, -46.259613037109375, -44.02336883544922, -41.7871208190918, -39.550872802734375, -37.31462478637695, -35.07837677001953, -32.84212875366211, -30.605880737304688, -28.3696346282959, -26.133386611938477, -23.897140502929688, -21.660892486572266, -19.424644470214844, -17.188396453857422, -14.952150344848633, -12.715903282165527, -10.479656219482422, -8.243408203125, -6.0071611404418945, -3.770914077758789, -1.5346660614013672, 0.7015810012817383, 2.9378280639648438, 5.174075126647949, 7.410322666168213, 9.646570205688477, 11.882817268371582, 14.119064331054688, 16.35531234741211, 18.59156036376953, 20.82780647277832, 23.064054489135742, 25.30030059814453, 27.536548614501953, 29.772796630859375, 32.00904083251953, 34.24529266357422, 36.481536865234375, 38.7177848815918, 40.95403289794922, 43.19028091430664, 45.42652893066406, 47.66277313232422, 49.89902114868164, 52.13526916503906, 54.371517181396484, 56.607765197753906, 58.84401321411133, 61.08026123046875, 63.316505432128906, 65.5527572631836, 67.78900146484375, 70.02525329589844, 72.2614974975586, 74.49774169921875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 7.0, 11.0, 7.0, 9.0, 19.0, 16.0, 21.0, 32.0, 46.0, 74.0, 111.0, 233.0, 511.0, 1249.0, 3272.0, 9545.0, 48577.0, 2309317.0, 1761481.0, 45098.0, 9314.0, 3069.0, 1160.0, 478.0, 251.0, 134.0, 65.0, 45.0, 27.0, 25.0, 26.0, 14.0, 7.0, 5.0, 9.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.904144287109375, -1.84637451171875, -1.788604736328125, -1.7308349609375, -1.673065185546875, -1.61529541015625, -1.557525634765625, -1.499755859375, -1.441986083984375, -1.38421630859375, -1.326446533203125, -1.2686767578125, -1.210906982421875, -1.15313720703125, -1.095367431640625, -1.03759765625, -0.979827880859375, -0.92205810546875, -0.864288330078125, -0.8065185546875, -0.748748779296875, -0.69097900390625, -0.633209228515625, -0.575439453125, -0.517669677734375, -0.45989990234375, -0.402130126953125, -0.3443603515625, -0.286590576171875, -0.22882080078125, -0.171051025390625, -0.11328125, -0.055511474609375, 0.00225830078125, 0.060028076171875, 0.1177978515625, 0.175567626953125, 0.23333740234375, 0.291107177734375, 0.348876953125, 0.406646728515625, 0.46441650390625, 0.522186279296875, 0.5799560546875, 0.637725830078125, 0.69549560546875, 0.753265380859375, 0.81103515625, 0.868804931640625, 0.92657470703125, 0.984344482421875, 1.0421142578125, 1.099884033203125, 1.15765380859375, 1.215423583984375, 1.273193359375, 1.330963134765625, 1.38873291015625, 1.446502685546875, 1.5042724609375, 1.562042236328125, 1.61981201171875, 1.677581787109375, 1.7353515625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 7.0, 6.0, 7.0, 8.0, 13.0, 14.0, 11.0, 25.0, 26.0, 32.0, 38.0, 51.0, 41.0, 57.0, 65.0, 85.0, 82.0, 61.0, 59.0, 49.0, 53.0, 45.0, 38.0, 26.0, 27.0, 10.0, 17.0, 7.0, 9.0, 8.0, 9.0, 4.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82568359375, -0.8039779663085938, -0.7822723388671875, -0.7605667114257812, -0.738861083984375, -0.7171554565429688, -0.6954498291015625, -0.6737442016601562, -0.65203857421875, -0.6303329467773438, -0.6086273193359375, -0.5869216918945312, -0.565216064453125, -0.5435104370117188, -0.5218048095703125, -0.5000991821289062, -0.4783935546875, -0.45668792724609375, -0.4349822998046875, -0.41327667236328125, -0.391571044921875, -0.36986541748046875, -0.3481597900390625, -0.32645416259765625, -0.30474853515625, -0.28304290771484375, -0.2613372802734375, -0.23963165283203125, -0.217926025390625, -0.19622039794921875, -0.1745147705078125, -0.15280914306640625, -0.131103515625, -0.10939788818359375, -0.0876922607421875, -0.06598663330078125, -0.044281005859375, -0.02257537841796875, -0.0008697509765625, 0.02083587646484375, 0.04254150390625, 0.06424713134765625, 0.0859527587890625, 0.10765838623046875, 0.129364013671875, 0.15106964111328125, 0.1727752685546875, 0.19448089599609375, 0.2161865234375, 0.23789215087890625, 0.2595977783203125, 0.28130340576171875, 0.303009033203125, 0.32471466064453125, 0.3464202880859375, 0.36812591552734375, 0.38983154296875, 0.41153717041015625, 0.4332427978515625, 0.45494842529296875, 0.476654052734375, 0.49835968017578125, 0.5200653076171875, 0.5417709350585938, 0.5634765625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 4.0, 7.0, 6.0, 5.0, 10.0, 13.0, 15.0, 16.0, 35.0, 40.0, 56.0, 115.0, 297.0, 896.0, 5307.0, 157895.0, 3972956.0, 52371.0, 3186.0, 598.0, 212.0, 88.0, 40.0, 28.0, 16.0, 12.0, 15.0, 6.0, 5.0, 7.0, 2.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.138671875, -2.0726318359375, -2.006591796875, -1.9405517578125, -1.87451171875, -1.8084716796875, -1.742431640625, -1.6763916015625, -1.6103515625, -1.5443115234375, -1.478271484375, -1.4122314453125, -1.34619140625, -1.2801513671875, -1.214111328125, -1.1480712890625, -1.08203125, -1.0159912109375, -0.949951171875, -0.8839111328125, -0.81787109375, -0.7518310546875, -0.685791015625, -0.6197509765625, -0.5537109375, -0.4876708984375, -0.421630859375, -0.3555908203125, -0.28955078125, -0.2235107421875, -0.157470703125, -0.0914306640625, -0.025390625, 0.0406494140625, 0.106689453125, 0.1727294921875, 0.23876953125, 0.3048095703125, 0.370849609375, 0.4368896484375, 0.5029296875, 0.5689697265625, 0.635009765625, 0.7010498046875, 0.76708984375, 0.8331298828125, 0.899169921875, 0.9652099609375, 1.03125, 1.0972900390625, 1.163330078125, 1.2293701171875, 1.29541015625, 1.3614501953125, 1.427490234375, 1.4935302734375, 1.5595703125, 1.6256103515625, 1.691650390625, 1.7576904296875, 1.82373046875, 1.8897705078125, 1.955810546875, 2.0218505859375, 2.087890625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 10.0, 16.0, 16.0, 23.0, 23.0, 56.0, 82.0, 160.0, 266.0, 490.0, 708.0, 764.0, 564.0, 344.0, 180.0, 116.0, 62.0, 44.0, 26.0, 19.0, 14.0, 18.0, 9.0, 4.0, 14.0, 2.0, 5.0, 5.0, 3.0, 2.0, 3.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.86767578125, -0.8415451049804688, -0.8154144287109375, -0.7892837524414062, -0.763153076171875, -0.7370223999023438, -0.7108917236328125, -0.6847610473632812, -0.65863037109375, -0.6324996948242188, -0.6063690185546875, -0.5802383422851562, -0.554107666015625, -0.5279769897460938, -0.5018463134765625, -0.47571563720703125, -0.4495849609375, -0.42345428466796875, -0.3973236083984375, -0.37119293212890625, -0.345062255859375, -0.31893157958984375, -0.2928009033203125, -0.26667022705078125, -0.24053955078125, -0.21440887451171875, -0.1882781982421875, -0.16214752197265625, -0.136016845703125, -0.10988616943359375, -0.0837554931640625, -0.05762481689453125, -0.031494140625, -0.00536346435546875, 0.0207672119140625, 0.04689788818359375, 0.073028564453125, 0.09915924072265625, 0.1252899169921875, 0.15142059326171875, 0.17755126953125, 0.20368194580078125, 0.2298126220703125, 0.25594329833984375, 0.282073974609375, 0.30820465087890625, 0.3343353271484375, 0.36046600341796875, 0.3865966796875, 0.41272735595703125, 0.4388580322265625, 0.46498870849609375, 0.491119384765625, 0.5172500610351562, 0.5433807373046875, 0.5695114135742188, 0.59564208984375, 0.6217727661132812, 0.6479034423828125, 0.6740341186523438, 0.700164794921875, 0.7262954711914062, 0.7524261474609375, 0.7785568237304688, 0.8046875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 31.0, 305.0, 594.0, 73.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.446352958679199, -4.964015483856201, -4.481678009033203, -3.999340295791626, -3.517002820968628, -3.03466534614563, -2.5523276329040527, -2.0699901580810547, -1.5876526832580566, -1.1053152084350586, -0.622977614402771, -0.1406400203704834, 0.34169745445251465, 0.8240349292755127, 1.3063726425170898, 1.788710117340088, 2.271047592163086, 2.753385066986084, 3.235722541809082, 3.718060255050659, 4.200397491455078, 4.682735443115234, 5.165072917938232, 5.6474103927612305, 6.1297478675842285, 6.612085342407227, 7.094422817230225, 7.576760292053223, 8.059098243713379, 8.541435241699219, 9.023773193359375, 9.506111145019531, 9.988447189331055, 10.470785140991211, 10.95312213897705, 11.435460090637207, 11.917797088623047, 12.400135040283203, 12.88247299194336, 13.3648099899292, 13.847146987915039, 14.329484939575195, 14.811821937561035, 15.294159889221191, 15.776496887207031, 16.258834838867188, 16.741172790527344, 17.2235107421875, 17.705848693847656, 18.188186645507812, 18.67052459716797, 19.152860641479492, 19.63519859313965, 20.117536544799805, 20.59987449645996, 21.082210540771484, 21.56454849243164, 22.046886444091797, 22.529224395751953, 23.011560440063477, 23.493898391723633, 23.97623634338379, 24.458574295043945, 24.94091033935547, 25.423248291015625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 8.0, 8.0, 10.0, 6.0, 9.0, 17.0, 14.0, 22.0, 28.0, 36.0, 33.0, 41.0, 47.0, 45.0, 61.0, 48.0, 39.0, 49.0, 79.0, 48.0, 42.0, 42.0, 36.0, 34.0, 36.0, 39.0, 20.0, 22.0, 14.0, 23.0, 7.0, 14.0, 10.0, 5.0, 5.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.184354305267334, -2.1020870208740234, -2.019819736480713, -1.9375523328781128, -1.8552849292755127, -1.7730176448822021, -1.6907503604888916, -1.6084829568862915, -1.5262155532836914, -1.4439482688903809, -1.3616808652877808, -1.2794135808944702, -1.1971461772918701, -1.1148788928985596, -1.032611608505249, -0.9503442049026489, -0.8680769205093384, -0.7858095765113831, -0.7035422325134277, -0.6212749481201172, -0.5390075445175171, -0.45674023032188416, -0.3744729161262512, -0.2922055721282959, -0.20993822813034058, -0.12767088413238525, -0.045403555035591125, 0.036863774061203, 0.11913111805915833, 0.20139846205711365, 0.2836657762527466, 0.3659331202507019, 0.4482004642486572, 0.5304678082466125, 0.6127351522445679, 0.6950024366378784, 0.7772698402404785, 0.8595371246337891, 0.9418044686317444, 1.0240718126296997, 1.1063392162322998, 1.1886065006256104, 1.2708739042282104, 1.353141188621521, 1.435408592224121, 1.5176758766174316, 1.5999431610107422, 1.6822105646133423, 1.7644778490066528, 1.8467451333999634, 1.9290125370025635, 2.011279821395874, 2.0935471057891846, 2.175814628601074, 2.2580819129943848, 2.3403491973876953, 2.422616481781006, 2.5048837661743164, 2.587151050567627, 2.6694185733795166, 2.751685857772827, 2.8339531421661377, 2.9162204265594482, 2.998487949371338, 3.0807552337646484]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 6.0, 9.0, 18.0, 12.0, 22.0, 32.0, 43.0, 58.0, 106.0, 153.0, 216.0, 322.0, 526.0, 901.0, 1588.0, 3032.0, 7046.0, 22135.0, 240531.0, 702197.0, 49374.0, 10555.0, 4441.0, 2209.0, 1172.0, 703.0, 390.0, 244.0, 172.0, 107.0, 71.0, 45.0, 35.0, 19.0, 17.0, 13.0, 6.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6689453125, -1.6171417236328125, -1.565338134765625, -1.5135345458984375, -1.46173095703125, -1.4099273681640625, -1.358123779296875, -1.3063201904296875, -1.2545166015625, -1.2027130126953125, -1.150909423828125, -1.0991058349609375, -1.04730224609375, -0.9954986572265625, -0.943695068359375, -0.8918914794921875, -0.840087890625, -0.7882843017578125, -0.736480712890625, -0.6846771240234375, -0.63287353515625, -0.5810699462890625, -0.529266357421875, -0.4774627685546875, -0.4256591796875, -0.3738555908203125, -0.322052001953125, -0.2702484130859375, -0.21844482421875, -0.1666412353515625, -0.114837646484375, -0.0630340576171875, -0.01123046875, 0.0405731201171875, 0.092376708984375, 0.1441802978515625, 0.19598388671875, 0.2477874755859375, 0.299591064453125, 0.3513946533203125, 0.4031982421875, 0.4550018310546875, 0.506805419921875, 0.5586090087890625, 0.61041259765625, 0.6622161865234375, 0.714019775390625, 0.7658233642578125, 0.817626953125, 0.8694305419921875, 0.921234130859375, 0.9730377197265625, 1.02484130859375, 1.0766448974609375, 1.128448486328125, 1.1802520751953125, 1.2320556640625, 1.2838592529296875, 1.335662841796875, 1.3874664306640625, 1.43927001953125, 1.4910736083984375, 1.542877197265625, 1.5946807861328125, 1.646484375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 9.0, 10.0, 6.0, 9.0, 13.0, 9.0, 16.0, 24.0, 24.0, 35.0, 43.0, 39.0, 46.0, 59.0, 74.0, 67.0, 67.0, 66.0, 63.0, 41.0, 44.0, 51.0, 31.0, 30.0, 27.0, 23.0, 13.0, 8.0, 6.0, 12.0, 10.0, 6.0, 8.0, 2.0, 5.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.83203125, -0.811798095703125, -0.79156494140625, -0.771331787109375, -0.7510986328125, -0.730865478515625, -0.71063232421875, -0.690399169921875, -0.670166015625, -0.649932861328125, -0.62969970703125, -0.609466552734375, -0.5892333984375, -0.569000244140625, -0.54876708984375, -0.528533935546875, -0.50830078125, -0.488067626953125, -0.46783447265625, -0.447601318359375, -0.4273681640625, -0.407135009765625, -0.38690185546875, -0.366668701171875, -0.346435546875, -0.326202392578125, -0.30596923828125, -0.285736083984375, -0.2655029296875, -0.245269775390625, -0.22503662109375, -0.204803466796875, -0.1845703125, -0.164337158203125, -0.14410400390625, -0.123870849609375, -0.1036376953125, -0.083404541015625, -0.06317138671875, -0.042938232421875, -0.022705078125, -0.002471923828125, 0.01776123046875, 0.037994384765625, 0.0582275390625, 0.078460693359375, 0.09869384765625, 0.118927001953125, 0.13916015625, 0.159393310546875, 0.17962646484375, 0.199859619140625, 0.2200927734375, 0.240325927734375, 0.26055908203125, 0.280792236328125, 0.301025390625, 0.321258544921875, 0.34149169921875, 0.361724853515625, 0.3819580078125, 0.402191162109375, 0.42242431640625, 0.442657470703125, 0.462890625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 2.0, 12.0, 9.0, 27.0, 26.0, 31.0, 43.0, 39.0, 59.0, 113.0, 210.0, 1024.0, 11628.0, 362785.0, 644522.0, 25646.0, 1634.0, 309.0, 130.0, 70.0, 52.0, 36.0, 24.0, 28.0, 14.0, 17.0, 16.0, 11.0, 6.0, 5.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6240234375, -1.5764312744140625, -1.528839111328125, -1.4812469482421875, -1.43365478515625, -1.3860626220703125, -1.338470458984375, -1.2908782958984375, -1.2432861328125, -1.1956939697265625, -1.148101806640625, -1.1005096435546875, -1.05291748046875, -1.0053253173828125, -0.957733154296875, -0.9101409912109375, -0.862548828125, -0.8149566650390625, -0.767364501953125, -0.7197723388671875, -0.67218017578125, -0.6245880126953125, -0.576995849609375, -0.5294036865234375, -0.4818115234375, -0.4342193603515625, -0.386627197265625, -0.3390350341796875, -0.29144287109375, -0.2438507080078125, -0.196258544921875, -0.1486663818359375, -0.10107421875, -0.0534820556640625, -0.005889892578125, 0.0417022705078125, 0.08929443359375, 0.1368865966796875, 0.184478759765625, 0.2320709228515625, 0.2796630859375, 0.3272552490234375, 0.374847412109375, 0.4224395751953125, 0.47003173828125, 0.5176239013671875, 0.565216064453125, 0.6128082275390625, 0.660400390625, 0.7079925537109375, 0.755584716796875, 0.8031768798828125, 0.85076904296875, 0.8983612060546875, 0.945953369140625, 0.9935455322265625, 1.0411376953125, 1.0887298583984375, 1.136322021484375, 1.1839141845703125, 1.23150634765625, 1.2790985107421875, 1.326690673828125, 1.3742828369140625, 1.421875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 11.0, 13.0, 7.0, 22.0, 21.0, 15.0, 27.0, 34.0, 41.0, 46.0, 50.0, 49.0, 49.0, 54.0, 55.0, 53.0, 59.0, 52.0, 52.0, 52.0, 40.0, 35.0, 29.0, 42.0, 21.0, 21.0, 14.0, 10.0, 5.0, 12.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6904296875, -1.63763427734375, -1.5848388671875, -1.53204345703125, -1.479248046875, -1.42645263671875, -1.3736572265625, -1.32086181640625, -1.26806640625, -1.21527099609375, -1.1624755859375, -1.10968017578125, -1.056884765625, -1.00408935546875, -0.9512939453125, -0.89849853515625, -0.845703125, -0.79290771484375, -0.7401123046875, -0.68731689453125, -0.634521484375, -0.58172607421875, -0.5289306640625, -0.47613525390625, -0.42333984375, -0.37054443359375, -0.3177490234375, -0.26495361328125, -0.212158203125, -0.15936279296875, -0.1065673828125, -0.05377197265625, -0.0009765625, 0.05181884765625, 0.1046142578125, 0.15740966796875, 0.210205078125, 0.26300048828125, 0.3157958984375, 0.36859130859375, 0.42138671875, 0.47418212890625, 0.5269775390625, 0.57977294921875, 0.632568359375, 0.68536376953125, 0.7381591796875, 0.79095458984375, 0.84375, 0.89654541015625, 0.9493408203125, 1.00213623046875, 1.054931640625, 1.10772705078125, 1.1605224609375, 1.21331787109375, 1.26611328125, 1.31890869140625, 1.3717041015625, 1.42449951171875, 1.477294921875, 1.53009033203125, 1.5828857421875, 1.63568115234375, 1.6884765625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 4.0, 9.0, 9.0, 10.0, 15.0, 26.0, 28.0, 54.0, 87.0, 146.0, 346.0, 833.0, 2846.0, 13945.0, 106021.0, 604789.0, 279402.0, 32171.0, 5400.0, 1390.0, 489.0, 217.0, 108.0, 57.0, 45.0, 31.0, 20.0, 12.0, 16.0, 8.0, 5.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2822265625, -0.27385711669921875, -0.2654876708984375, -0.25711822509765625, -0.248748779296875, -0.24037933349609375, -0.2320098876953125, -0.22364044189453125, -0.21527099609375, -0.20690155029296875, -0.1985321044921875, -0.19016265869140625, -0.181793212890625, -0.17342376708984375, -0.1650543212890625, -0.15668487548828125, -0.1483154296875, -0.13994598388671875, -0.1315765380859375, -0.12320709228515625, -0.114837646484375, -0.10646820068359375, -0.0980987548828125, -0.08972930908203125, -0.08135986328125, -0.07299041748046875, -0.0646209716796875, -0.05625152587890625, -0.047882080078125, -0.03951263427734375, -0.0311431884765625, -0.02277374267578125, -0.014404296875, -0.00603485107421875, 0.0023345947265625, 0.01070404052734375, 0.019073486328125, 0.02744293212890625, 0.0358123779296875, 0.04418182373046875, 0.05255126953125, 0.06092071533203125, 0.0692901611328125, 0.07765960693359375, 0.086029052734375, 0.09439849853515625, 0.1027679443359375, 0.11113739013671875, 0.1195068359375, 0.12787628173828125, 0.1362457275390625, 0.14461517333984375, 0.152984619140625, 0.16135406494140625, 0.1697235107421875, 0.17809295654296875, 0.18646240234375, 0.19483184814453125, 0.2032012939453125, 0.21157073974609375, 0.219940185546875, 0.22830963134765625, 0.2366790771484375, 0.24504852294921875, 0.25341796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 10.0, 4.0, 7.0, 7.0, 13.0, 18.0, 32.0, 17.0, 53.0, 53.0, 65.0, 83.0, 95.0, 84.0, 104.0, 65.0, 72.0, 55.0, 38.0, 30.0, 24.0, 17.0, 10.0, 14.0, 8.0, 7.0, 3.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3172626495361328e-05, -1.2657605111598969e-05, -1.2142583727836609e-05, -1.162756234407425e-05, -1.111254096031189e-05, -1.059751957654953e-05, -1.008249819278717e-05, -9.56747680902481e-06, -9.052455425262451e-06, -8.537434041500092e-06, -8.022412657737732e-06, -7.507391273975372e-06, -6.992369890213013e-06, -6.477348506450653e-06, -5.9623271226882935e-06, -5.447305738925934e-06, -4.932284355163574e-06, -4.417262971401215e-06, -3.902241587638855e-06, -3.3872202038764954e-06, -2.8721988201141357e-06, -2.357177436351776e-06, -1.8421560525894165e-06, -1.3271346688270569e-06, -8.121132850646973e-07, -2.9709190130233765e-07, 2.1792948246002197e-07, 7.329508662223816e-07, 1.2479722499847412e-06, 1.7629936337471008e-06, 2.2780150175094604e-06, 2.79303640127182e-06, 3.3080577850341797e-06, 3.823079168796539e-06, 4.338100552558899e-06, 4.8531219363212585e-06, 5.368143320083618e-06, 5.883164703845978e-06, 6.398186087608337e-06, 6.913207471370697e-06, 7.428228855133057e-06, 7.943250238895416e-06, 8.458271622657776e-06, 8.973293006420135e-06, 9.488314390182495e-06, 1.0003335773944855e-05, 1.0518357157707214e-05, 1.1033378541469574e-05, 1.1548399925231934e-05, 1.2063421308994293e-05, 1.2578442692756653e-05, 1.3093464076519012e-05, 1.3608485460281372e-05, 1.4123506844043732e-05, 1.4638528227806091e-05, 1.5153549611568451e-05, 1.566857099533081e-05, 1.618359237909317e-05, 1.669861376285553e-05, 1.721363514661789e-05, 1.772865653038025e-05, 1.824367791414261e-05, 1.8758699297904968e-05, 1.9273720681667328e-05, 1.9788742065429688e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 8.0, 14.0, 29.0, 29.0, 63.0, 95.0, 150.0, 304.0, 679.0, 1321.0, 3652.0, 12009.0, 55297.0, 302248.0, 506000.0, 131483.0, 24560.0, 6479.0, 2259.0, 899.0, 438.0, 218.0, 101.0, 70.0, 38.0, 36.0, 19.0, 14.0, 8.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.237060546875, -0.23013877868652344, -0.22321701049804688, -0.2162952423095703, -0.20937347412109375, -0.2024517059326172, -0.19552993774414062, -0.18860816955566406, -0.1816864013671875, -0.17476463317871094, -0.16784286499023438, -0.1609210968017578, -0.15399932861328125, -0.1470775604248047, -0.14015579223632812, -0.13323402404785156, -0.126312255859375, -0.11939048767089844, -0.11246871948242188, -0.10554695129394531, -0.09862518310546875, -0.09170341491699219, -0.08478164672851562, -0.07785987854003906, -0.0709381103515625, -0.06401634216308594, -0.057094573974609375, -0.05017280578613281, -0.04325103759765625, -0.03632926940917969, -0.029407501220703125, -0.022485733032226562, -0.01556396484375, -0.008642196655273438, -0.001720428466796875, 0.0052013397216796875, 0.01212310791015625, 0.019044876098632812, 0.025966644287109375, 0.03288841247558594, 0.0398101806640625, 0.04673194885253906, 0.053653717041015625, 0.06057548522949219, 0.06749725341796875, 0.07441902160644531, 0.08134078979492188, 0.08826255798339844, 0.095184326171875, 0.10210609436035156, 0.10902786254882812, 0.11594963073730469, 0.12287139892578125, 0.1297931671142578, 0.13671493530273438, 0.14363670349121094, 0.1505584716796875, 0.15748023986816406, 0.16440200805664062, 0.1713237762451172, 0.17824554443359375, 0.1851673126220703, 0.19208908081054688, 0.19901084899902344, 0.2059326171875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 8.0, 8.0, 12.0, 12.0, 6.0, 16.0, 13.0, 20.0, 32.0, 38.0, 32.0, 55.0, 49.0, 52.0, 60.0, 50.0, 48.0, 59.0, 60.0, 63.0, 53.0, 45.0, 38.0, 30.0, 16.0, 22.0, 17.0, 10.0, 8.0, 9.0, 12.0, 9.0, 7.0, 2.0, 4.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1748046875, -0.16942787170410156, -0.16405105590820312, -0.1586742401123047, -0.15329742431640625, -0.1479206085205078, -0.14254379272460938, -0.13716697692871094, -0.1317901611328125, -0.12641334533691406, -0.12103652954101562, -0.11565971374511719, -0.11028289794921875, -0.10490608215332031, -0.09952926635742188, -0.09415245056152344, -0.088775634765625, -0.08339881896972656, -0.07802200317382812, -0.07264518737792969, -0.06726837158203125, -0.06189155578613281, -0.056514739990234375, -0.05113792419433594, -0.0457611083984375, -0.04038429260253906, -0.035007476806640625, -0.029630661010742188, -0.02425384521484375, -0.018877029418945312, -0.013500213623046875, -0.008123397827148438, -0.00274658203125, 0.0026302337646484375, 0.008007049560546875, 0.013383865356445312, 0.01876068115234375, 0.024137496948242188, 0.029514312744140625, 0.03489112854003906, 0.0402679443359375, 0.04564476013183594, 0.051021575927734375, 0.05639839172363281, 0.06177520751953125, 0.06715202331542969, 0.07252883911132812, 0.07790565490722656, 0.083282470703125, 0.08865928649902344, 0.09403610229492188, 0.09941291809082031, 0.10478973388671875, 0.11016654968261719, 0.11554336547851562, 0.12092018127441406, 0.1262969970703125, 0.13167381286621094, 0.13705062866210938, 0.1424274444580078, 0.14780426025390625, 0.1531810760498047, 0.15855789184570312, 0.16393470764160156, 0.1693115234375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 29.0, 152.0, 388.0, 310.0, 103.0, 17.0, 3.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.674155235290527, -14.315423965454102, -13.95669174194336, -13.597960472106934, -13.239229202270508, -12.880496978759766, -12.52176570892334, -12.163034439086914, -11.804302215576172, -11.445570945739746, -11.086838722229004, -10.728107452392578, -10.369375228881836, -10.01064395904541, -9.651912689208984, -9.293180465698242, -8.934449195861816, -8.57571792602539, -8.216985702514648, -7.858254432678223, -7.499522686004639, -7.140790939331055, -6.782059669494629, -6.423327922821045, -6.064596176147461, -5.705864429473877, -5.347132682800293, -4.988401412963867, -4.629669666290283, -4.270937919616699, -3.9122064113616943, -3.5534749031066895, -3.194744110107422, -2.836012363433838, -2.477280855178833, -2.118549346923828, -1.7598176002502441, -1.4010859727859497, -1.0423543453216553, -0.6836228370666504, -0.3248910903930664, 0.03384053707122803, 0.39257216453552246, 0.7513037919998169, 1.1100354194641113, 1.4687670469284058, 1.8274986743927002, 2.186230182647705, 2.544961929321289, 2.903693675994873, 3.262425184249878, 3.621156692504883, 3.979888439178467, 4.338620185852051, 4.697351455688477, 5.0560832023620605, 5.4148149490356445, 5.7735466957092285, 6.1322784423828125, 6.491009712219238, 6.849741458892822, 7.208473205566406, 7.567204475402832, 7.925936222076416, 8.28466796875]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 7.0, 15.0, 9.0, 10.0, 19.0, 18.0, 19.0, 20.0, 23.0, 34.0, 32.0, 53.0, 41.0, 55.0, 61.0, 61.0, 55.0, 61.0, 54.0, 55.0, 38.0, 38.0, 30.0, 33.0, 32.0, 28.0, 20.0, 17.0, 13.0, 17.0, 5.0, 5.0, 7.0, 3.0, 1.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.93811321258545, -8.700550079345703, -8.462986946105957, -8.225423812866211, -7.987860679626465, -7.750297546386719, -7.512734413146973, -7.275171279907227, -7.0376081466674805, -6.800045013427734, -6.562481880187988, -6.324918746948242, -6.087355613708496, -5.84979248046875, -5.612229347229004, -5.374666213989258, -5.13710355758667, -4.899540424346924, -4.661977291107178, -4.424414157867432, -4.1868510246276855, -3.9492878913879395, -3.7117249965667725, -3.4741618633270264, -3.2365987300872803, -2.999035596847534, -2.761472463607788, -2.523909568786621, -2.286346435546875, -2.048783302307129, -1.8112201690673828, -1.5736570358276367, -1.3360939025878906, -1.0985307693481445, -0.8609676957130432, -0.6234046220779419, -0.3858414888381958, -0.1482783555984497, 0.08928465843200684, 0.32684779167175293, 0.564410924911499, 0.8019740581512451, 1.0395371913909912, 1.2771002054214478, 1.5146633386611938, 1.75222647190094, 1.9897894859313965, 2.2273526191711426, 2.4649157524108887, 2.7024788856506348, 2.940042018890381, 3.177605152130127, 3.415168285369873, 3.652731418609619, 3.890294313430786, 4.127857208251953, 4.365420341491699, 4.602983474731445, 4.840546607971191, 5.0781097412109375, 5.315672874450684, 5.55323600769043, 5.790799140930176, 6.028362274169922, 6.265925407409668]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 12.0, 11.0, 10.0, 15.0, 18.0, 27.0, 25.0, 21.0, 63.0, 56.0, 167.0, 397.0, 1765.0, 34765.0, 4107007.0, 47118.0, 1922.0, 430.0, 164.0, 82.0, 41.0, 31.0, 29.0, 22.0, 16.0, 13.0, 9.0, 9.0, 6.0, 7.0, 4.0, 2.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.17578125, -5.04144287109375, -4.9071044921875, -4.77276611328125, -4.638427734375, -4.50408935546875, -4.3697509765625, -4.23541259765625, -4.10107421875, -3.96673583984375, -3.8323974609375, -3.69805908203125, -3.563720703125, -3.42938232421875, -3.2950439453125, -3.16070556640625, -3.0263671875, -2.89202880859375, -2.7576904296875, -2.62335205078125, -2.489013671875, -2.35467529296875, -2.2203369140625, -2.08599853515625, -1.95166015625, -1.81732177734375, -1.6829833984375, -1.54864501953125, -1.414306640625, -1.27996826171875, -1.1456298828125, -1.01129150390625, -0.876953125, -0.74261474609375, -0.6082763671875, -0.47393798828125, -0.339599609375, -0.20526123046875, -0.0709228515625, 0.06341552734375, 0.19775390625, 0.33209228515625, 0.4664306640625, 0.60076904296875, 0.735107421875, 0.86944580078125, 1.0037841796875, 1.13812255859375, 1.2724609375, 1.40679931640625, 1.5411376953125, 1.67547607421875, 1.809814453125, 1.94415283203125, 2.0784912109375, 2.21282958984375, 2.34716796875, 2.48150634765625, 2.6158447265625, 2.75018310546875, 2.884521484375, 3.01885986328125, 3.1531982421875, 3.28753662109375, 3.421875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 8.0, 8.0, 9.0, 11.0, 10.0, 18.0, 31.0, 24.0, 29.0, 32.0, 35.0, 46.0, 65.0, 61.0, 68.0, 68.0, 65.0, 54.0, 68.0, 50.0, 47.0, 39.0, 40.0, 19.0, 18.0, 17.0, 11.0, 9.0, 5.0, 7.0, 7.0, 6.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.78271484375, -0.7628135681152344, -0.7429122924804688, -0.7230110168457031, -0.7031097412109375, -0.6832084655761719, -0.6633071899414062, -0.6434059143066406, -0.623504638671875, -0.6036033630371094, -0.5837020874023438, -0.5638008117675781, -0.5438995361328125, -0.5239982604980469, -0.5040969848632812, -0.4841957092285156, -0.46429443359375, -0.4443931579589844, -0.42449188232421875, -0.4045906066894531, -0.3846893310546875, -0.3647880554199219, -0.34488677978515625, -0.3249855041503906, -0.305084228515625, -0.2851829528808594, -0.26528167724609375, -0.24538040161132812, -0.2254791259765625, -0.20557785034179688, -0.18567657470703125, -0.16577529907226562, -0.1458740234375, -0.12597274780273438, -0.10607147216796875, -0.08617019653320312, -0.0662689208984375, -0.046367645263671875, -0.02646636962890625, -0.006565093994140625, 0.013336181640625, 0.033237457275390625, 0.05313873291015625, 0.07304000854492188, 0.0929412841796875, 0.11284255981445312, 0.13274383544921875, 0.15264511108398438, 0.17254638671875, 0.19244766235351562, 0.21234893798828125, 0.23225021362304688, 0.2521514892578125, 0.2720527648925781, 0.29195404052734375, 0.3118553161621094, 0.331756591796875, 0.3516578674316406, 0.37155914306640625, 0.3914604187011719, 0.4113616943359375, 0.4312629699707031, 0.45116424560546875, 0.4710655212402344, 0.490966796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 6.0, 6.0, 4.0, 5.0, 18.0, 9.0, 28.0, 42.0, 76.0, 177.0, 469.0, 1451.0, 5268.0, 22690.0, 124675.0, 776240.0, 2425510.0, 697774.0, 112128.0, 20619.0, 4954.0, 1318.0, 444.0, 164.0, 88.0, 37.0, 17.0, 21.0, 10.0, 11.0, 5.0, 4.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2060546875, -1.1710662841796875, -1.136077880859375, -1.1010894775390625, -1.06610107421875, -1.0311126708984375, -0.996124267578125, -0.9611358642578125, -0.9261474609375, -0.8911590576171875, -0.856170654296875, -0.8211822509765625, -0.78619384765625, -0.7512054443359375, -0.716217041015625, -0.6812286376953125, -0.646240234375, -0.6112518310546875, -0.576263427734375, -0.5412750244140625, -0.50628662109375, -0.4712982177734375, -0.436309814453125, -0.4013214111328125, -0.3663330078125, -0.3313446044921875, -0.296356201171875, -0.2613677978515625, -0.22637939453125, -0.1913909912109375, -0.156402587890625, -0.1214141845703125, -0.08642578125, -0.0514373779296875, -0.016448974609375, 0.0185394287109375, 0.05352783203125, 0.0885162353515625, 0.123504638671875, 0.1584930419921875, 0.1934814453125, 0.2284698486328125, 0.263458251953125, 0.2984466552734375, 0.33343505859375, 0.3684234619140625, 0.403411865234375, 0.4384002685546875, 0.473388671875, 0.5083770751953125, 0.543365478515625, 0.5783538818359375, 0.61334228515625, 0.6483306884765625, 0.683319091796875, 0.7183074951171875, 0.7532958984375, 0.7882843017578125, 0.823272705078125, 0.8582611083984375, 0.89324951171875, 0.9282379150390625, 0.963226318359375, 0.9982147216796875, 1.033203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 7.0, 8.0, 6.0, 10.0, 20.0, 24.0, 24.0, 38.0, 55.0, 99.0, 110.0, 153.0, 220.0, 272.0, 385.0, 502.0, 535.0, 446.0, 315.0, 228.0, 179.0, 127.0, 88.0, 74.0, 55.0, 36.0, 20.0, 15.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.65283203125, -0.6348114013671875, -0.616790771484375, -0.5987701416015625, -0.58074951171875, -0.5627288818359375, -0.544708251953125, -0.5266876220703125, -0.5086669921875, -0.4906463623046875, -0.472625732421875, -0.4546051025390625, -0.43658447265625, -0.4185638427734375, -0.400543212890625, -0.3825225830078125, -0.364501953125, -0.3464813232421875, -0.328460693359375, -0.3104400634765625, -0.29241943359375, -0.2743988037109375, -0.256378173828125, -0.2383575439453125, -0.2203369140625, -0.2023162841796875, -0.184295654296875, -0.1662750244140625, -0.14825439453125, -0.1302337646484375, -0.112213134765625, -0.0941925048828125, -0.076171875, -0.0581512451171875, -0.040130615234375, -0.0221099853515625, -0.00408935546875, 0.0139312744140625, 0.031951904296875, 0.0499725341796875, 0.0679931640625, 0.0860137939453125, 0.104034423828125, 0.1220550537109375, 0.14007568359375, 0.1580963134765625, 0.176116943359375, 0.1941375732421875, 0.212158203125, 0.2301788330078125, 0.248199462890625, 0.2662200927734375, 0.28424072265625, 0.3022613525390625, 0.320281982421875, 0.3383026123046875, 0.3563232421875, 0.3743438720703125, 0.392364501953125, 0.4103851318359375, 0.42840576171875, 0.4464263916015625, 0.464447021484375, 0.4824676513671875, 0.50048828125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 11.0, 38.0, 104.0, 195.0, 241.0, 206.0, 114.0, 57.0, 18.0, 8.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.346762657165527, -6.18272590637207, -6.018688678741455, -5.854651927947998, -5.690615177154541, -5.526577949523926, -5.362541198730469, -5.198504447937012, -5.034467697143555, -4.870430946350098, -4.706393718719482, -4.542356967926025, -4.378320217132568, -4.214282989501953, -4.050246238708496, -3.886209487915039, -3.722172260284424, -3.5581352710723877, -3.3940985202789307, -3.2300615310668945, -3.0660247802734375, -2.9019877910614014, -2.7379508018493652, -2.573914051055908, -2.409877061843872, -2.245840072631836, -2.081803321838379, -1.9177663326263428, -1.7537294626235962, -1.5896925926208496, -1.4256556034088135, -1.261618733406067, -1.0975818634033203, -0.9335449934005737, -0.7695080637931824, -0.605471134185791, -0.44143426418304443, -0.27739739418029785, -0.1133604645729065, 0.05067646503448486, 0.21471333503723145, 0.3787502348423004, 0.5427871346473694, 0.7068240642547607, 0.8708609342575073, 1.034897804260254, 1.19893479347229, 1.3629716634750366, 1.5270085334777832, 1.6910454034805298, 1.8550822734832764, 2.0191192626953125, 2.1831560134887695, 2.3471930027008057, 2.511229991912842, 2.675266742706299, 2.839303731918335, 3.003340721130371, 3.167377471923828, 3.3314144611358643, 3.4954514503479004, 3.6594882011413574, 3.8235251903533936, 3.9875621795654297, 4.151598930358887]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 9.0, 8.0, 12.0, 11.0, 14.0, 15.0, 20.0, 24.0, 22.0, 34.0, 33.0, 45.0, 37.0, 41.0, 46.0, 53.0, 32.0, 52.0, 62.0, 48.0, 45.0, 37.0, 35.0, 39.0, 34.0, 29.0, 25.0, 30.0, 13.0, 19.0, 17.0, 11.0, 12.0, 9.0, 9.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0], "bins": [-2.0339834690093994, -1.981648564338684, -1.9293136596679688, -1.8769787549972534, -1.824643850326538, -1.7723089456558228, -1.7199740409851074, -1.667639136314392, -1.6153042316436768, -1.5629693269729614, -1.510634422302246, -1.4582995176315308, -1.4059646129608154, -1.3536297082901, -1.3012948036193848, -1.2489598989486694, -1.196624994277954, -1.1442900896072388, -1.0919551849365234, -1.039620280265808, -0.9872853755950928, -0.9349504709243774, -0.8826155662536621, -0.8302806615829468, -0.7779456377029419, -0.7256107330322266, -0.6732758283615112, -0.6209409236907959, -0.5686060190200806, -0.5162711143493652, -0.4639361798763275, -0.4116012752056122, -0.35926640033721924, -0.3069314956665039, -0.2545965909957886, -0.20226167142391205, -0.14992676675319672, -0.09759184718132019, -0.04525694251060486, 0.007077962160110474, 0.059412866830825806, 0.11174777150154114, 0.16408267617225647, 0.216417595744133, 0.2687525153160095, 0.32108741998672485, 0.3734223246574402, 0.4257572293281555, 0.47809213399887085, 0.5304270386695862, 0.5827619433403015, 0.6350968480110168, 0.6874317526817322, 0.7397667169570923, 0.7921016216278076, 0.844436526298523, 0.8967714309692383, 0.9491063356399536, 1.001441240310669, 1.0537761449813843, 1.1061110496520996, 1.158445954322815, 1.2107808589935303, 1.2631157636642456, 1.315450668334961]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 9.0, 21.0, 15.0, 24.0, 36.0, 86.0, 99.0, 162.0, 309.0, 475.0, 967.0, 1804.0, 3873.0, 9534.0, 25735.0, 79531.0, 241899.0, 390813.0, 195076.0, 62765.0, 20951.0, 7619.0, 3303.0, 1518.0, 791.0, 437.0, 261.0, 155.0, 103.0, 57.0, 35.0, 24.0, 20.0, 20.0, 11.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8603515625, -0.8320465087890625, -0.803741455078125, -0.7754364013671875, -0.74713134765625, -0.7188262939453125, -0.690521240234375, -0.6622161865234375, -0.6339111328125, -0.6056060791015625, -0.577301025390625, -0.5489959716796875, -0.52069091796875, -0.4923858642578125, -0.464080810546875, -0.4357757568359375, -0.407470703125, -0.3791656494140625, -0.350860595703125, -0.3225555419921875, -0.29425048828125, -0.2659454345703125, -0.237640380859375, -0.2093353271484375, -0.1810302734375, -0.1527252197265625, -0.124420166015625, -0.0961151123046875, -0.06781005859375, -0.0395050048828125, -0.011199951171875, 0.0171051025390625, 0.04541015625, 0.0737152099609375, 0.102020263671875, 0.1303253173828125, 0.15863037109375, 0.1869354248046875, 0.215240478515625, 0.2435455322265625, 0.2718505859375, 0.3001556396484375, 0.328460693359375, 0.3567657470703125, 0.38507080078125, 0.4133758544921875, 0.441680908203125, 0.4699859619140625, 0.498291015625, 0.5265960693359375, 0.554901123046875, 0.5832061767578125, 0.61151123046875, 0.6398162841796875, 0.668121337890625, 0.6964263916015625, 0.7247314453125, 0.7530364990234375, 0.781341552734375, 0.8096466064453125, 0.83795166015625, 0.8662567138671875, 0.894561767578125, 0.9228668212890625, 0.951171875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 5.0, 9.0, 9.0, 11.0, 17.0, 15.0, 26.0, 29.0, 24.0, 33.0, 38.0, 43.0, 62.0, 83.0, 66.0, 64.0, 72.0, 75.0, 58.0, 48.0, 35.0, 38.0, 21.0, 32.0, 15.0, 16.0, 19.0, 8.0, 10.0, 4.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.77978515625, -0.7594070434570312, -0.7390289306640625, -0.7186508178710938, -0.698272705078125, -0.6778945922851562, -0.6575164794921875, -0.6371383666992188, -0.61676025390625, -0.5963821411132812, -0.5760040283203125, -0.5556259155273438, -0.535247802734375, -0.5148696899414062, -0.4944915771484375, -0.47411346435546875, -0.4537353515625, -0.43335723876953125, -0.4129791259765625, -0.39260101318359375, -0.372222900390625, -0.35184478759765625, -0.3314666748046875, -0.31108856201171875, -0.29071044921875, -0.27033233642578125, -0.2499542236328125, -0.22957611083984375, -0.209197998046875, -0.18881988525390625, -0.1684417724609375, -0.14806365966796875, -0.127685546875, -0.10730743408203125, -0.0869293212890625, -0.06655120849609375, -0.046173095703125, -0.02579498291015625, -0.0054168701171875, 0.01496124267578125, 0.03533935546875, 0.05571746826171875, 0.0760955810546875, 0.09647369384765625, 0.116851806640625, 0.13722991943359375, 0.1576080322265625, 0.17798614501953125, 0.1983642578125, 0.21874237060546875, 0.2391204833984375, 0.25949859619140625, 0.279876708984375, 0.30025482177734375, 0.3206329345703125, 0.34101104736328125, 0.36138916015625, 0.38176727294921875, 0.4021453857421875, 0.42252349853515625, 0.442901611328125, 0.46327972412109375, 0.4836578369140625, 0.5040359497070312, 0.5244140625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 4.0, 7.0, 5.0, 11.0, 6.0, 12.0, 11.0, 19.0, 23.0, 21.0, 24.0, 27.0, 30.0, 43.0, 48.0, 71.0, 155.0, 433.0, 3381.0, 129080.0, 876374.0, 36421.0, 1579.0, 285.0, 117.0, 66.0, 53.0, 38.0, 28.0, 25.0, 23.0, 14.0, 19.0, 16.0, 18.0, 12.0, 11.0, 8.0, 4.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.5703125, -3.4564208984375, -3.342529296875, -3.2286376953125, -3.11474609375, -3.0008544921875, -2.886962890625, -2.7730712890625, -2.6591796875, -2.5452880859375, -2.431396484375, -2.3175048828125, -2.20361328125, -2.0897216796875, -1.975830078125, -1.8619384765625, -1.748046875, -1.6341552734375, -1.520263671875, -1.4063720703125, -1.29248046875, -1.1785888671875, -1.064697265625, -0.9508056640625, -0.8369140625, -0.7230224609375, -0.609130859375, -0.4952392578125, -0.38134765625, -0.2674560546875, -0.153564453125, -0.0396728515625, 0.07421875, 0.1881103515625, 0.302001953125, 0.4158935546875, 0.52978515625, 0.6436767578125, 0.757568359375, 0.8714599609375, 0.9853515625, 1.0992431640625, 1.213134765625, 1.3270263671875, 1.44091796875, 1.5548095703125, 1.668701171875, 1.7825927734375, 1.896484375, 2.0103759765625, 2.124267578125, 2.2381591796875, 2.35205078125, 2.4659423828125, 2.579833984375, 2.6937255859375, 2.8076171875, 2.9215087890625, 3.035400390625, 3.1492919921875, 3.26318359375, 3.3770751953125, 3.490966796875, 3.6048583984375, 3.71875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 1.0, 7.0, 9.0, 11.0, 14.0, 10.0, 9.0, 16.0, 20.0, 20.0, 22.0, 35.0, 24.0, 31.0, 31.0, 28.0, 40.0, 42.0, 42.0, 38.0, 47.0, 44.0, 28.0, 46.0, 39.0, 39.0, 42.0, 28.0, 35.0, 27.0, 34.0, 15.0, 22.0, 16.0, 20.0, 14.0, 11.0, 11.0, 4.0, 10.0, 4.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.97314453125, -0.9416885375976562, -0.9102325439453125, -0.8787765502929688, -0.847320556640625, -0.8158645629882812, -0.7844085693359375, -0.7529525756835938, -0.72149658203125, -0.6900405883789062, -0.6585845947265625, -0.6271286010742188, -0.595672607421875, -0.5642166137695312, -0.5327606201171875, -0.5013046264648438, -0.4698486328125, -0.43839263916015625, -0.4069366455078125, -0.37548065185546875, -0.344024658203125, -0.31256866455078125, -0.2811126708984375, -0.24965667724609375, -0.21820068359375, -0.18674468994140625, -0.1552886962890625, -0.12383270263671875, -0.092376708984375, -0.06092071533203125, -0.0294647216796875, 0.00199127197265625, 0.033447265625, 0.06490325927734375, 0.0963592529296875, 0.12781524658203125, 0.159271240234375, 0.19072723388671875, 0.2221832275390625, 0.25363922119140625, 0.28509521484375, 0.31655120849609375, 0.3480072021484375, 0.37946319580078125, 0.410919189453125, 0.44237518310546875, 0.4738311767578125, 0.5052871704101562, 0.5367431640625, 0.5681991577148438, 0.5996551513671875, 0.6311111450195312, 0.662567138671875, 0.6940231323242188, 0.7254791259765625, 0.7569351196289062, 0.78839111328125, 0.8198471069335938, 0.8513031005859375, 0.8827590942382812, 0.914215087890625, 0.9456710815429688, 0.9771270751953125, 1.0085830688476562, 1.0400390625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 4.0, 11.0, 8.0, 16.0, 16.0, 30.0, 39.0, 61.0, 95.0, 176.0, 328.0, 597.0, 1100.0, 2029.0, 4016.0, 8870.0, 20082.0, 49726.0, 130183.0, 294100.0, 304317.0, 139669.0, 52989.0, 21672.0, 9333.0, 4434.0, 2168.0, 1118.0, 588.0, 295.0, 189.0, 113.0, 65.0, 34.0, 24.0, 15.0, 16.0, 4.0, 7.0, 5.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.29541015625, -0.2852363586425781, -0.27506256103515625, -0.2648887634277344, -0.2547149658203125, -0.24454116821289062, -0.23436737060546875, -0.22419357299804688, -0.214019775390625, -0.20384597778320312, -0.19367218017578125, -0.18349838256835938, -0.1733245849609375, -0.16315078735351562, -0.15297698974609375, -0.14280319213867188, -0.13262939453125, -0.12245559692382812, -0.11228179931640625, -0.10210800170898438, -0.0919342041015625, -0.08176040649414062, -0.07158660888671875, -0.061412811279296875, -0.051239013671875, -0.041065216064453125, -0.03089141845703125, -0.020717620849609375, -0.0105438232421875, -0.000370025634765625, 0.00980377197265625, 0.019977569580078125, 0.0301513671875, 0.040325164794921875, 0.05049896240234375, 0.060672760009765625, 0.0708465576171875, 0.08102035522460938, 0.09119415283203125, 0.10136795043945312, 0.111541748046875, 0.12171554565429688, 0.13188934326171875, 0.14206314086914062, 0.1522369384765625, 0.16241073608398438, 0.17258453369140625, 0.18275833129882812, 0.19293212890625, 0.20310592651367188, 0.21327972412109375, 0.22345352172851562, 0.2336273193359375, 0.24380111694335938, 0.25397491455078125, 0.2641487121582031, 0.274322509765625, 0.2844963073730469, 0.29467010498046875, 0.3048439025878906, 0.3150177001953125, 0.3251914978027344, 0.33536529541015625, 0.3455390930175781, 0.355712890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 5.0, 4.0, 2.0, 3.0, 5.0, 13.0, 11.0, 14.0, 21.0, 29.0, 36.0, 61.0, 73.0, 86.0, 86.0, 108.0, 105.0, 79.0, 68.0, 59.0, 30.0, 28.0, 24.0, 15.0, 11.0, 6.0, 4.0, 4.0, 7.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.137920379638672e-05, -4.968792200088501e-05, -4.79966402053833e-05, -4.630535840988159e-05, -4.461407661437988e-05, -4.2922794818878174e-05, -4.1231513023376465e-05, -3.9540231227874756e-05, -3.784894943237305e-05, -3.615766763687134e-05, -3.446638584136963e-05, -3.277510404586792e-05, -3.108382225036621e-05, -2.9392540454864502e-05, -2.7701258659362793e-05, -2.6009976863861084e-05, -2.4318695068359375e-05, -2.2627413272857666e-05, -2.0936131477355957e-05, -1.9244849681854248e-05, -1.755356788635254e-05, -1.586228609085083e-05, -1.4171004295349121e-05, -1.2479722499847412e-05, -1.0788440704345703e-05, -9.097158908843994e-06, -7.405877113342285e-06, -5.714595317840576e-06, -4.023313522338867e-06, -2.332031726837158e-06, -6.407499313354492e-07, 1.0505318641662598e-06, 2.7418136596679688e-06, 4.433095455169678e-06, 6.124377250671387e-06, 7.815659046173096e-06, 9.506940841674805e-06, 1.1198222637176514e-05, 1.2889504432678223e-05, 1.4580786228179932e-05, 1.627206802368164e-05, 1.796334981918335e-05, 1.965463161468506e-05, 2.1345913410186768e-05, 2.3037195205688477e-05, 2.4728477001190186e-05, 2.6419758796691895e-05, 2.8111040592193604e-05, 2.9802322387695312e-05, 3.149360418319702e-05, 3.318488597869873e-05, 3.487616777420044e-05, 3.656744956970215e-05, 3.825873136520386e-05, 3.9950013160705566e-05, 4.1641294956207275e-05, 4.3332576751708984e-05, 4.502385854721069e-05, 4.67151403427124e-05, 4.840642213821411e-05, 5.009770393371582e-05, 5.178898572921753e-05, 5.348026752471924e-05, 5.517154932022095e-05, 5.6862831115722656e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 6.0, 4.0, 12.0, 18.0, 19.0, 23.0, 35.0, 29.0, 52.0, 81.0, 233.0, 1583.0, 48067.0, 906973.0, 88638.0, 2220.0, 242.0, 93.0, 58.0, 48.0, 34.0, 26.0, 23.0, 15.0, 11.0, 7.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.470703125, -1.4325714111328125, -1.394439697265625, -1.3563079833984375, -1.31817626953125, -1.2800445556640625, -1.241912841796875, -1.2037811279296875, -1.1656494140625, -1.1275177001953125, -1.089385986328125, -1.0512542724609375, -1.01312255859375, -0.9749908447265625, -0.936859130859375, -0.8987274169921875, -0.860595703125, -0.8224639892578125, -0.784332275390625, -0.7462005615234375, -0.70806884765625, -0.6699371337890625, -0.631805419921875, -0.5936737060546875, -0.5555419921875, -0.5174102783203125, -0.479278564453125, -0.4411468505859375, -0.40301513671875, -0.3648834228515625, -0.326751708984375, -0.2886199951171875, -0.25048828125, -0.2123565673828125, -0.174224853515625, -0.1360931396484375, -0.09796142578125, -0.0598297119140625, -0.021697998046875, 0.0164337158203125, 0.0545654296875, 0.0926971435546875, 0.130828857421875, 0.1689605712890625, 0.20709228515625, 0.2452239990234375, 0.283355712890625, 0.3214874267578125, 0.359619140625, 0.3977508544921875, 0.435882568359375, 0.4740142822265625, 0.51214599609375, 0.5502777099609375, 0.588409423828125, 0.6265411376953125, 0.6646728515625, 0.7028045654296875, 0.740936279296875, 0.7790679931640625, 0.81719970703125, 0.8553314208984375, 0.893463134765625, 0.9315948486328125, 0.9697265625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 4.0, 9.0, 10.0, 29.0, 20.0, 22.0, 24.0, 40.0, 48.0, 64.0, 58.0, 68.0, 63.0, 71.0, 67.0, 59.0, 59.0, 59.0, 50.0, 40.0, 42.0, 20.0, 19.0, 20.0, 13.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.326416015625, -0.3181324005126953, -0.3098487854003906, -0.30156517028808594, -0.29328155517578125, -0.28499794006347656, -0.2767143249511719, -0.2684307098388672, -0.2601470947265625, -0.2518634796142578, -0.24357986450195312, -0.23529624938964844, -0.22701263427734375, -0.21872901916503906, -0.21044540405273438, -0.2021617889404297, -0.193878173828125, -0.1855945587158203, -0.17731094360351562, -0.16902732849121094, -0.16074371337890625, -0.15246009826660156, -0.14417648315429688, -0.1358928680419922, -0.1276092529296875, -0.11932563781738281, -0.11104202270507812, -0.10275840759277344, -0.09447479248046875, -0.08619117736816406, -0.07790756225585938, -0.06962394714355469, -0.06134033203125, -0.05305671691894531, -0.044773101806640625, -0.03648948669433594, -0.02820587158203125, -0.019922256469726562, -0.011638641357421875, -0.0033550262451171875, 0.0049285888671875, 0.013212203979492188, 0.021495819091796875, 0.029779434204101562, 0.03806304931640625, 0.04634666442871094, 0.054630279541015625, 0.06291389465332031, 0.071197509765625, 0.07948112487792969, 0.08776473999023438, 0.09604835510253906, 0.10433197021484375, 0.11261558532714844, 0.12089920043945312, 0.1291828155517578, 0.1374664306640625, 0.1457500457763672, 0.15403366088867188, 0.16231727600097656, 0.17060089111328125, 0.17888450622558594, 0.18716812133789062, 0.1954517364501953, 0.2037353515625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 83.0, 604.0, 295.0, 26.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0106654167175293, -2.4901881217956543, -1.9697108268737793, -1.4492335319519043, -0.9287562370300293, -0.4082789421081543, 0.1121983528137207, 0.6326756477355957, 1.1531529426574707, 1.6736302375793457, 2.1941075325012207, 2.7145848274230957, 3.2350621223449707, 3.7555394172668457, 4.276016712188721, 4.796494007110596, 5.316971302032471, 5.837448596954346, 6.357925891876221, 6.878403186798096, 7.398880481719971, 7.919357776641846, 8.439834594726562, 8.960311889648438, 9.480789184570312, 10.001266479492188, 10.521743774414062, 11.042221069335938, 11.562698364257812, 12.083175659179688, 12.603652954101562, 13.124130249023438, 13.644607543945312, 14.165084838867188, 14.685562133789062, 15.206039428710938, 15.726516723632812, 16.246994018554688, 16.767471313476562, 17.287948608398438, 17.808425903320312, 18.328903198242188, 18.849380493164062, 19.369857788085938, 19.890335083007812, 20.410812377929688, 20.931289672851562, 21.451766967773438, 21.972244262695312, 22.492721557617188, 23.013198852539062, 23.533676147460938, 24.054153442382812, 24.574630737304688, 25.095108032226562, 25.615585327148438, 26.136062622070312, 26.656539916992188, 27.177017211914062, 27.697494506835938, 28.217971801757812, 28.738449096679688, 29.258926391601562, 29.779403686523438, 30.299880981445312]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 1.0, 5.0, 8.0, 5.0, 5.0, 8.0, 12.0, 17.0, 14.0, 9.0, 16.0, 23.0, 24.0, 29.0, 33.0, 39.0, 41.0, 54.0, 43.0, 34.0, 41.0, 54.0, 49.0, 48.0, 29.0, 49.0, 37.0, 38.0, 45.0, 30.0, 29.0, 27.0, 21.0, 20.0, 15.0, 8.0, 14.0, 9.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.63928484916687, -3.5110559463500977, -3.382827043533325, -3.2545981407165527, -3.1263694763183594, -2.998140573501587, -2.8699116706848145, -2.741682767868042, -2.6134538650512695, -2.485224962234497, -2.3569960594177246, -2.2287673950195312, -2.100538492202759, -1.9723095893859863, -1.8440806865692139, -1.7158517837524414, -1.587623119354248, -1.4593942165374756, -1.3311654329299927, -1.2029365301132202, -1.0747077465057373, -0.9464788436889648, -0.8182499408721924, -0.6900210976600647, -0.561792254447937, -0.4335634112358093, -0.30533453822135925, -0.17710566520690918, -0.048876821994781494, 0.07935202121734619, 0.20758092403411865, 0.33580976724624634, 0.4640388488769531, 0.5922676920890808, 0.7204965353012085, 0.848725438117981, 0.9769542813301086, 1.1051831245422363, 1.2334120273590088, 1.3616409301757812, 1.4898697137832642, 1.6180986166000366, 1.7463274002075195, 1.874556303024292, 2.0027852058410645, 2.131013870239258, 2.2592430114746094, 2.3874716758728027, 2.515700578689575, 2.6439294815063477, 2.77215838432312, 2.9003872871398926, 3.028615951538086, 3.1568448543548584, 3.285073757171631, 3.4133026599884033, 3.541531562805176, 3.6697604656219482, 3.7979893684387207, 3.926218032836914, 4.054447174072266, 4.182675838470459, 4.310904502868652, 4.439133644104004, 4.567362308502197]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 9.0, 12.0, 15.0, 7.0, 11.0, 26.0, 24.0, 28.0, 48.0, 69.0, 61.0, 146.0, 201.0, 306.0, 644.0, 1410.0, 3857.0, 14912.0, 92372.0, 1252955.0, 2594872.0, 198559.0, 24866.0, 5446.0, 1718.0, 712.0, 346.0, 174.0, 131.0, 91.0, 75.0, 36.0, 39.0, 31.0, 20.0, 18.0, 12.0, 10.0, 5.0, 6.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-1.68359375, -1.6382904052734375, -1.592987060546875, -1.5476837158203125, -1.50238037109375, -1.4570770263671875, -1.411773681640625, -1.3664703369140625, -1.3211669921875, -1.2758636474609375, -1.230560302734375, -1.1852569580078125, -1.13995361328125, -1.0946502685546875, -1.049346923828125, -1.0040435791015625, -0.958740234375, -0.9134368896484375, -0.868133544921875, -0.8228302001953125, -0.77752685546875, -0.7322235107421875, -0.686920166015625, -0.6416168212890625, -0.5963134765625, -0.5510101318359375, -0.505706787109375, -0.4604034423828125, -0.41510009765625, -0.3697967529296875, -0.324493408203125, -0.2791900634765625, -0.23388671875, -0.1885833740234375, -0.143280029296875, -0.0979766845703125, -0.05267333984375, -0.0073699951171875, 0.037933349609375, 0.0832366943359375, 0.1285400390625, 0.1738433837890625, 0.219146728515625, 0.2644500732421875, 0.30975341796875, 0.3550567626953125, 0.400360107421875, 0.4456634521484375, 0.490966796875, 0.5362701416015625, 0.581573486328125, 0.6268768310546875, 0.67218017578125, 0.7174835205078125, 0.762786865234375, 0.8080902099609375, 0.8533935546875, 0.8986968994140625, 0.944000244140625, 0.9893035888671875, 1.03460693359375, 1.0799102783203125, 1.125213623046875, 1.1705169677734375, 1.2158203125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 12.0, 1.0, 12.0, 13.0, 6.0, 14.0, 17.0, 20.0, 28.0, 26.0, 35.0, 44.0, 50.0, 53.0, 66.0, 62.0, 64.0, 59.0, 59.0, 62.0, 43.0, 40.0, 46.0, 30.0, 15.0, 26.0, 21.0, 19.0, 11.0, 9.0, 9.0, 8.0, 7.0, 6.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.71435546875, -0.6957931518554688, -0.6772308349609375, -0.6586685180664062, -0.640106201171875, -0.6215438842773438, -0.6029815673828125, -0.5844192504882812, -0.56585693359375, -0.5472946166992188, -0.5287322998046875, -0.5101699829101562, -0.491607666015625, -0.47304534912109375, -0.4544830322265625, -0.43592071533203125, -0.4173583984375, -0.39879608154296875, -0.3802337646484375, -0.36167144775390625, -0.343109130859375, -0.32454681396484375, -0.3059844970703125, -0.28742218017578125, -0.26885986328125, -0.25029754638671875, -0.2317352294921875, -0.21317291259765625, -0.194610595703125, -0.17604827880859375, -0.1574859619140625, -0.13892364501953125, -0.120361328125, -0.10179901123046875, -0.0832366943359375, -0.06467437744140625, -0.046112060546875, -0.02754974365234375, -0.0089874267578125, 0.00957489013671875, 0.02813720703125, 0.04669952392578125, 0.0652618408203125, 0.08382415771484375, 0.102386474609375, 0.12094879150390625, 0.1395111083984375, 0.15807342529296875, 0.1766357421875, 0.19519805908203125, 0.2137603759765625, 0.23232269287109375, 0.250885009765625, 0.26944732666015625, 0.2880096435546875, 0.30657196044921875, 0.32513427734375, 0.34369659423828125, 0.3622589111328125, 0.38082122802734375, 0.399383544921875, 0.41794586181640625, 0.4365081787109375, 0.45507049560546875, 0.4736328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 9.0, 4.0, 7.0, 14.0, 13.0, 19.0, 49.0, 54.0, 83.0, 187.0, 370.0, 866.0, 2859.0, 10177.0, 43633.0, 223928.0, 1095195.0, 2063920.0, 605457.0, 115033.0, 23535.0, 5790.0, 1745.0, 658.0, 296.0, 152.0, 76.0, 46.0, 29.0, 20.0, 14.0, 13.0, 9.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.072265625, -1.0343780517578125, -0.996490478515625, -0.9586029052734375, -0.92071533203125, -0.8828277587890625, -0.844940185546875, -0.8070526123046875, -0.7691650390625, -0.7312774658203125, -0.693389892578125, -0.6555023193359375, -0.61761474609375, -0.5797271728515625, -0.541839599609375, -0.5039520263671875, -0.466064453125, -0.4281768798828125, -0.390289306640625, -0.3524017333984375, -0.31451416015625, -0.2766265869140625, -0.238739013671875, -0.2008514404296875, -0.1629638671875, -0.1250762939453125, -0.087188720703125, -0.0493011474609375, -0.01141357421875, 0.0264739990234375, 0.064361572265625, 0.1022491455078125, 0.14013671875, 0.1780242919921875, 0.215911865234375, 0.2537994384765625, 0.29168701171875, 0.3295745849609375, 0.367462158203125, 0.4053497314453125, 0.4432373046875, 0.4811248779296875, 0.519012451171875, 0.5569000244140625, 0.59478759765625, 0.6326751708984375, 0.670562744140625, 0.7084503173828125, 0.746337890625, 0.7842254638671875, 0.822113037109375, 0.8600006103515625, 0.89788818359375, 0.9357757568359375, 0.973663330078125, 1.0115509033203125, 1.0494384765625, 1.0873260498046875, 1.125213623046875, 1.1631011962890625, 1.20098876953125, 1.2388763427734375, 1.276763916015625, 1.3146514892578125, 1.3525390625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 6.0, 13.0, 15.0, 22.0, 24.0, 28.0, 34.0, 53.0, 64.0, 87.0, 103.0, 136.0, 183.0, 227.0, 272.0, 288.0, 331.0, 402.0, 324.0, 277.0, 228.0, 198.0, 152.0, 134.0, 105.0, 66.0, 63.0, 48.0, 38.0, 31.0, 28.0, 23.0, 14.0, 11.0, 7.0, 8.0, 5.0, 9.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5029296875, -0.48520660400390625, -0.4674835205078125, -0.44976043701171875, -0.432037353515625, -0.41431427001953125, -0.3965911865234375, -0.37886810302734375, -0.36114501953125, -0.34342193603515625, -0.3256988525390625, -0.30797576904296875, -0.290252685546875, -0.27252960205078125, -0.2548065185546875, -0.23708343505859375, -0.2193603515625, -0.20163726806640625, -0.1839141845703125, -0.16619110107421875, -0.148468017578125, -0.13074493408203125, -0.1130218505859375, -0.09529876708984375, -0.07757568359375, -0.05985260009765625, -0.0421295166015625, -0.02440643310546875, -0.006683349609375, 0.01103973388671875, 0.0287628173828125, 0.04648590087890625, 0.064208984375, 0.08193206787109375, 0.0996551513671875, 0.11737823486328125, 0.135101318359375, 0.15282440185546875, 0.1705474853515625, 0.18827056884765625, 0.20599365234375, 0.22371673583984375, 0.2414398193359375, 0.25916290283203125, 0.276885986328125, 0.29460906982421875, 0.3123321533203125, 0.33005523681640625, 0.3477783203125, 0.36550140380859375, 0.3832244873046875, 0.40094757080078125, 0.418670654296875, 0.43639373779296875, 0.4541168212890625, 0.47183990478515625, 0.48956298828125, 0.5072860717773438, 0.5250091552734375, 0.5427322387695312, 0.560455322265625, 0.5781784057617188, 0.5959014892578125, 0.6136245727539062, 0.63134765625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 14.0, 19.0, 40.0, 63.0, 132.0, 122.0, 170.0, 146.0, 131.0, 75.0, 50.0, 15.0, 15.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.313518047332764, -6.164902687072754, -6.016287326812744, -5.867671966552734, -5.719057083129883, -5.570441722869873, -5.421826362609863, -5.2732110023498535, -5.124595642089844, -4.975980281829834, -4.827364921569824, -4.6787495613098145, -4.530134201049805, -4.381519317626953, -4.232903957366943, -4.084288597106934, -3.935673236846924, -3.787057876586914, -3.6384425163269043, -3.4898273944854736, -3.341212034225464, -3.192596673965454, -3.0439815521240234, -2.8953661918640137, -2.746750831604004, -2.598135471343994, -2.4495201110839844, -2.3009049892425537, -2.152289628982544, -2.003674268722534, -1.855059027671814, -1.7064437866210938, -1.5578281879425049, -1.4092128276824951, -1.260597586631775, -1.1119823455810547, -0.9633669853210449, -0.8147516846656799, -0.6661363840103149, -0.5175211429595947, -0.36890578269958496, -0.22029048204421997, -0.07167518138885498, 0.07694011926651001, 0.225555419921875, 0.37417072057724, 0.522786021232605, 0.6714012622833252, 0.820016622543335, 0.9686319231987, 1.117247223854065, 1.2658624649047852, 1.414477825164795, 1.5630931854248047, 1.711708426475525, 1.8603236675262451, 2.008939027786255, 2.1575543880462646, 2.3061695098876953, 2.454784870147705, 2.603400230407715, 2.7520155906677246, 2.9006309509277344, 3.049246072769165, 3.197861433029175]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 3.0, 10.0, 10.0, 5.0, 8.0, 11.0, 12.0, 13.0, 24.0, 21.0, 21.0, 24.0, 32.0, 26.0, 26.0, 39.0, 36.0, 35.0, 45.0, 49.0, 43.0, 40.0, 27.0, 44.0, 52.0, 41.0, 40.0, 37.0, 28.0, 25.0, 28.0, 25.0, 23.0, 15.0, 18.0, 13.0, 11.0, 14.0, 5.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.040915012359619, -1.9760526418685913, -1.9111902713775635, -1.8463279008865356, -1.7814655303955078, -1.71660315990448, -1.6517407894134521, -1.5868782997131348, -1.5220160484313965, -1.4571536779403687, -1.3922913074493408, -1.327428936958313, -1.2625665664672852, -1.1977041959762573, -1.1328418254852295, -1.067979335784912, -1.0031169652938843, -0.9382545948028564, -0.8733922243118286, -0.8085298538208008, -0.743667483329773, -0.6788051128387451, -0.6139426827430725, -0.5490803122520447, -0.48421794176101685, -0.419355571269989, -0.3544932007789612, -0.28963080048561096, -0.22476842999458313, -0.1599060595035553, -0.09504365921020508, -0.030181288719177246, 0.034681081771850586, 0.09954345971345901, 0.16440583765506744, 0.22926822304725647, 0.2941305935382843, 0.35899296402931213, 0.42385536432266235, 0.4887177348136902, 0.553580105304718, 0.6184424757957458, 0.6833048462867737, 0.7481672763824463, 0.8130296468734741, 0.877892017364502, 0.9427543878555298, 1.0076167583465576, 1.0724791288375854, 1.1373414993286133, 1.2022038698196411, 1.267066240310669, 1.3319286108016968, 1.3967909812927246, 1.461653470993042, 1.5265157222747803, 1.5913782119750977, 1.6562405824661255, 1.7211029529571533, 1.7859653234481812, 1.850827693939209, 1.9156900644302368, 1.9805524349212646, 2.045414924621582, 2.1102771759033203]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 0.0, 4.0, 11.0, 21.0, 24.0, 28.0, 70.0, 74.0, 141.0, 206.0, 315.0, 492.0, 812.0, 1298.0, 2171.0, 3540.0, 5967.0, 10783.0, 21840.0, 52367.0, 132017.0, 278436.0, 288216.0, 142876.0, 56464.0, 23403.0, 11317.0, 6078.0, 3580.0, 2255.0, 1413.0, 852.0, 532.0, 345.0, 218.0, 122.0, 93.0, 52.0, 34.0, 27.0, 18.0, 14.0, 7.0, 6.0, 2.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.99951171875, -0.9692611694335938, -0.9390106201171875, -0.9087600708007812, -0.878509521484375, -0.8482589721679688, -0.8180084228515625, -0.7877578735351562, -0.75750732421875, -0.7272567749023438, -0.6970062255859375, -0.6667556762695312, -0.636505126953125, -0.6062545776367188, -0.5760040283203125, -0.5457534790039062, -0.5155029296875, -0.48525238037109375, -0.4550018310546875, -0.42475128173828125, -0.394500732421875, -0.36425018310546875, -0.3339996337890625, -0.30374908447265625, -0.27349853515625, -0.24324798583984375, -0.2129974365234375, -0.18274688720703125, -0.152496337890625, -0.12224578857421875, -0.0919952392578125, -0.06174468994140625, -0.031494140625, -0.00124359130859375, 0.0290069580078125, 0.05925750732421875, 0.089508056640625, 0.11975860595703125, 0.1500091552734375, 0.18025970458984375, 0.21051025390625, 0.24076080322265625, 0.2710113525390625, 0.30126190185546875, 0.331512451171875, 0.36176300048828125, 0.3920135498046875, 0.42226409912109375, 0.4525146484375, 0.48276519775390625, 0.5130157470703125, 0.5432662963867188, 0.573516845703125, 0.6037673950195312, 0.6340179443359375, 0.6642684936523438, 0.69451904296875, 0.7247695922851562, 0.7550201416015625, 0.7852706909179688, 0.815521240234375, 0.8457717895507812, 0.8760223388671875, 0.9062728881835938, 0.9365234375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 12.0, 7.0, 10.0, 13.0, 13.0, 22.0, 16.0, 30.0, 46.0, 29.0, 48.0, 58.0, 66.0, 63.0, 60.0, 64.0, 63.0, 60.0, 51.0, 48.0, 50.0, 34.0, 25.0, 26.0, 13.0, 19.0, 17.0, 12.0, 6.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.76611328125, -0.7469100952148438, -0.7277069091796875, -0.7085037231445312, -0.689300537109375, -0.6700973510742188, -0.6508941650390625, -0.6316909790039062, -0.61248779296875, -0.5932846069335938, -0.5740814208984375, -0.5548782348632812, -0.535675048828125, -0.5164718627929688, -0.4972686767578125, -0.47806549072265625, -0.4588623046875, -0.43965911865234375, -0.4204559326171875, -0.40125274658203125, -0.382049560546875, -0.36284637451171875, -0.3436431884765625, -0.32444000244140625, -0.30523681640625, -0.28603363037109375, -0.2668304443359375, -0.24762725830078125, -0.228424072265625, -0.20922088623046875, -0.1900177001953125, -0.17081451416015625, -0.151611328125, -0.13240814208984375, -0.1132049560546875, -0.09400177001953125, -0.074798583984375, -0.05559539794921875, -0.0363922119140625, -0.01718902587890625, 0.00201416015625, 0.02121734619140625, 0.0404205322265625, 0.05962371826171875, 0.078826904296875, 0.09803009033203125, 0.1172332763671875, 0.13643646240234375, 0.1556396484375, 0.17484283447265625, 0.1940460205078125, 0.21324920654296875, 0.232452392578125, 0.25165557861328125, 0.2708587646484375, 0.29006195068359375, 0.30926513671875, 0.32846832275390625, 0.3476715087890625, 0.36687469482421875, 0.386077880859375, 0.40528106689453125, 0.4244842529296875, 0.44368743896484375, 0.462890625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 11.0, 15.0, 27.0, 35.0, 45.0, 90.0, 174.0, 328.0, 820.0, 2250.0, 6544.0, 22098.0, 124805.0, 574988.0, 262160.0, 38665.0, 10001.0, 3313.0, 1196.0, 458.0, 212.0, 109.0, 58.0, 43.0, 25.0, 20.0, 13.0, 7.0, 8.0, 9.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.087890625, -2.025909423828125, -1.96392822265625, -1.901947021484375, -1.8399658203125, -1.777984619140625, -1.71600341796875, -1.654022216796875, -1.592041015625, -1.530059814453125, -1.46807861328125, -1.406097412109375, -1.3441162109375, -1.282135009765625, -1.22015380859375, -1.158172607421875, -1.09619140625, -1.034210205078125, -0.97222900390625, -0.910247802734375, -0.8482666015625, -0.786285400390625, -0.72430419921875, -0.662322998046875, -0.600341796875, -0.538360595703125, -0.47637939453125, -0.414398193359375, -0.3524169921875, -0.290435791015625, -0.22845458984375, -0.166473388671875, -0.1044921875, -0.042510986328125, 0.01947021484375, 0.081451416015625, 0.1434326171875, 0.205413818359375, 0.26739501953125, 0.329376220703125, 0.391357421875, 0.453338623046875, 0.51531982421875, 0.577301025390625, 0.6392822265625, 0.701263427734375, 0.76324462890625, 0.825225830078125, 0.88720703125, 0.949188232421875, 1.01116943359375, 1.073150634765625, 1.1351318359375, 1.197113037109375, 1.25909423828125, 1.321075439453125, 1.383056640625, 1.445037841796875, 1.50701904296875, 1.569000244140625, 1.6309814453125, 1.692962646484375, 1.75494384765625, 1.816925048828125, 1.87890625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 9.0, 5.0, 5.0, 7.0, 14.0, 13.0, 13.0, 33.0, 31.0, 47.0, 46.0, 52.0, 48.0, 74.0, 69.0, 71.0, 73.0, 57.0, 41.0, 47.0, 54.0, 40.0, 32.0, 27.0, 31.0, 18.0, 13.0, 6.0, 5.0, 4.0, 6.0, 7.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.306640625, -1.262725830078125, -1.21881103515625, -1.174896240234375, -1.1309814453125, -1.087066650390625, -1.04315185546875, -0.999237060546875, -0.955322265625, -0.911407470703125, -0.86749267578125, -0.823577880859375, -0.7796630859375, -0.735748291015625, -0.69183349609375, -0.647918701171875, -0.60400390625, -0.560089111328125, -0.51617431640625, -0.472259521484375, -0.4283447265625, -0.384429931640625, -0.34051513671875, -0.296600341796875, -0.252685546875, -0.208770751953125, -0.16485595703125, -0.120941162109375, -0.0770263671875, -0.033111572265625, 0.01080322265625, 0.054718017578125, 0.0986328125, 0.142547607421875, 0.18646240234375, 0.230377197265625, 0.2742919921875, 0.318206787109375, 0.36212158203125, 0.406036376953125, 0.449951171875, 0.493865966796875, 0.53778076171875, 0.581695556640625, 0.6256103515625, 0.669525146484375, 0.71343994140625, 0.757354736328125, 0.80126953125, 0.845184326171875, 0.88909912109375, 0.933013916015625, 0.9769287109375, 1.020843505859375, 1.06475830078125, 1.108673095703125, 1.152587890625, 1.196502685546875, 1.24041748046875, 1.284332275390625, 1.3282470703125, 1.372161865234375, 1.41607666015625, 1.459991455078125, 1.50390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 10.0, 17.0, 22.0, 30.0, 37.0, 64.0, 106.0, 159.0, 240.0, 370.0, 600.0, 1068.0, 1972.0, 4183.0, 10309.0, 37233.0, 262087.0, 577477.0, 117573.0, 21195.0, 6980.0, 3030.0, 1530.0, 852.0, 525.0, 312.0, 200.0, 124.0, 87.0, 39.0, 48.0, 23.0, 15.0, 8.0, 8.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8544921875, -0.8193359375, -0.7841796875, -0.7490234375, -0.7138671875, -0.6787109375, -0.6435546875, -0.6083984375, -0.5732421875, -0.5380859375, -0.5029296875, -0.4677734375, -0.4326171875, -0.3974609375, -0.3623046875, -0.3271484375, -0.2919921875, -0.2568359375, -0.2216796875, -0.1865234375, -0.1513671875, -0.1162109375, -0.0810546875, -0.0458984375, -0.0107421875, 0.0244140625, 0.0595703125, 0.0947265625, 0.1298828125, 0.1650390625, 0.2001953125, 0.2353515625, 0.2705078125, 0.3056640625, 0.3408203125, 0.3759765625, 0.4111328125, 0.4462890625, 0.4814453125, 0.5166015625, 0.5517578125, 0.5869140625, 0.6220703125, 0.6572265625, 0.6923828125, 0.7275390625, 0.7626953125, 0.7978515625, 0.8330078125, 0.8681640625, 0.9033203125, 0.9384765625, 0.9736328125, 1.0087890625, 1.0439453125, 1.0791015625, 1.1142578125, 1.1494140625, 1.1845703125, 1.2197265625, 1.2548828125, 1.2900390625, 1.3251953125, 1.3603515625, 1.3955078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 1.0, 12.0, 9.0, 22.0, 38.0, 72.0, 149.0, 250.0, 211.0, 117.0, 48.0, 27.0, 9.0, 6.0, 8.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00013017654418945312, -0.00012547709047794342, -0.00012077763676643372, -0.00011607818305492401, -0.0001113787293434143, -0.0001066792756319046, -0.0001019798219203949, -9.728036820888519e-05, -9.258091449737549e-05, -8.788146078586578e-05, -8.318200707435608e-05, -7.848255336284637e-05, -7.378309965133667e-05, -6.908364593982697e-05, -6.438419222831726e-05, -5.9684738516807556e-05, -5.498528480529785e-05, -5.028583109378815e-05, -4.558637738227844e-05, -4.088692367076874e-05, -3.618746995925903e-05, -3.148801624774933e-05, -2.6788562536239624e-05, -2.208910882472992e-05, -1.7389655113220215e-05, -1.269020140171051e-05, -7.990747690200806e-06, -3.291293978691101e-06, 1.4081597328186035e-06, 6.107613444328308e-06, 1.0807067155838013e-05, 1.5506520867347717e-05, 2.0205974578857422e-05, 2.4905428290367126e-05, 2.960488200187683e-05, 3.4304335713386536e-05, 3.900378942489624e-05, 4.3703243136405945e-05, 4.840269684791565e-05, 5.3102150559425354e-05, 5.780160427093506e-05, 6.250105798244476e-05, 6.720051169395447e-05, 7.189996540546417e-05, 7.659941911697388e-05, 8.129887282848358e-05, 8.599832653999329e-05, 9.069778025150299e-05, 9.53972339630127e-05, 0.0001000966876745224, 0.0001047961413860321, 0.00010949559509754181, 0.00011419504880905151, 0.00011889450252056122, 0.00012359395623207092, 0.00012829340994358063, 0.00013299286365509033, 0.00013769231736660004, 0.00014239177107810974, 0.00014709122478961945, 0.00015179067850112915, 0.00015649013221263885, 0.00016118958592414856, 0.00016588903963565826, 0.00017058849334716797]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 9.0, 5.0, 4.0, 11.0, 16.0, 17.0, 24.0, 37.0, 67.0, 121.0, 174.0, 251.0, 513.0, 899.0, 1677.0, 3334.0, 6983.0, 16080.0, 42554.0, 117000.0, 256113.0, 307215.0, 179881.0, 70418.0, 25142.0, 10023.0, 4714.0, 2378.0, 1239.0, 627.0, 407.0, 229.0, 129.0, 81.0, 47.0, 41.0, 24.0, 12.0, 12.0, 10.0, 6.0, 4.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.426513671875, -0.4124107360839844, -0.39830780029296875, -0.3842048645019531, -0.3701019287109375, -0.3559989929199219, -0.34189605712890625, -0.3277931213378906, -0.313690185546875, -0.2995872497558594, -0.28548431396484375, -0.2713813781738281, -0.2572784423828125, -0.24317550659179688, -0.22907257080078125, -0.21496963500976562, -0.20086669921875, -0.18676376342773438, -0.17266082763671875, -0.15855789184570312, -0.1444549560546875, -0.13035202026367188, -0.11624908447265625, -0.10214614868164062, -0.088043212890625, -0.07394027709960938, -0.05983734130859375, -0.045734405517578125, -0.0316314697265625, -0.017528533935546875, -0.00342559814453125, 0.010677337646484375, 0.0247802734375, 0.038883209228515625, 0.05298614501953125, 0.06708908081054688, 0.0811920166015625, 0.09529495239257812, 0.10939788818359375, 0.12350082397460938, 0.137603759765625, 0.15170669555664062, 0.16580963134765625, 0.17991256713867188, 0.1940155029296875, 0.20811843872070312, 0.22222137451171875, 0.23632431030273438, 0.25042724609375, 0.2645301818847656, 0.27863311767578125, 0.2927360534667969, 0.3068389892578125, 0.3209419250488281, 0.33504486083984375, 0.3491477966308594, 0.363250732421875, 0.3773536682128906, 0.39145660400390625, 0.4055595397949219, 0.4196624755859375, 0.4337654113769531, 0.44786834716796875, 0.4619712829589844, 0.47607421875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 5.0, 11.0, 14.0, 16.0, 22.0, 22.0, 24.0, 38.0, 46.0, 62.0, 45.0, 66.0, 83.0, 68.0, 68.0, 63.0, 67.0, 53.0, 37.0, 38.0, 20.0, 27.0, 15.0, 21.0, 12.0, 11.0, 6.0, 7.0, 6.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.3369140625, -0.327117919921875, -0.31732177734375, -0.307525634765625, -0.2977294921875, -0.287933349609375, -0.27813720703125, -0.268341064453125, -0.258544921875, -0.248748779296875, -0.23895263671875, -0.229156494140625, -0.2193603515625, -0.209564208984375, -0.19976806640625, -0.189971923828125, -0.18017578125, -0.170379638671875, -0.16058349609375, -0.150787353515625, -0.1409912109375, -0.131195068359375, -0.12139892578125, -0.111602783203125, -0.101806640625, -0.092010498046875, -0.08221435546875, -0.072418212890625, -0.0626220703125, -0.052825927734375, -0.04302978515625, -0.033233642578125, -0.0234375, -0.013641357421875, -0.00384521484375, 0.005950927734375, 0.0157470703125, 0.025543212890625, 0.03533935546875, 0.045135498046875, 0.054931640625, 0.064727783203125, 0.07452392578125, 0.084320068359375, 0.0941162109375, 0.103912353515625, 0.11370849609375, 0.123504638671875, 0.13330078125, 0.143096923828125, 0.15289306640625, 0.162689208984375, 0.1724853515625, 0.182281494140625, 0.19207763671875, 0.201873779296875, 0.211669921875, 0.221466064453125, 0.23126220703125, 0.241058349609375, 0.2508544921875, 0.260650634765625, 0.27044677734375, 0.280242919921875, 0.2900390625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 17.0, 119.0, 374.0, 386.0, 97.0, 15.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9712295532226562, -3.5269527435302734, -3.0826761722564697, -2.638399362564087, -2.194122791290283, -1.7498459815979004, -1.3055691719055176, -0.8612926006317139, -0.41701579093933105, 0.027260929346084595, 0.47153764963150024, 0.9158143997192383, 1.3600910902023315, 1.8043677806854248, 2.2486445903778076, 2.6929211616516113, 3.137197971343994, 3.581474781036377, 4.02575159072876, 4.470027923583984, 4.914304733276367, 5.35858154296875, 5.802858352661133, 6.247135162353516, 6.691411972045898, 7.135688781738281, 7.579965591430664, 8.024242401123047, 8.46851921081543, 8.912796020507812, 9.357072830200195, 9.801348686218262, 10.245625495910645, 10.689902305603027, 11.13417911529541, 11.578455924987793, 12.022732734680176, 12.467008590698242, 12.911285400390625, 13.355562210083008, 13.79983901977539, 14.244115829467773, 14.688392639160156, 15.132669448852539, 15.576946258544922, 16.021223068237305, 16.465499877929688, 16.90977668762207, 17.354053497314453, 17.798330307006836, 18.24260711669922, 18.6868839263916, 19.131160736083984, 19.575437545776367, 20.01971435546875, 20.463991165161133, 20.908266067504883, 21.352542877197266, 21.79681968688965, 22.24109649658203, 22.685373306274414, 23.129650115966797, 23.57392692565918, 24.018203735351562, 24.462480545043945]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 7.0, 6.0, 10.0, 10.0, 16.0, 17.0, 14.0, 22.0, 24.0, 26.0, 36.0, 30.0, 44.0, 46.0, 43.0, 42.0, 36.0, 48.0, 44.0, 49.0, 50.0, 37.0, 35.0, 39.0, 36.0, 22.0, 21.0, 38.0, 28.0, 31.0, 17.0, 17.0, 13.0, 10.0, 9.0, 4.0, 9.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.0581321716308594, -2.966860771179199, -2.87558913230896, -2.7843177318573, -2.6930460929870605, -2.6017746925354004, -2.5105032920837402, -2.41923189163208, -2.327960252761841, -2.2366888523101807, -2.1454172134399414, -2.0541458129882812, -1.9628742933273315, -1.8716027736663818, -1.7803313732147217, -1.689059853553772, -1.5977883338928223, -1.5065168142318726, -1.4152452945709229, -1.3239738941192627, -1.232702374458313, -1.1414308547973633, -1.0501594543457031, -0.9588879346847534, -0.8676164150238037, -0.776344895362854, -0.6850734353065491, -0.5938019752502441, -0.5025304555892944, -0.4112589657306671, -0.3199874758720398, -0.22871601581573486, -0.13744449615478516, -0.04617300629615784, 0.04509848356246948, 0.1363699734210968, 0.22764146327972412, 0.31891295313835144, 0.41018444299697876, 0.5014559030532837, 0.5927274227142334, 0.6839989423751831, 0.775270402431488, 0.866541862487793, 0.9578133821487427, 1.0490849018096924, 1.1403563022613525, 1.2316278219223022, 1.322899341583252, 1.4141708612442017, 1.5054423809051514, 1.5967137813568115, 1.6879853010177612, 1.779256820678711, 1.870528221130371, 1.9617997407913208, 2.0530712604522705, 2.1443426609039307, 2.23561429977417, 2.32688570022583, 2.4181571006774902, 2.5094287395477295, 2.6007001399993896, 2.691971778869629, 2.783243179321289]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 7.0, 7.0, 9.0, 18.0, 22.0, 40.0, 67.0, 81.0, 135.0, 271.0, 467.0, 972.0, 2205.0, 5246.0, 15284.0, 55940.0, 292969.0, 1629999.0, 1761717.0, 338701.0, 63575.0, 16982.0, 5579.0, 2080.0, 941.0, 429.0, 219.0, 115.0, 65.0, 44.0, 40.0, 19.0, 13.0, 13.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88916015625, -0.863037109375, -0.8369140625, -0.810791015625, -0.78466796875, -0.758544921875, -0.732421875, -0.706298828125, -0.68017578125, -0.654052734375, -0.6279296875, -0.601806640625, -0.57568359375, -0.549560546875, -0.5234375, -0.497314453125, -0.47119140625, -0.445068359375, -0.4189453125, -0.392822265625, -0.36669921875, -0.340576171875, -0.314453125, -0.288330078125, -0.26220703125, -0.236083984375, -0.2099609375, -0.183837890625, -0.15771484375, -0.131591796875, -0.10546875, -0.079345703125, -0.05322265625, -0.027099609375, -0.0009765625, 0.025146484375, 0.05126953125, 0.077392578125, 0.103515625, 0.129638671875, 0.15576171875, 0.181884765625, 0.2080078125, 0.234130859375, 0.26025390625, 0.286376953125, 0.3125, 0.338623046875, 0.36474609375, 0.390869140625, 0.4169921875, 0.443115234375, 0.46923828125, 0.495361328125, 0.521484375, 0.547607421875, 0.57373046875, 0.599853515625, 0.6259765625, 0.652099609375, 0.67822265625, 0.704345703125, 0.73046875, 0.756591796875, 0.78271484375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 12.0, 13.0, 14.0, 13.0, 17.0, 20.0, 29.0, 39.0, 41.0, 61.0, 54.0, 66.0, 50.0, 65.0, 68.0, 62.0, 55.0, 65.0, 38.0, 36.0, 38.0, 28.0, 30.0, 24.0, 19.0, 11.0, 8.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.77734375, -0.7578659057617188, -0.7383880615234375, -0.7189102172851562, -0.699432373046875, -0.6799545288085938, -0.6604766845703125, -0.6409988403320312, -0.62152099609375, -0.6020431518554688, -0.5825653076171875, -0.5630874633789062, -0.543609619140625, -0.5241317749023438, -0.5046539306640625, -0.48517608642578125, -0.4656982421875, -0.44622039794921875, -0.4267425537109375, -0.40726470947265625, -0.387786865234375, -0.36830902099609375, -0.3488311767578125, -0.32935333251953125, -0.30987548828125, -0.29039764404296875, -0.2709197998046875, -0.25144195556640625, -0.231964111328125, -0.21248626708984375, -0.1930084228515625, -0.17353057861328125, -0.154052734375, -0.13457489013671875, -0.1150970458984375, -0.09561920166015625, -0.076141357421875, -0.05666351318359375, -0.0371856689453125, -0.01770782470703125, 0.00177001953125, 0.02124786376953125, 0.0407257080078125, 0.06020355224609375, 0.079681396484375, 0.09915924072265625, 0.1186370849609375, 0.13811492919921875, 0.1575927734375, 0.17707061767578125, 0.1965484619140625, 0.21602630615234375, 0.235504150390625, 0.25498199462890625, 0.2744598388671875, 0.29393768310546875, 0.31341552734375, 0.33289337158203125, 0.3523712158203125, 0.37184906005859375, 0.391326904296875, 0.41080474853515625, 0.4302825927734375, 0.44976043701171875, 0.46923828125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 10.0, 5.0, 20.0, 26.0, 37.0, 77.0, 103.0, 216.0, 430.0, 1122.0, 3098.0, 11399.0, 51277.0, 265816.0, 1199279.0, 1888550.0, 617468.0, 121108.0, 24770.0, 6133.0, 1827.0, 757.0, 324.0, 170.0, 102.0, 52.0, 44.0, 22.0, 13.0, 10.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.93994140625, -0.9088821411132812, -0.8778228759765625, -0.8467636108398438, -0.815704345703125, -0.7846450805664062, -0.7535858154296875, -0.7225265502929688, -0.69146728515625, -0.6604080200195312, -0.6293487548828125, -0.5982894897460938, -0.567230224609375, -0.5361709594726562, -0.5051116943359375, -0.47405242919921875, -0.4429931640625, -0.41193389892578125, -0.3808746337890625, -0.34981536865234375, -0.318756103515625, -0.28769683837890625, -0.2566375732421875, -0.22557830810546875, -0.19451904296875, -0.16345977783203125, -0.1324005126953125, -0.10134124755859375, -0.070281982421875, -0.03922271728515625, -0.0081634521484375, 0.02289581298828125, 0.053955078125, 0.08501434326171875, 0.1160736083984375, 0.14713287353515625, 0.178192138671875, 0.20925140380859375, 0.2403106689453125, 0.27136993408203125, 0.30242919921875, 0.33348846435546875, 0.3645477294921875, 0.39560699462890625, 0.426666259765625, 0.45772552490234375, 0.4887847900390625, 0.5198440551757812, 0.5509033203125, 0.5819625854492188, 0.6130218505859375, 0.6440811157226562, 0.675140380859375, 0.7061996459960938, 0.7372589111328125, 0.7683181762695312, 0.79937744140625, 0.8304367065429688, 0.8614959716796875, 0.8925552368164062, 0.923614501953125, 0.9546737670898438, 0.9857330322265625, 1.0167922973632812, 1.0478515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 0.0, 2.0, 4.0, 6.0, 14.0, 17.0, 14.0, 27.0, 30.0, 36.0, 47.0, 72.0, 83.0, 93.0, 140.0, 166.0, 191.0, 237.0, 241.0, 298.0, 315.0, 315.0, 289.0, 261.0, 236.0, 186.0, 163.0, 136.0, 102.0, 85.0, 58.0, 48.0, 37.0, 25.0, 21.0, 20.0, 12.0, 10.0, 11.0, 10.0, 6.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.56640625, -0.5468902587890625, -0.527374267578125, -0.5078582763671875, -0.48834228515625, -0.4688262939453125, -0.449310302734375, -0.4297943115234375, -0.4102783203125, -0.3907623291015625, -0.371246337890625, -0.3517303466796875, -0.33221435546875, -0.3126983642578125, -0.293182373046875, -0.2736663818359375, -0.254150390625, -0.2346343994140625, -0.215118408203125, -0.1956024169921875, -0.17608642578125, -0.1565704345703125, -0.137054443359375, -0.1175384521484375, -0.0980224609375, -0.0785064697265625, -0.058990478515625, -0.0394744873046875, -0.01995849609375, -0.0004425048828125, 0.019073486328125, 0.0385894775390625, 0.05810546875, 0.0776214599609375, 0.097137451171875, 0.1166534423828125, 0.13616943359375, 0.1556854248046875, 0.175201416015625, 0.1947174072265625, 0.2142333984375, 0.2337493896484375, 0.253265380859375, 0.2727813720703125, 0.29229736328125, 0.3118133544921875, 0.331329345703125, 0.3508453369140625, 0.370361328125, 0.3898773193359375, 0.409393310546875, 0.4289093017578125, 0.44842529296875, 0.4679412841796875, 0.487457275390625, 0.5069732666015625, 0.5264892578125, 0.5460052490234375, 0.565521240234375, 0.5850372314453125, 0.60455322265625, 0.6240692138671875, 0.643585205078125, 0.6631011962890625, 0.6826171875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 17.0, 52.0, 150.0, 255.0, 299.0, 169.0, 51.0, 15.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.94739055633545, -15.616182327270508, -15.284974098205566, -14.953764915466309, -14.622556686401367, -14.291348457336426, -13.960140228271484, -13.628931045532227, -13.297722816467285, -12.966514587402344, -12.635306358337402, -12.304097175598145, -11.972888946533203, -11.641680717468262, -11.31047248840332, -10.979263305664062, -10.648056030273438, -10.316847801208496, -9.985639572143555, -9.654430389404297, -9.323222160339355, -8.992013931274414, -8.660805702209473, -8.329597473144531, -7.998388290405273, -7.667180061340332, -7.335971355438232, -7.004763126373291, -6.673554420471191, -6.34234619140625, -6.011137962341309, -5.679929256439209, -5.348721027374268, -5.017512798309326, -4.686304092407227, -4.355095863342285, -4.0238871574401855, -3.692678928375244, -3.3614704608917236, -3.030261993408203, -2.6990535259246826, -2.367845058441162, -2.0366365909576416, -1.7054282426834106, -1.3742197751998901, -1.0430113077163696, -0.7118029594421387, -0.38059449195861816, -0.049386024475097656, 0.28182241320610046, 0.6130308508872986, 0.9442392587661743, 1.2754477262496948, 1.6066561937332153, 1.9378645420074463, 2.269073009490967, 2.6002814769744873, 2.931489944458008, 3.2626984119415283, 3.593906879425049, 3.9251151084899902, 4.25632381439209, 4.587532043457031, 4.918740272521973, 5.249948978424072]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 8.0, 1.0, 6.0, 7.0, 14.0, 15.0, 14.0, 19.0, 30.0, 19.0, 23.0, 40.0, 30.0, 27.0, 42.0, 41.0, 61.0, 42.0, 52.0, 55.0, 33.0, 43.0, 46.0, 35.0, 42.0, 38.0, 33.0, 24.0, 26.0, 30.0, 17.0, 12.0, 23.0, 12.0, 12.0, 11.0, 7.0, 3.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.85854172706604, -2.7727255821228027, -2.6869096755981445, -2.6010935306549072, -2.51527738571167, -2.4294614791870117, -2.3436453342437744, -2.257829189300537, -2.172013282775879, -2.0861971378326416, -2.0003812313079834, -1.914565086364746, -1.8287489414215088, -1.742932915687561, -1.6571168899536133, -1.571300745010376, -1.4854846000671387, -1.399668574333191, -1.3138524293899536, -1.2280364036560059, -1.1422202587127686, -1.0564042329788208, -0.970588207244873, -0.8847721219062805, -0.798956036567688, -0.7131399512290955, -0.6273238658905029, -0.5415078401565552, -0.45569175481796265, -0.3698756694793701, -0.28405964374542236, -0.19824355840682983, -0.1124277114868164, -0.02661164104938507, 0.059204429388046265, 0.1450204849243164, 0.23083657026290894, 0.31665265560150146, 0.4024686813354492, 0.48828476667404175, 0.5741008520126343, 0.6599169373512268, 0.7457330226898193, 0.8315490484237671, 0.9173651337623596, 1.0031812191009521, 1.0889972448349, 1.1748132705688477, 1.260629415512085, 1.3464454412460327, 1.43226158618927, 1.5180776119232178, 1.603893756866455, 1.6897097826004028, 1.7755258083343506, 1.861341953277588, 1.9471579790115356, 2.0329740047454834, 2.1187901496887207, 2.204606056213379, 2.290422201156616, 2.3762383460998535, 2.4620542526245117, 2.547870397567749, 2.6336865425109863]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 16.0, 13.0, 28.0, 39.0, 36.0, 72.0, 104.0, 160.0, 269.0, 514.0, 753.0, 1337.0, 2448.0, 4249.0, 7572.0, 13672.0, 24515.0, 45834.0, 82511.0, 142633.0, 204551.0, 201290.0, 138494.0, 79842.0, 43692.0, 23587.0, 13118.0, 7290.0, 4071.0, 2347.0, 1378.0, 817.0, 464.0, 323.0, 173.0, 102.0, 61.0, 42.0, 40.0, 22.0, 23.0, 9.0, 8.0, 2.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.8759765625, -0.850189208984375, -0.82440185546875, -0.798614501953125, -0.7728271484375, -0.747039794921875, -0.72125244140625, -0.695465087890625, -0.669677734375, -0.643890380859375, -0.61810302734375, -0.592315673828125, -0.5665283203125, -0.540740966796875, -0.51495361328125, -0.489166259765625, -0.46337890625, -0.437591552734375, -0.41180419921875, -0.386016845703125, -0.3602294921875, -0.334442138671875, -0.30865478515625, -0.282867431640625, -0.257080078125, -0.231292724609375, -0.20550537109375, -0.179718017578125, -0.1539306640625, -0.128143310546875, -0.10235595703125, -0.076568603515625, -0.05078125, -0.024993896484375, 0.00079345703125, 0.026580810546875, 0.0523681640625, 0.078155517578125, 0.10394287109375, 0.129730224609375, 0.155517578125, 0.181304931640625, 0.20709228515625, 0.232879638671875, 0.2586669921875, 0.284454345703125, 0.31024169921875, 0.336029052734375, 0.36181640625, 0.387603759765625, 0.41339111328125, 0.439178466796875, 0.4649658203125, 0.490753173828125, 0.51654052734375, 0.542327880859375, 0.568115234375, 0.593902587890625, 0.61968994140625, 0.645477294921875, 0.6712646484375, 0.697052001953125, 0.72283935546875, 0.748626708984375, 0.7744140625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 6.0, 8.0, 12.0, 15.0, 15.0, 13.0, 23.0, 33.0, 22.0, 47.0, 56.0, 63.0, 62.0, 64.0, 69.0, 59.0, 52.0, 58.0, 59.0, 35.0, 48.0, 38.0, 33.0, 27.0, 21.0, 17.0, 12.0, 10.0, 5.0, 7.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.72412109375, -0.7055587768554688, -0.6869964599609375, -0.6684341430664062, -0.649871826171875, -0.6313095092773438, -0.6127471923828125, -0.5941848754882812, -0.57562255859375, -0.5570602416992188, -0.5384979248046875, -0.5199356079101562, -0.501373291015625, -0.48281097412109375, -0.4642486572265625, -0.44568634033203125, -0.4271240234375, -0.40856170654296875, -0.3899993896484375, -0.37143707275390625, -0.352874755859375, -0.33431243896484375, -0.3157501220703125, -0.29718780517578125, -0.27862548828125, -0.26006317138671875, -0.2415008544921875, -0.22293853759765625, -0.204376220703125, -0.18581390380859375, -0.1672515869140625, -0.14868927001953125, -0.130126953125, -0.11156463623046875, -0.0930023193359375, -0.07444000244140625, -0.055877685546875, -0.03731536865234375, -0.0187530517578125, -0.00019073486328125, 0.01837158203125, 0.03693389892578125, 0.0554962158203125, 0.07405853271484375, 0.092620849609375, 0.11118316650390625, 0.1297454833984375, 0.14830780029296875, 0.1668701171875, 0.18543243408203125, 0.2039947509765625, 0.22255706787109375, 0.241119384765625, 0.25968170166015625, 0.2782440185546875, 0.29680633544921875, 0.31536865234375, 0.33393096923828125, 0.3524932861328125, 0.37105560302734375, 0.389617919921875, 0.40818023681640625, 0.4267425537109375, 0.44530487060546875, 0.4638671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 10.0, 9.0, 8.0, 11.0, 23.0, 33.0, 49.0, 63.0, 83.0, 153.0, 264.0, 455.0, 858.0, 1714.0, 3665.0, 8185.0, 18739.0, 42167.0, 93771.0, 193242.0, 277396.0, 210993.0, 106892.0, 49054.0, 21955.0, 9957.0, 4418.0, 2066.0, 1031.0, 512.0, 278.0, 165.0, 102.0, 68.0, 45.0, 33.0, 24.0, 18.0, 16.0, 9.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1630859375, -1.126251220703125, -1.08941650390625, -1.052581787109375, -1.0157470703125, -0.978912353515625, -0.94207763671875, -0.905242919921875, -0.868408203125, -0.831573486328125, -0.79473876953125, -0.757904052734375, -0.7210693359375, -0.684234619140625, -0.64739990234375, -0.610565185546875, -0.57373046875, -0.536895751953125, -0.50006103515625, -0.463226318359375, -0.4263916015625, -0.389556884765625, -0.35272216796875, -0.315887451171875, -0.279052734375, -0.242218017578125, -0.20538330078125, -0.168548583984375, -0.1317138671875, -0.094879150390625, -0.05804443359375, -0.021209716796875, 0.015625, 0.052459716796875, 0.08929443359375, 0.126129150390625, 0.1629638671875, 0.199798583984375, 0.23663330078125, 0.273468017578125, 0.310302734375, 0.347137451171875, 0.38397216796875, 0.420806884765625, 0.4576416015625, 0.494476318359375, 0.53131103515625, 0.568145751953125, 0.60498046875, 0.641815185546875, 0.67864990234375, 0.715484619140625, 0.7523193359375, 0.789154052734375, 0.82598876953125, 0.862823486328125, 0.899658203125, 0.936492919921875, 0.97332763671875, 1.010162353515625, 1.0469970703125, 1.083831787109375, 1.12066650390625, 1.157501220703125, 1.1943359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 7.0, 4.0, 4.0, 5.0, 9.0, 9.0, 12.0, 17.0, 12.0, 16.0, 22.0, 20.0, 28.0, 24.0, 32.0, 33.0, 36.0, 42.0, 38.0, 42.0, 51.0, 58.0, 41.0, 60.0, 29.0, 46.0, 38.0, 35.0, 34.0, 29.0, 25.0, 21.0, 24.0, 15.0, 21.0, 19.0, 15.0, 9.0, 9.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.34765625, -1.3082122802734375, -1.268768310546875, -1.2293243408203125, -1.18988037109375, -1.1504364013671875, -1.110992431640625, -1.0715484619140625, -1.0321044921875, -0.9926605224609375, -0.953216552734375, -0.9137725830078125, -0.87432861328125, -0.8348846435546875, -0.795440673828125, -0.7559967041015625, -0.716552734375, -0.6771087646484375, -0.637664794921875, -0.5982208251953125, -0.55877685546875, -0.5193328857421875, -0.479888916015625, -0.4404449462890625, -0.4010009765625, -0.3615570068359375, -0.322113037109375, -0.2826690673828125, -0.24322509765625, -0.2037811279296875, -0.164337158203125, -0.1248931884765625, -0.08544921875, -0.0460052490234375, -0.006561279296875, 0.0328826904296875, 0.07232666015625, 0.1117706298828125, 0.151214599609375, 0.1906585693359375, 0.2301025390625, 0.2695465087890625, 0.308990478515625, 0.3484344482421875, 0.38787841796875, 0.4273223876953125, 0.466766357421875, 0.5062103271484375, 0.545654296875, 0.5850982666015625, 0.624542236328125, 0.6639862060546875, 0.70343017578125, 0.7428741455078125, 0.782318115234375, 0.8217620849609375, 0.8612060546875, 0.9006500244140625, 0.940093994140625, 0.9795379638671875, 1.01898193359375, 1.0584259033203125, 1.097869873046875, 1.1373138427734375, 1.1767578125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 12.0, 11.0, 12.0, 14.0, 19.0, 28.0, 49.0, 61.0, 70.0, 110.0, 163.0, 214.0, 363.0, 521.0, 944.0, 1608.0, 2933.0, 9955.0, 99422.0, 620481.0, 278614.0, 23408.0, 4338.0, 2011.0, 1145.0, 697.0, 419.0, 314.0, 179.0, 120.0, 82.0, 71.0, 47.0, 27.0, 25.0, 16.0, 13.0, 13.0, 8.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.658203125, -1.607513427734375, -1.55682373046875, -1.506134033203125, -1.4554443359375, -1.404754638671875, -1.35406494140625, -1.303375244140625, -1.252685546875, -1.201995849609375, -1.15130615234375, -1.100616455078125, -1.0499267578125, -0.999237060546875, -0.94854736328125, -0.897857666015625, -0.84716796875, -0.796478271484375, -0.74578857421875, -0.695098876953125, -0.6444091796875, -0.593719482421875, -0.54302978515625, -0.492340087890625, -0.441650390625, -0.390960693359375, -0.34027099609375, -0.289581298828125, -0.2388916015625, -0.188201904296875, -0.13751220703125, -0.086822509765625, -0.0361328125, 0.014556884765625, 0.06524658203125, 0.115936279296875, 0.1666259765625, 0.217315673828125, 0.26800537109375, 0.318695068359375, 0.369384765625, 0.420074462890625, 0.47076416015625, 0.521453857421875, 0.5721435546875, 0.622833251953125, 0.67352294921875, 0.724212646484375, 0.77490234375, 0.825592041015625, 0.87628173828125, 0.926971435546875, 0.9776611328125, 1.028350830078125, 1.07904052734375, 1.129730224609375, 1.180419921875, 1.231109619140625, 1.28179931640625, 1.332489013671875, 1.3831787109375, 1.433868408203125, 1.48455810546875, 1.535247802734375, 1.5859375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 16.0, 23.0, 50.0, 89.0, 147.0, 227.0, 187.0, 133.0, 59.0, 27.0, 17.0, 12.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014281272888183594, -0.0001352168619632721, -0.00012762099504470825, -0.00012002512812614441, -0.00011242926120758057, -0.00010483339428901672, -9.723752737045288e-05, -8.964166045188904e-05, -8.20457935333252e-05, -7.444992661476135e-05, -6.685405969619751e-05, -5.925819277763367e-05, -5.1662325859069824e-05, -4.406645894050598e-05, -3.647059202194214e-05, -2.8874725103378296e-05, -2.1278858184814453e-05, -1.368299126625061e-05, -6.087124347686768e-06, 1.5087425708770752e-06, 9.104609489440918e-06, 1.670047640800476e-05, 2.4296343326568604e-05, 3.1892210245132446e-05, 3.948807716369629e-05, 4.708394408226013e-05, 5.4679811000823975e-05, 6.227567791938782e-05, 6.987154483795166e-05, 7.74674117565155e-05, 8.506327867507935e-05, 9.265914559364319e-05, 0.00010025501251220703, 0.00010785087943077087, 0.00011544674634933472, 0.00012304261326789856, 0.0001306384801864624, 0.00013823434710502625, 0.0001458302140235901, 0.00015342608094215393, 0.00016102194786071777, 0.00016861781477928162, 0.00017621368169784546, 0.0001838095486164093, 0.00019140541553497314, 0.000199001282453537, 0.00020659714937210083, 0.00021419301629066467, 0.00022178888320922852, 0.00022938475012779236, 0.0002369806170463562, 0.00024457648396492004, 0.0002521723508834839, 0.00025976821780204773, 0.00026736408472061157, 0.0002749599516391754, 0.00028255581855773926, 0.0002901516854763031, 0.00029774755239486694, 0.0003053434193134308, 0.00031293928623199463, 0.00032053515315055847, 0.0003281310200691223, 0.00033572688698768616, 0.00034332275390625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 7.0, 7.0, 13.0, 16.0, 20.0, 31.0, 42.0, 63.0, 88.0, 146.0, 236.0, 369.0, 671.0, 1259.0, 2356.0, 4757.0, 9631.0, 19288.0, 38289.0, 72851.0, 121696.0, 171690.0, 191928.0, 164968.0, 113287.0, 66132.0, 34464.0, 17180.0, 8392.0, 4065.0, 2053.0, 1094.0, 575.0, 324.0, 216.0, 114.0, 87.0, 45.0, 39.0, 20.0, 17.0, 7.0, 15.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356689453125, -0.3460197448730469, -0.33535003662109375, -0.3246803283691406, -0.3140106201171875, -0.3033409118652344, -0.29267120361328125, -0.2820014953613281, -0.271331787109375, -0.2606620788574219, -0.24999237060546875, -0.23932266235351562, -0.2286529541015625, -0.21798324584960938, -0.20731353759765625, -0.19664382934570312, -0.18597412109375, -0.17530441284179688, -0.16463470458984375, -0.15396499633789062, -0.1432952880859375, -0.13262557983398438, -0.12195587158203125, -0.11128616333007812, -0.100616455078125, -0.08994674682617188, -0.07927703857421875, -0.06860733032226562, -0.0579376220703125, -0.047267913818359375, -0.03659820556640625, -0.025928497314453125, -0.0152587890625, -0.004589080810546875, 0.00608062744140625, 0.016750335693359375, 0.0274200439453125, 0.038089752197265625, 0.04875946044921875, 0.059429168701171875, 0.070098876953125, 0.08076858520507812, 0.09143829345703125, 0.10210800170898438, 0.1127777099609375, 0.12344741821289062, 0.13411712646484375, 0.14478683471679688, 0.15545654296875, 0.16612625122070312, 0.17679595947265625, 0.18746566772460938, 0.1981353759765625, 0.20880508422851562, 0.21947479248046875, 0.23014450073242188, 0.240814208984375, 0.2514839172363281, 0.26215362548828125, 0.2728233337402344, 0.2834930419921875, 0.2941627502441406, 0.30483245849609375, 0.3155021667480469, 0.326171875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 10.0, 4.0, 7.0, 10.0, 10.0, 14.0, 8.0, 9.0, 10.0, 11.0, 22.0, 22.0, 19.0, 20.0, 22.0, 39.0, 32.0, 42.0, 38.0, 38.0, 48.0, 38.0, 35.0, 34.0, 47.0, 43.0, 38.0, 39.0, 32.0, 37.0, 21.0, 30.0, 26.0, 21.0, 19.0, 14.0, 16.0, 13.0, 11.0, 11.0, 9.0, 3.0, 6.0, 4.0, 5.0, 2.0, 6.0, 5.0, 2.0, 3.0, 0.0, 4.0, 0.0, 3.0], "bins": [-0.240234375, -0.2327423095703125, -0.225250244140625, -0.2177581787109375, -0.21026611328125, -0.2027740478515625, -0.195281982421875, -0.1877899169921875, -0.1802978515625, -0.1728057861328125, -0.165313720703125, -0.1578216552734375, -0.15032958984375, -0.1428375244140625, -0.135345458984375, -0.1278533935546875, -0.120361328125, -0.1128692626953125, -0.105377197265625, -0.0978851318359375, -0.09039306640625, -0.0829010009765625, -0.075408935546875, -0.0679168701171875, -0.0604248046875, -0.0529327392578125, -0.045440673828125, -0.0379486083984375, -0.03045654296875, -0.0229644775390625, -0.015472412109375, -0.0079803466796875, -0.00048828125, 0.0070037841796875, 0.014495849609375, 0.0219879150390625, 0.02947998046875, 0.0369720458984375, 0.044464111328125, 0.0519561767578125, 0.0594482421875, 0.0669403076171875, 0.074432373046875, 0.0819244384765625, 0.08941650390625, 0.0969085693359375, 0.104400634765625, 0.1118927001953125, 0.119384765625, 0.1268768310546875, 0.134368896484375, 0.1418609619140625, 0.14935302734375, 0.1568450927734375, 0.164337158203125, 0.1718292236328125, 0.1793212890625, 0.1868133544921875, 0.194305419921875, 0.2017974853515625, 0.20928955078125, 0.2167816162109375, 0.224273681640625, 0.2317657470703125, 0.2392578125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 21.0, 52.0, 155.0, 216.0, 277.0, 188.0, 63.0, 25.0, 10.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-17.807525634765625, -17.472366333007812, -17.137208938598633, -16.80204963684082, -16.466890335083008, -16.131732940673828, -15.796573638916016, -15.46141529083252, -15.126256942749023, -14.791098594665527, -14.455939292907715, -14.120780944824219, -13.785622596740723, -13.450464248657227, -13.115304946899414, -12.780146598815918, -12.444987297058105, -12.10982894897461, -11.774669647216797, -11.4395112991333, -11.104352951049805, -10.769193649291992, -10.434035301208496, -10.098876953125, -9.763717651367188, -9.428559303283691, -9.093400001525879, -8.758241653442383, -8.423083305358887, -8.08792495727539, -7.752765655517578, -7.417607307434082, -7.082449436187744, -6.74729061126709, -6.412132263183594, -6.0769734382629395, -5.741814613342285, -5.406656265258789, -5.071497440338135, -4.7363386154174805, -4.401180267333984, -4.06602144241333, -3.730863094329834, -3.3957042694091797, -3.0605456829071045, -2.7253870964050293, -2.390228271484375, -2.0550696849823, -1.7199110984802246, -1.3847525119781494, -1.0495938062667847, -0.7144351005554199, -0.3792765140533447, -0.04411792755126953, 0.29104089736938477, 0.62619948387146, 0.9613580703735352, 1.2965166568756104, 1.631675362586975, 1.9668340682983398, 2.301992654800415, 2.6371512413024902, 2.9723100662231445, 3.3074686527252197, 3.642627239227295]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 3.0, 2.0, 5.0, 5.0, 9.0, 11.0, 12.0, 9.0, 13.0, 14.0, 16.0, 16.0, 24.0, 26.0, 36.0, 28.0, 42.0, 38.0, 35.0, 45.0, 41.0, 39.0, 39.0, 34.0, 28.0, 47.0, 47.0, 27.0, 28.0, 25.0, 36.0, 28.0, 22.0, 23.0, 24.0, 14.0, 18.0, 17.0, 15.0, 16.0, 2.0, 8.0, 9.0, 7.0, 6.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.206321954727173, -3.1024374961853027, -2.9985530376434326, -2.8946683406829834, -2.7907838821411133, -2.686899423599243, -2.583014965057373, -2.479130268096924, -2.3752458095550537, -2.2713613510131836, -2.1674768924713135, -2.0635921955108643, -1.9597077369689941, -1.855823278427124, -1.751938819885254, -1.6480542421340942, -1.5441697835922241, -1.440285325050354, -1.3364007472991943, -1.2325162887573242, -1.1286317110061646, -1.0247472524642944, -0.9208627343177795, -0.8169782161712646, -0.7130936980247498, -0.6092091798782349, -0.50532466173172, -0.40144017338752747, -0.2975556552410126, -0.19367116689682007, -0.08978664875030518, 0.014097869396209717, 0.11798238754272461, 0.2218669056892395, 0.3257514238357544, 0.4296359121799469, 0.5335204601287842, 0.6374049186706543, 0.7412894368171692, 0.8451739549636841, 0.949058473110199, 1.0529429912567139, 1.156827449798584, 1.2607120275497437, 1.3645964860916138, 1.4684810638427734, 1.5723655223846436, 1.6762499809265137, 1.7801345586776733, 1.8840190172195435, 1.9879035949707031, 2.0917880535125732, 2.1956725120544434, 2.2995572090148926, 2.4034416675567627, 2.507326126098633, 2.611210584640503, 2.715095043182373, 2.818979501724243, 2.9228641986846924, 3.0267486572265625, 3.1306331157684326, 3.2345175743103027, 3.338402271270752, 3.442286729812622]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 3.0, 7.0, 6.0, 11.0, 17.0, 29.0, 33.0, 52.0, 71.0, 114.0, 172.0, 377.0, 1347.0, 10935.0, 271442.0, 3565775.0, 328936.0, 12566.0, 1524.0, 353.0, 173.0, 104.0, 64.0, 53.0, 30.0, 24.0, 26.0, 6.0, 14.0, 7.0, 2.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.166015625, -2.1097869873046875, -2.053558349609375, -1.9973297119140625, -1.94110107421875, -1.8848724365234375, -1.828643798828125, -1.7724151611328125, -1.7161865234375, -1.6599578857421875, -1.603729248046875, -1.5475006103515625, -1.49127197265625, -1.4350433349609375, -1.378814697265625, -1.3225860595703125, -1.266357421875, -1.2101287841796875, -1.153900146484375, -1.0976715087890625, -1.04144287109375, -0.9852142333984375, -0.928985595703125, -0.8727569580078125, -0.8165283203125, -0.7602996826171875, -0.704071044921875, -0.6478424072265625, -0.59161376953125, -0.5353851318359375, -0.479156494140625, -0.4229278564453125, -0.36669921875, -0.3104705810546875, -0.254241943359375, -0.1980133056640625, -0.14178466796875, -0.0855560302734375, -0.029327392578125, 0.0269012451171875, 0.0831298828125, 0.1393585205078125, 0.195587158203125, 0.2518157958984375, 0.30804443359375, 0.3642730712890625, 0.420501708984375, 0.4767303466796875, 0.532958984375, 0.5891876220703125, 0.645416259765625, 0.7016448974609375, 0.75787353515625, 0.8141021728515625, 0.870330810546875, 0.9265594482421875, 0.9827880859375, 1.0390167236328125, 1.095245361328125, 1.1514739990234375, 1.20770263671875, 1.2639312744140625, 1.320159912109375, 1.3763885498046875, 1.4326171875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 4.0, 8.0, 9.0, 5.0, 17.0, 18.0, 16.0, 33.0, 27.0, 49.0, 44.0, 47.0, 59.0, 75.0, 50.0, 65.0, 69.0, 60.0, 54.0, 42.0, 40.0, 47.0, 36.0, 22.0, 32.0, 19.0, 13.0, 10.0, 9.0, 7.0, 9.0, 7.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77099609375, -0.7509994506835938, -0.7310028076171875, -0.7110061645507812, -0.691009521484375, -0.6710128784179688, -0.6510162353515625, -0.6310195922851562, -0.61102294921875, -0.5910263061523438, -0.5710296630859375, -0.5510330200195312, -0.531036376953125, -0.5110397338867188, -0.4910430908203125, -0.47104644775390625, -0.4510498046875, -0.43105316162109375, -0.4110565185546875, -0.39105987548828125, -0.371063232421875, -0.35106658935546875, -0.3310699462890625, -0.31107330322265625, -0.29107666015625, -0.27108001708984375, -0.2510833740234375, -0.23108673095703125, -0.211090087890625, -0.19109344482421875, -0.1710968017578125, -0.15110015869140625, -0.131103515625, -0.11110687255859375, -0.0911102294921875, -0.07111358642578125, -0.051116943359375, -0.03112030029296875, -0.0111236572265625, 0.00887298583984375, 0.02886962890625, 0.04886627197265625, 0.0688629150390625, 0.08885955810546875, 0.108856201171875, 0.12885284423828125, 0.1488494873046875, 0.16884613037109375, 0.1888427734375, 0.20883941650390625, 0.2288360595703125, 0.24883270263671875, 0.268829345703125, 0.28882598876953125, 0.3088226318359375, 0.32881927490234375, 0.34881591796875, 0.36881256103515625, 0.3888092041015625, 0.40880584716796875, 0.428802490234375, 0.44879913330078125, 0.4687957763671875, 0.48879241943359375, 0.5087890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 6.0, 8.0, 17.0, 31.0, 36.0, 99.0, 174.0, 353.0, 912.0, 2904.0, 14261.0, 106112.0, 926418.0, 2465589.0, 596569.0, 67372.0, 9834.0, 2251.0, 705.0, 306.0, 137.0, 91.0, 42.0, 14.0, 19.0, 5.0, 9.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -0.987823486328125, -0.94732666015625, -0.906829833984375, -0.8663330078125, -0.825836181640625, -0.78533935546875, -0.744842529296875, -0.704345703125, -0.663848876953125, -0.62335205078125, -0.582855224609375, -0.5423583984375, -0.501861572265625, -0.46136474609375, -0.420867919921875, -0.38037109375, -0.339874267578125, -0.29937744140625, -0.258880615234375, -0.2183837890625, -0.177886962890625, -0.13739013671875, -0.096893310546875, -0.056396484375, -0.015899658203125, 0.02459716796875, 0.065093994140625, 0.1055908203125, 0.146087646484375, 0.18658447265625, 0.227081298828125, 0.267578125, 0.308074951171875, 0.34857177734375, 0.389068603515625, 0.4295654296875, 0.470062255859375, 0.51055908203125, 0.551055908203125, 0.591552734375, 0.632049560546875, 0.67254638671875, 0.713043212890625, 0.7535400390625, 0.794036865234375, 0.83453369140625, 0.875030517578125, 0.91552734375, 0.956024169921875, 0.99652099609375, 1.037017822265625, 1.0775146484375, 1.118011474609375, 1.15850830078125, 1.199005126953125, 1.239501953125, 1.279998779296875, 1.32049560546875, 1.360992431640625, 1.4014892578125, 1.441986083984375, 1.48248291015625, 1.522979736328125, 1.5634765625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 10.0, 9.0, 20.0, 19.0, 37.0, 70.0, 91.0, 132.0, 192.0, 275.0, 396.0, 470.0, 507.0, 498.0, 412.0, 313.0, 184.0, 163.0, 96.0, 48.0, 47.0, 27.0, 12.0, 25.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1005859375, -1.0679168701171875, -1.035247802734375, -1.0025787353515625, -0.96990966796875, -0.9372406005859375, -0.904571533203125, -0.8719024658203125, -0.8392333984375, -0.8065643310546875, -0.773895263671875, -0.7412261962890625, -0.70855712890625, -0.6758880615234375, -0.643218994140625, -0.6105499267578125, -0.577880859375, -0.5452117919921875, -0.512542724609375, -0.4798736572265625, -0.44720458984375, -0.4145355224609375, -0.381866455078125, -0.3491973876953125, -0.3165283203125, -0.2838592529296875, -0.251190185546875, -0.2185211181640625, -0.18585205078125, -0.1531829833984375, -0.120513916015625, -0.0878448486328125, -0.05517578125, -0.0225067138671875, 0.010162353515625, 0.0428314208984375, 0.07550048828125, 0.1081695556640625, 0.140838623046875, 0.1735076904296875, 0.2061767578125, 0.2388458251953125, 0.271514892578125, 0.3041839599609375, 0.33685302734375, 0.3695220947265625, 0.402191162109375, 0.4348602294921875, 0.467529296875, 0.5001983642578125, 0.532867431640625, 0.5655364990234375, 0.59820556640625, 0.6308746337890625, 0.663543701171875, 0.6962127685546875, 0.7288818359375, 0.7615509033203125, 0.794219970703125, 0.8268890380859375, 0.85955810546875, 0.8922271728515625, 0.924896240234375, 0.9575653076171875, 0.990234375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 8.0, 4.0, 26.0, 29.0, 55.0, 96.0, 125.0, 139.0, 145.0, 127.0, 113.0, 78.0, 34.0, 11.0, 9.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.534097671508789, -4.368305206298828, -4.202512741088867, -4.0367207527160645, -3.8709282875061035, -3.7051358222961426, -3.5393433570861816, -3.3735508918762207, -3.207758665084839, -3.041966199874878, -2.876173973083496, -2.710381507873535, -2.544589042663574, -2.3787968158721924, -2.2130043506622314, -2.0472121238708496, -1.8814196586608887, -1.7156273126602173, -1.549834966659546, -1.384042501449585, -1.2182501554489136, -1.0524578094482422, -0.886665403842926, -0.7208729982376099, -0.5550806522369385, -0.3892882764339447, -0.22349590063095093, -0.05770352482795715, 0.10808885097503662, 0.273881196975708, 0.43967360258102417, 0.6054660081863403, 0.7712588310241699, 0.9370511770248413, 1.1028435230255127, 1.2686359882354736, 1.434428334236145, 1.6002206802368164, 1.7660131454467773, 1.9318054914474487, 2.09759783744812, 2.263390302658081, 2.429182529449463, 2.594974994659424, 2.7607674598693848, 2.9265596866607666, 3.0923521518707275, 3.2581443786621094, 3.4239368438720703, 3.5897293090820312, 3.755521535873413, 3.921314001083374, 4.087106227874756, 4.252898693084717, 4.418691158294678, 4.584483623504639, 4.750275611877441, 4.916068077087402, 5.081860542297363, 5.247652530670166, 5.413444995880127, 5.579237461090088, 5.745029926300049, 5.91082239151001, 6.076614856719971]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 5.0, 6.0, 12.0, 18.0, 16.0, 14.0, 16.0, 29.0, 24.0, 27.0, 25.0, 25.0, 26.0, 36.0, 31.0, 38.0, 44.0, 53.0, 41.0, 38.0, 50.0, 31.0, 46.0, 38.0, 36.0, 46.0, 26.0, 33.0, 23.0, 27.0, 24.0, 15.0, 20.0, 14.0, 4.0, 14.0, 6.0, 5.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.628404378890991, -2.5423898696899414, -2.4563751220703125, -2.3703603744506836, -2.284345865249634, -2.198331356048584, -2.112316608428955, -2.026301860809326, -1.9402873516082764, -1.854272723197937, -1.7682580947875977, -1.6822434663772583, -1.596228837966919, -1.5102142095565796, -1.4241995811462402, -1.3381849527359009, -1.2521703243255615, -1.1661556959152222, -1.0801410675048828, -0.9941264390945435, -0.9081118106842041, -0.8220971822738647, -0.7360825538635254, -0.650067925453186, -0.5640532970428467, -0.4780386686325073, -0.39202404022216797, -0.3060094118118286, -0.21999478340148926, -0.1339801549911499, -0.04796552658081055, 0.03804910182952881, 0.12406396865844727, 0.21007859706878662, 0.296093225479126, 0.38210785388946533, 0.4681224822998047, 0.554137110710144, 0.6401517391204834, 0.7261663675308228, 0.8121809959411621, 0.8981956243515015, 0.9842102527618408, 1.0702248811721802, 1.1562395095825195, 1.2422541379928589, 1.3282687664031982, 1.4142833948135376, 1.500298023223877, 1.5863126516342163, 1.6723272800445557, 1.758341908454895, 1.8443565368652344, 1.9303711652755737, 2.016385793685913, 2.102400302886963, 2.188415050506592, 2.2744297981262207, 2.3604443073272705, 2.4464588165283203, 2.532473564147949, 2.618488311767578, 2.704502820968628, 2.7905173301696777, 2.8765320777893066]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 11.0, 16.0, 21.0, 43.0, 62.0, 92.0, 181.0, 245.0, 454.0, 850.0, 1553.0, 2876.0, 5394.0, 9846.0, 18530.0, 38903.0, 87364.0, 182826.0, 274588.0, 217256.0, 109739.0, 48883.0, 22994.0, 11813.0, 6370.0, 3408.0, 1839.0, 1010.0, 567.0, 334.0, 180.0, 100.0, 68.0, 47.0, 24.0, 18.0, 14.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.001953125, -0.9702911376953125, -0.938629150390625, -0.9069671630859375, -0.87530517578125, -0.8436431884765625, -0.811981201171875, -0.7803192138671875, -0.7486572265625, -0.7169952392578125, -0.685333251953125, -0.6536712646484375, -0.62200927734375, -0.5903472900390625, -0.558685302734375, -0.5270233154296875, -0.495361328125, -0.4636993408203125, -0.432037353515625, -0.4003753662109375, -0.36871337890625, -0.3370513916015625, -0.305389404296875, -0.2737274169921875, -0.2420654296875, -0.2104034423828125, -0.178741455078125, -0.1470794677734375, -0.11541748046875, -0.0837554931640625, -0.052093505859375, -0.0204315185546875, 0.01123046875, 0.0428924560546875, 0.074554443359375, 0.1062164306640625, 0.13787841796875, 0.1695404052734375, 0.201202392578125, 0.2328643798828125, 0.2645263671875, 0.2961883544921875, 0.327850341796875, 0.3595123291015625, 0.39117431640625, 0.4228363037109375, 0.454498291015625, 0.4861602783203125, 0.517822265625, 0.5494842529296875, 0.581146240234375, 0.6128082275390625, 0.64447021484375, 0.6761322021484375, 0.707794189453125, 0.7394561767578125, 0.7711181640625, 0.8027801513671875, 0.834442138671875, 0.8661041259765625, 0.89776611328125, 0.9294281005859375, 0.961090087890625, 0.9927520751953125, 1.0244140625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 3.0, 5.0, 11.0, 15.0, 13.0, 19.0, 26.0, 41.0, 37.0, 50.0, 44.0, 62.0, 69.0, 62.0, 66.0, 63.0, 57.0, 42.0, 57.0, 46.0, 34.0, 36.0, 32.0, 21.0, 15.0, 24.0, 9.0, 10.0, 12.0, 13.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.7392578125, -0.7207107543945312, -0.7021636962890625, -0.6836166381835938, -0.665069580078125, -0.6465225219726562, -0.6279754638671875, -0.6094284057617188, -0.59088134765625, -0.5723342895507812, -0.5537872314453125, -0.5352401733398438, -0.516693115234375, -0.49814605712890625, -0.4795989990234375, -0.46105194091796875, -0.4425048828125, -0.42395782470703125, -0.4054107666015625, -0.38686370849609375, -0.368316650390625, -0.34976959228515625, -0.3312225341796875, -0.31267547607421875, -0.29412841796875, -0.27558135986328125, -0.2570343017578125, -0.23848724365234375, -0.219940185546875, -0.20139312744140625, -0.1828460693359375, -0.16429901123046875, -0.145751953125, -0.12720489501953125, -0.1086578369140625, -0.09011077880859375, -0.071563720703125, -0.05301666259765625, -0.0344696044921875, -0.01592254638671875, 0.00262451171875, 0.02117156982421875, 0.0397186279296875, 0.05826568603515625, 0.076812744140625, 0.09535980224609375, 0.1139068603515625, 0.13245391845703125, 0.1510009765625, 0.16954803466796875, 0.1880950927734375, 0.20664215087890625, 0.225189208984375, 0.24373626708984375, 0.2622833251953125, 0.28083038330078125, 0.29937744140625, 0.31792449951171875, 0.3364715576171875, 0.35501861572265625, 0.373565673828125, 0.39211273193359375, 0.4106597900390625, 0.42920684814453125, 0.44775390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 12.0, 9.0, 10.0, 24.0, 34.0, 29.0, 43.0, 76.0, 112.0, 158.0, 224.0, 427.0, 889.0, 1722.0, 3845.0, 9113.0, 21855.0, 54273.0, 132416.0, 260171.0, 284937.0, 161964.0, 68622.0, 27103.0, 11263.0, 4736.0, 2120.0, 1004.0, 500.0, 287.0, 202.0, 116.0, 82.0, 48.0, 44.0, 31.0, 23.0, 10.0, 8.0, 2.0, 3.0, 3.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.96923828125, -0.9347763061523438, -0.9003143310546875, -0.8658523559570312, -0.831390380859375, -0.7969284057617188, -0.7624664306640625, -0.7280044555664062, -0.69354248046875, -0.6590805053710938, -0.6246185302734375, -0.5901565551757812, -0.555694580078125, -0.5212326049804688, -0.4867706298828125, -0.45230865478515625, -0.4178466796875, -0.38338470458984375, -0.3489227294921875, -0.31446075439453125, -0.279998779296875, -0.24553680419921875, -0.2110748291015625, -0.17661285400390625, -0.14215087890625, -0.10768890380859375, -0.0732269287109375, -0.03876495361328125, -0.004302978515625, 0.03015899658203125, 0.0646209716796875, 0.09908294677734375, 0.133544921875, 0.16800689697265625, 0.2024688720703125, 0.23693084716796875, 0.271392822265625, 0.30585479736328125, 0.3403167724609375, 0.37477874755859375, 0.40924072265625, 0.44370269775390625, 0.4781646728515625, 0.5126266479492188, 0.547088623046875, 0.5815505981445312, 0.6160125732421875, 0.6504745483398438, 0.6849365234375, 0.7193984985351562, 0.7538604736328125, 0.7883224487304688, 0.822784423828125, 0.8572463989257812, 0.8917083740234375, 0.9261703491210938, 0.96063232421875, 0.9950942993164062, 1.0295562744140625, 1.0640182495117188, 1.098480224609375, 1.1329421997070312, 1.1674041748046875, 1.2018661499023438, 1.236328125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 5.0, 8.0, 15.0, 16.0, 20.0, 16.0, 33.0, 25.0, 39.0, 28.0, 32.0, 51.0, 39.0, 38.0, 59.0, 56.0, 57.0, 60.0, 51.0, 40.0, 39.0, 49.0, 35.0, 29.0, 21.0, 22.0, 20.0, 17.0, 15.0, 9.0, 17.0, 8.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.33984375, -1.2979736328125, -1.256103515625, -1.2142333984375, -1.17236328125, -1.1304931640625, -1.088623046875, -1.0467529296875, -1.0048828125, -0.9630126953125, -0.921142578125, -0.8792724609375, -0.83740234375, -0.7955322265625, -0.753662109375, -0.7117919921875, -0.669921875, -0.6280517578125, -0.586181640625, -0.5443115234375, -0.50244140625, -0.4605712890625, -0.418701171875, -0.3768310546875, -0.3349609375, -0.2930908203125, -0.251220703125, -0.2093505859375, -0.16748046875, -0.1256103515625, -0.083740234375, -0.0418701171875, 0.0, 0.0418701171875, 0.083740234375, 0.1256103515625, 0.16748046875, 0.2093505859375, 0.251220703125, 0.2930908203125, 0.3349609375, 0.3768310546875, 0.418701171875, 0.4605712890625, 0.50244140625, 0.5443115234375, 0.586181640625, 0.6280517578125, 0.669921875, 0.7117919921875, 0.753662109375, 0.7955322265625, 0.83740234375, 0.8792724609375, 0.921142578125, 0.9630126953125, 1.0048828125, 1.0467529296875, 1.088623046875, 1.1304931640625, 1.17236328125, 1.2142333984375, 1.256103515625, 1.2979736328125, 1.33984375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 4.0, 6.0, 16.0, 25.0, 34.0, 76.0, 104.0, 208.0, 319.0, 572.0, 1065.0, 1841.0, 3452.0, 6575.0, 12681.0, 25370.0, 50706.0, 97930.0, 162823.0, 208847.0, 194047.0, 132516.0, 73693.0, 36983.0, 18464.0, 9334.0, 4895.0, 2636.0, 1426.0, 798.0, 424.0, 283.0, 174.0, 82.0, 45.0, 31.0, 18.0, 10.0, 8.0, 9.0, 8.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.318603515625, -0.3091697692871094, -0.29973602294921875, -0.2903022766113281, -0.2808685302734375, -0.2714347839355469, -0.26200103759765625, -0.2525672912597656, -0.243133544921875, -0.23369979858398438, -0.22426605224609375, -0.21483230590820312, -0.2053985595703125, -0.19596481323242188, -0.18653106689453125, -0.17709732055664062, -0.16766357421875, -0.15822982788085938, -0.14879608154296875, -0.13936233520507812, -0.1299285888671875, -0.12049484252929688, -0.11106109619140625, -0.10162734985351562, -0.092193603515625, -0.08275985717773438, -0.07332611083984375, -0.06389236450195312, -0.0544586181640625, -0.045024871826171875, -0.03559112548828125, -0.026157379150390625, -0.0167236328125, -0.007289886474609375, 0.00214385986328125, 0.011577606201171875, 0.0210113525390625, 0.030445098876953125, 0.03987884521484375, 0.049312591552734375, 0.058746337890625, 0.06818008422851562, 0.07761383056640625, 0.08704757690429688, 0.0964813232421875, 0.10591506958007812, 0.11534881591796875, 0.12478256225585938, 0.13421630859375, 0.14365005493164062, 0.15308380126953125, 0.16251754760742188, 0.1719512939453125, 0.18138504028320312, 0.19081878662109375, 0.20025253295898438, 0.209686279296875, 0.21912002563476562, 0.22855377197265625, 0.23798751831054688, 0.2474212646484375, 0.2568550109863281, 0.26628875732421875, 0.2757225036621094, 0.28515625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 7.0, 8.0, 6.0, 9.0, 10.0, 21.0, 12.0, 24.0, 31.0, 27.0, 50.0, 66.0, 61.0, 80.0, 86.0, 75.0, 83.0, 68.0, 63.0, 44.0, 37.0, 34.0, 17.0, 18.0, 6.0, 11.0, 12.0, 8.0, 3.0, 4.0, 8.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.408857345581055e-05, -7.198750972747803e-05, -6.988644599914551e-05, -6.778538227081299e-05, -6.568431854248047e-05, -6.358325481414795e-05, -6.148219108581543e-05, -5.938112735748291e-05, -5.728006362915039e-05, -5.517899990081787e-05, -5.307793617248535e-05, -5.097687244415283e-05, -4.887580871582031e-05, -4.677474498748779e-05, -4.4673681259155273e-05, -4.2572617530822754e-05, -4.0471553802490234e-05, -3.8370490074157715e-05, -3.6269426345825195e-05, -3.4168362617492676e-05, -3.2067298889160156e-05, -2.9966235160827637e-05, -2.7865171432495117e-05, -2.5764107704162598e-05, -2.3663043975830078e-05, -2.156198024749756e-05, -1.946091651916504e-05, -1.735985279083252e-05, -1.52587890625e-05, -1.315772533416748e-05, -1.1056661605834961e-05, -8.955597877502441e-06, -6.854534149169922e-06, -4.753470420837402e-06, -2.652406692504883e-06, -5.513429641723633e-07, 1.5497207641601562e-06, 3.6507844924926758e-06, 5.751848220825195e-06, 7.852911949157715e-06, 9.953975677490234e-06, 1.2055039405822754e-05, 1.4156103134155273e-05, 1.6257166862487793e-05, 1.8358230590820312e-05, 2.0459294319152832e-05, 2.256035804748535e-05, 2.466142177581787e-05, 2.676248550415039e-05, 2.886354923248291e-05, 3.096461296081543e-05, 3.306567668914795e-05, 3.516674041748047e-05, 3.726780414581299e-05, 3.936886787414551e-05, 4.146993160247803e-05, 4.357099533081055e-05, 4.5672059059143066e-05, 4.7773122787475586e-05, 4.9874186515808105e-05, 5.1975250244140625e-05, 5.4076313972473145e-05, 5.6177377700805664e-05, 5.8278441429138184e-05, 6.03795051574707e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 7.0, 12.0, 18.0, 17.0, 25.0, 36.0, 60.0, 71.0, 146.0, 243.0, 426.0, 871.0, 1780.0, 3760.0, 8724.0, 21280.0, 53540.0, 126003.0, 227825.0, 266041.0, 185566.0, 89780.0, 36146.0, 14614.0, 5995.0, 2758.0, 1304.0, 578.0, 349.0, 217.0, 114.0, 77.0, 43.0, 40.0, 31.0, 15.0, 8.0, 10.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.354736328125, -0.34375, -0.332763671875, -0.32177734375, -0.310791015625, -0.2998046875, -0.288818359375, -0.27783203125, -0.266845703125, -0.255859375, -0.244873046875, -0.23388671875, -0.222900390625, -0.2119140625, -0.200927734375, -0.18994140625, -0.178955078125, -0.16796875, -0.156982421875, -0.14599609375, -0.135009765625, -0.1240234375, -0.113037109375, -0.10205078125, -0.091064453125, -0.080078125, -0.069091796875, -0.05810546875, -0.047119140625, -0.0361328125, -0.025146484375, -0.01416015625, -0.003173828125, 0.0078125, 0.018798828125, 0.02978515625, 0.040771484375, 0.0517578125, 0.062744140625, 0.07373046875, 0.084716796875, 0.095703125, 0.106689453125, 0.11767578125, 0.128662109375, 0.1396484375, 0.150634765625, 0.16162109375, 0.172607421875, 0.18359375, 0.194580078125, 0.20556640625, 0.216552734375, 0.2275390625, 0.238525390625, 0.24951171875, 0.260498046875, 0.271484375, 0.282470703125, 0.29345703125, 0.304443359375, 0.3154296875, 0.326416015625, 0.33740234375, 0.348388671875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 6.0, 7.0, 7.0, 15.0, 15.0, 16.0, 29.0, 26.0, 35.0, 38.0, 51.0, 36.0, 52.0, 51.0, 62.0, 68.0, 71.0, 66.0, 50.0, 41.0, 46.0, 45.0, 36.0, 27.0, 16.0, 20.0, 17.0, 10.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2939453125, -0.2842521667480469, -0.27455902099609375, -0.2648658752441406, -0.2551727294921875, -0.24547958374023438, -0.23578643798828125, -0.22609329223632812, -0.216400146484375, -0.20670700073242188, -0.19701385498046875, -0.18732070922851562, -0.1776275634765625, -0.16793441772460938, -0.15824127197265625, -0.14854812622070312, -0.13885498046875, -0.12916183471679688, -0.11946868896484375, -0.10977554321289062, -0.1000823974609375, -0.09038925170898438, -0.08069610595703125, -0.07100296020507812, -0.061309814453125, -0.051616668701171875, -0.04192352294921875, -0.032230377197265625, -0.0225372314453125, -0.012844085693359375, -0.00315093994140625, 0.006542205810546875, 0.0162353515625, 0.025928497314453125, 0.03562164306640625, 0.045314788818359375, 0.0550079345703125, 0.06470108032226562, 0.07439422607421875, 0.08408737182617188, 0.093780517578125, 0.10347366333007812, 0.11316680908203125, 0.12285995483398438, 0.1325531005859375, 0.14224624633789062, 0.15193939208984375, 0.16163253784179688, 0.17132568359375, 0.18101882934570312, 0.19071197509765625, 0.20040512084960938, 0.2100982666015625, 0.21979141235351562, 0.22948455810546875, 0.23917770385742188, 0.248870849609375, 0.2585639953613281, 0.26825714111328125, 0.2779502868652344, 0.2876434326171875, 0.2973365783691406, 0.30702972412109375, 0.3167228698730469, 0.326416015625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 11.0, 25.0, 55.0, 108.0, 167.0, 220.0, 179.0, 127.0, 62.0, 30.0, 11.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.666427612304688, -9.427969932556152, -9.189513206481934, -8.951055526733398, -8.71259880065918, -8.474141120910645, -8.23568344116211, -7.997226715087891, -7.7587690353393555, -7.5203118324279785, -7.281854629516602, -7.043396949768066, -6.8049397468566895, -6.5664825439453125, -6.3280253410339355, -6.089568138122559, -5.851110458374023, -5.6126532554626465, -5.3741960525512695, -5.135738372802734, -4.897281169891357, -4.6588239669799805, -4.4203667640686035, -4.181909561157227, -3.9434523582458496, -3.7049951553344727, -3.4665377140045166, -3.2280805110931396, -2.9896230697631836, -2.7511658668518066, -2.5127086639404297, -2.2742512226104736, -2.0357937812805176, -1.797336459159851, -1.5588791370391846, -1.3204219341278076, -1.0819644927978516, -0.8435072898864746, -0.6050499677658081, -0.3665926456451416, -0.1281353235244751, 0.11032198369503021, 0.3487792909145355, 0.5872365832328796, 0.8256939053535461, 1.0641511678695679, 1.3026084899902344, 1.5410658121109009, 1.7795231342315674, 2.0179803371429443, 2.2564377784729004, 2.4948949813842773, 2.7333524227142334, 2.9718096256256104, 3.2102670669555664, 3.4487242698669434, 3.6871814727783203, 3.9256386756896973, 4.164095878601074, 4.402553558349609, 4.641010761260986, 4.879467964172363, 5.11792516708374, 5.356382369995117, 5.594840049743652]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 5.0, 6.0, 3.0, 6.0, 14.0, 11.0, 13.0, 18.0, 13.0, 15.0, 21.0, 21.0, 24.0, 35.0, 24.0, 30.0, 32.0, 31.0, 51.0, 38.0, 41.0, 39.0, 37.0, 53.0, 37.0, 47.0, 26.0, 36.0, 31.0, 33.0, 31.0, 17.0, 21.0, 20.0, 21.0, 22.0, 11.0, 14.0, 9.0, 6.0, 9.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.26035213470459, -3.161606788635254, -3.062861204147339, -2.964115858078003, -2.865370273590088, -2.766624927520752, -2.667879581451416, -2.569133996963501, -2.470388650894165, -2.371643304824829, -2.272897720336914, -2.174152374267578, -2.075406789779663, -1.9766614437103271, -1.8779159784317017, -1.7791705131530762, -1.6804250478744507, -1.5816795825958252, -1.4829341173171997, -1.3841886520385742, -1.2854433059692383, -1.1866978406906128, -1.0879523754119873, -0.9892069697380066, -0.8904615044593811, -0.7917160391807556, -0.6929706335067749, -0.5942251682281494, -0.4954797327518463, -0.3967342972755432, -0.2979888319969177, -0.199243426322937, -0.10049796104431152, -0.001752518117427826, 0.09699292480945587, 0.19573837518692017, 0.29448381066322327, 0.39322924613952637, 0.49197471141815186, 0.5907201170921326, 0.6894655823707581, 0.7882110476493835, 0.8869564533233643, 0.9857019186019897, 1.0844473838806152, 1.1831927299499512, 1.2819383144378662, 1.3806836605072021, 1.4794291257858276, 1.5781745910644531, 1.6769200563430786, 1.775665521621704, 1.87441086769104, 1.9731563329696655, 2.071901798248291, 2.170647144317627, 2.269392728805542, 2.368138074874878, 2.466883659362793, 2.565629005432129, 2.664374589920044, 2.76311993598938, 2.861865520477295, 2.960610866546631, 3.059356212615967]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 1.0, 13.0, 17.0, 15.0, 20.0, 34.0, 60.0, 66.0, 127.0, 151.0, 293.0, 472.0, 841.0, 1592.0, 3074.0, 7121.0, 16618.0, 43477.0, 131657.0, 474828.0, 1335159.0, 1419976.0, 525986.0, 148319.0, 49613.0, 19220.0, 7867.0, 3666.0, 1700.0, 945.0, 544.0, 318.0, 183.0, 120.0, 78.0, 38.0, 25.0, 13.0, 8.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.576171875, -0.5592498779296875, -0.542327880859375, -0.5254058837890625, -0.50848388671875, -0.4915618896484375, -0.474639892578125, -0.4577178955078125, -0.4407958984375, -0.4238739013671875, -0.406951904296875, -0.3900299072265625, -0.37310791015625, -0.3561859130859375, -0.339263916015625, -0.3223419189453125, -0.305419921875, -0.2884979248046875, -0.271575927734375, -0.2546539306640625, -0.23773193359375, -0.2208099365234375, -0.203887939453125, -0.1869659423828125, -0.1700439453125, -0.1531219482421875, -0.136199951171875, -0.1192779541015625, -0.10235595703125, -0.0854339599609375, -0.068511962890625, -0.0515899658203125, -0.03466796875, -0.0177459716796875, -0.000823974609375, 0.0160980224609375, 0.03302001953125, 0.0499420166015625, 0.066864013671875, 0.0837860107421875, 0.1007080078125, 0.1176300048828125, 0.134552001953125, 0.1514739990234375, 0.16839599609375, 0.1853179931640625, 0.202239990234375, 0.2191619873046875, 0.236083984375, 0.2530059814453125, 0.269927978515625, 0.2868499755859375, 0.30377197265625, 0.3206939697265625, 0.337615966796875, 0.3545379638671875, 0.3714599609375, 0.3883819580078125, 0.405303955078125, 0.4222259521484375, 0.43914794921875, 0.4560699462890625, 0.472991943359375, 0.4899139404296875, 0.5068359375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 14.0, 20.0, 19.0, 21.0, 33.0, 41.0, 53.0, 56.0, 69.0, 49.0, 49.0, 78.0, 56.0, 66.0, 69.0, 53.0, 38.0, 34.0, 34.0, 31.0, 20.0, 20.0, 15.0, 14.0, 7.0, 9.0, 4.0, 12.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.708984375, -0.6897048950195312, -0.6704254150390625, -0.6511459350585938, -0.631866455078125, -0.6125869750976562, -0.5933074951171875, -0.5740280151367188, -0.55474853515625, -0.5354690551757812, -0.5161895751953125, -0.49691009521484375, -0.477630615234375, -0.45835113525390625, -0.4390716552734375, -0.41979217529296875, -0.4005126953125, -0.38123321533203125, -0.3619537353515625, -0.34267425537109375, -0.323394775390625, -0.30411529541015625, -0.2848358154296875, -0.26555633544921875, -0.24627685546875, -0.22699737548828125, -0.2077178955078125, -0.18843841552734375, -0.169158935546875, -0.14987945556640625, -0.1305999755859375, -0.11132049560546875, -0.092041015625, -0.07276153564453125, -0.0534820556640625, -0.03420257568359375, -0.014923095703125, 0.00435638427734375, 0.0236358642578125, 0.04291534423828125, 0.06219482421875, 0.08147430419921875, 0.1007537841796875, 0.12003326416015625, 0.139312744140625, 0.15859222412109375, 0.1778717041015625, 0.19715118408203125, 0.2164306640625, 0.23571014404296875, 0.2549896240234375, 0.27426910400390625, 0.293548583984375, 0.31282806396484375, 0.3321075439453125, 0.35138702392578125, 0.37066650390625, 0.38994598388671875, 0.4092254638671875, 0.42850494384765625, 0.447784423828125, 0.46706390380859375, 0.4863433837890625, 0.5056228637695312, 0.52490234375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 13.0, 10.0, 15.0, 28.0, 18.0, 42.0, 63.0, 95.0, 165.0, 276.0, 483.0, 1196.0, 3402.0, 11977.0, 51917.0, 259615.0, 1227465.0, 1932467.0, 561869.0, 110187.0, 23224.0, 6108.0, 1904.0, 750.0, 376.0, 205.0, 123.0, 72.0, 61.0, 42.0, 27.0, 18.0, 16.0, 8.0, 9.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.83154296875, -0.8031005859375, -0.774658203125, -0.7462158203125, -0.7177734375, -0.6893310546875, -0.660888671875, -0.6324462890625, -0.60400390625, -0.5755615234375, -0.547119140625, -0.5186767578125, -0.490234375, -0.4617919921875, -0.433349609375, -0.4049072265625, -0.37646484375, -0.3480224609375, -0.319580078125, -0.2911376953125, -0.2626953125, -0.2342529296875, -0.205810546875, -0.1773681640625, -0.14892578125, -0.1204833984375, -0.092041015625, -0.0635986328125, -0.03515625, -0.0067138671875, 0.021728515625, 0.0501708984375, 0.07861328125, 0.1070556640625, 0.135498046875, 0.1639404296875, 0.1923828125, 0.2208251953125, 0.249267578125, 0.2777099609375, 0.30615234375, 0.3345947265625, 0.363037109375, 0.3914794921875, 0.419921875, 0.4483642578125, 0.476806640625, 0.5052490234375, 0.53369140625, 0.5621337890625, 0.590576171875, 0.6190185546875, 0.6474609375, 0.6759033203125, 0.704345703125, 0.7327880859375, 0.76123046875, 0.7896728515625, 0.818115234375, 0.8465576171875, 0.875, 0.9034423828125, 0.931884765625, 0.9603271484375, 0.98876953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 0.0, 4.0, 9.0, 12.0, 12.0, 16.0, 32.0, 23.0, 53.0, 73.0, 74.0, 113.0, 135.0, 196.0, 235.0, 292.0, 333.0, 372.0, 375.0, 346.0, 287.0, 286.0, 187.0, 153.0, 102.0, 110.0, 58.0, 62.0, 31.0, 24.0, 22.0, 10.0, 12.0, 6.0, 6.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.71337890625, -0.69189453125, -0.67041015625, -0.64892578125, -0.62744140625, -0.60595703125, -0.58447265625, -0.56298828125, -0.54150390625, -0.52001953125, -0.49853515625, -0.47705078125, -0.45556640625, -0.43408203125, -0.41259765625, -0.39111328125, -0.36962890625, -0.34814453125, -0.32666015625, -0.30517578125, -0.28369140625, -0.26220703125, -0.24072265625, -0.21923828125, -0.19775390625, -0.17626953125, -0.15478515625, -0.13330078125, -0.11181640625, -0.09033203125, -0.06884765625, -0.04736328125, -0.02587890625, -0.00439453125, 0.01708984375, 0.03857421875, 0.06005859375, 0.08154296875, 0.10302734375, 0.12451171875, 0.14599609375, 0.16748046875, 0.18896484375, 0.21044921875, 0.23193359375, 0.25341796875, 0.27490234375, 0.29638671875, 0.31787109375, 0.33935546875, 0.36083984375, 0.38232421875, 0.40380859375, 0.42529296875, 0.44677734375, 0.46826171875, 0.48974609375, 0.51123046875, 0.53271484375, 0.55419921875, 0.57568359375, 0.59716796875, 0.61865234375, 0.64013671875, 0.66162109375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 7.0, 10.0, 9.0, 13.0, 24.0, 27.0, 50.0, 72.0, 94.0, 100.0, 121.0, 111.0, 106.0, 75.0, 59.0, 41.0, 34.0, 25.0, 14.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4649033546447754, -2.3436295986175537, -2.222355604171753, -2.1010818481445312, -1.97980797290802, -1.8585340976715088, -1.7372602224349976, -1.6159863471984863, -1.4947125911712646, -1.3734387159347534, -1.2521648406982422, -1.1308910846710205, -1.0096172094345093, -0.888343334197998, -0.7670694589614868, -0.6457956433296204, -0.5245217084884644, -0.4032478630542755, -0.28197401762008667, -0.16070014238357544, -0.0394262969493866, 0.08184754848480225, 0.20312142372131348, 0.32439523935317993, 0.44566911458969116, 0.5669429898262024, 0.6882168054580688, 0.8094906806945801, 0.9307645559310913, 1.0520384311676025, 1.1733121871948242, 1.2945860624313354, 1.4158599376678467, 1.537133812904358, 1.6584076881408691, 1.7796814441680908, 1.900955319404602, 2.0222291946411133, 2.143503189086914, 2.2647769451141357, 2.3860507011413574, 2.507324457168579, 2.62859845161438, 2.7498722076416016, 2.8711462020874023, 2.992419958114624, 3.1136937141418457, 3.2349677085876465, 3.3562417030334473, 3.477515459060669, 3.5987894535064697, 3.7200632095336914, 3.841337203979492, 3.962610960006714, 4.0838847160339355, 4.205158710479736, 4.326432228088379, 4.44770622253418, 4.568979740142822, 4.690253734588623, 4.811527729034424, 4.932801246643066, 5.054075241088867, 5.175349235534668, 5.296623229980469]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 1.0, 11.0, 4.0, 7.0, 3.0, 7.0, 7.0, 11.0, 14.0, 12.0, 26.0, 22.0, 31.0, 29.0, 37.0, 24.0, 29.0, 32.0, 37.0, 43.0, 31.0, 45.0, 44.0, 33.0, 45.0, 39.0, 36.0, 32.0, 32.0, 37.0, 30.0, 38.0, 21.0, 31.0, 24.0, 13.0, 14.0, 9.0, 15.0, 8.0, 9.0, 3.0, 3.0, 1.0, 3.0, 5.0, 8.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1536037921905518, -2.0860636234283447, -2.018523693084717, -1.9509835243225098, -1.8834433555603027, -1.8159033060073853, -1.7483632564544678, -1.6808230876922607, -1.6132830381393433, -1.5457429885864258, -1.4782028198242188, -1.4106627702713013, -1.3431227207183838, -1.2755825519561768, -1.2080425024032593, -1.1405024528503418, -1.0729622840881348, -1.0054222345352173, -0.9378820657730103, -0.8703420162200928, -0.8028019070625305, -0.7352617979049683, -0.6677217483520508, -0.6001816391944885, -0.5326415300369263, -0.465101420879364, -0.39756134152412415, -0.3300212621688843, -0.262481153011322, -0.19494104385375977, -0.1274009644985199, -0.05986088514328003, 0.007679462432861328, 0.07521955668926239, 0.14275965094566345, 0.21029974520206451, 0.2778398394584656, 0.34537994861602783, 0.4129200279712677, 0.48046010732650757, 0.5480002164840698, 0.6155403256416321, 0.6830804347991943, 0.7506204843521118, 0.8181605935096741, 0.8857007026672363, 0.9532407522201538, 1.0207808017730713, 1.0883209705352783, 1.1558610200881958, 1.2234011888504028, 1.2909412384033203, 1.3584814071655273, 1.4260214567184448, 1.4935615062713623, 1.5611016750335693, 1.6286417245864868, 1.6961817741394043, 1.7637219429016113, 1.8312619924545288, 1.8988020420074463, 1.9663422107696533, 2.0338823795318604, 2.1014223098754883, 2.1689624786376953]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 4.0, 4.0, 9.0, 13.0, 24.0, 29.0, 53.0, 74.0, 130.0, 213.0, 404.0, 734.0, 1263.0, 2472.0, 4709.0, 9478.0, 18823.0, 37585.0, 74820.0, 144655.0, 228472.0, 228564.0, 144949.0, 74995.0, 37325.0, 18986.0, 9561.0, 4778.0, 2562.0, 1221.0, 683.0, 376.0, 207.0, 140.0, 78.0, 62.0, 29.0, 22.0, 17.0, 14.0, 13.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7470703125, -0.7203903198242188, -0.6937103271484375, -0.6670303344726562, -0.640350341796875, -0.6136703491210938, -0.5869903564453125, -0.5603103637695312, -0.53363037109375, -0.5069503784179688, -0.4802703857421875, -0.45359039306640625, -0.426910400390625, -0.40023040771484375, -0.3735504150390625, -0.34687042236328125, -0.3201904296875, -0.29351043701171875, -0.2668304443359375, -0.24015045166015625, -0.213470458984375, -0.18679046630859375, -0.1601104736328125, -0.13343048095703125, -0.10675048828125, -0.08007049560546875, -0.0533905029296875, -0.02671051025390625, -3.0517578125e-05, 0.02664947509765625, 0.0533294677734375, 0.08000946044921875, 0.106689453125, 0.13336944580078125, 0.1600494384765625, 0.18672943115234375, 0.213409423828125, 0.24008941650390625, 0.2667694091796875, 0.29344940185546875, 0.32012939453125, 0.34680938720703125, 0.3734893798828125, 0.40016937255859375, 0.426849365234375, 0.45352935791015625, 0.4802093505859375, 0.5068893432617188, 0.5335693359375, 0.5602493286132812, 0.5869293212890625, 0.6136093139648438, 0.640289306640625, 0.6669692993164062, 0.6936492919921875, 0.7203292846679688, 0.74700927734375, 0.7736892700195312, 0.8003692626953125, 0.8270492553710938, 0.853729248046875, 0.8804092407226562, 0.9070892333984375, 0.9337692260742188, 0.96044921875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 7.0, 11.0, 15.0, 21.0, 21.0, 28.0, 31.0, 50.0, 45.0, 58.0, 61.0, 76.0, 59.0, 55.0, 64.0, 41.0, 69.0, 36.0, 52.0, 45.0, 24.0, 35.0, 22.0, 15.0, 15.0, 8.0, 11.0, 5.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.67919921875, -0.6610641479492188, -0.6429290771484375, -0.6247940063476562, -0.606658935546875, -0.5885238647460938, -0.5703887939453125, -0.5522537231445312, -0.53411865234375, -0.5159835815429688, -0.4978485107421875, -0.47971343994140625, -0.461578369140625, -0.44344329833984375, -0.4253082275390625, -0.40717315673828125, -0.3890380859375, -0.37090301513671875, -0.3527679443359375, -0.33463287353515625, -0.316497802734375, -0.29836273193359375, -0.2802276611328125, -0.26209259033203125, -0.24395751953125, -0.22582244873046875, -0.2076873779296875, -0.18955230712890625, -0.171417236328125, -0.15328216552734375, -0.1351470947265625, -0.11701202392578125, -0.098876953125, -0.08074188232421875, -0.0626068115234375, -0.04447174072265625, -0.026336669921875, -0.00820159912109375, 0.0099334716796875, 0.02806854248046875, 0.04620361328125, 0.06433868408203125, 0.0824737548828125, 0.10060882568359375, 0.118743896484375, 0.13687896728515625, 0.1550140380859375, 0.17314910888671875, 0.1912841796875, 0.20941925048828125, 0.2275543212890625, 0.24568939208984375, 0.263824462890625, 0.28195953369140625, 0.3000946044921875, 0.31822967529296875, 0.33636474609375, 0.35449981689453125, 0.3726348876953125, 0.39076995849609375, 0.408905029296875, 0.42704010009765625, 0.4451751708984375, 0.46331024169921875, 0.4814453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 9.0, 7.0, 11.0, 10.0, 15.0, 11.0, 17.0, 20.0, 31.0, 36.0, 53.0, 71.0, 163.0, 355.0, 1012.0, 3077.0, 8901.0, 24888.0, 66111.0, 162608.0, 301723.0, 269648.0, 129148.0, 51223.0, 18911.0, 6731.0, 2315.0, 772.0, 276.0, 120.0, 63.0, 47.0, 24.0, 28.0, 22.0, 23.0, 21.0, 16.0, 9.0, 4.0, 3.0, 7.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.294921875, -1.257781982421875, -1.22064208984375, -1.183502197265625, -1.1463623046875, -1.109222412109375, -1.07208251953125, -1.034942626953125, -0.997802734375, -0.960662841796875, -0.92352294921875, -0.886383056640625, -0.8492431640625, -0.812103271484375, -0.77496337890625, -0.737823486328125, -0.70068359375, -0.663543701171875, -0.62640380859375, -0.589263916015625, -0.5521240234375, -0.514984130859375, -0.47784423828125, -0.440704345703125, -0.403564453125, -0.366424560546875, -0.32928466796875, -0.292144775390625, -0.2550048828125, -0.217864990234375, -0.18072509765625, -0.143585205078125, -0.1064453125, -0.069305419921875, -0.03216552734375, 0.004974365234375, 0.0421142578125, 0.079254150390625, 0.11639404296875, 0.153533935546875, 0.190673828125, 0.227813720703125, 0.26495361328125, 0.302093505859375, 0.3392333984375, 0.376373291015625, 0.41351318359375, 0.450653076171875, 0.48779296875, 0.524932861328125, 0.56207275390625, 0.599212646484375, 0.6363525390625, 0.673492431640625, 0.71063232421875, 0.747772216796875, 0.784912109375, 0.822052001953125, 0.85919189453125, 0.896331787109375, 0.9334716796875, 0.970611572265625, 1.00775146484375, 1.044891357421875, 1.08203125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 5.0, 3.0, 4.0, 8.0, 8.0, 12.0, 24.0, 16.0, 20.0, 17.0, 22.0, 24.0, 18.0, 32.0, 25.0, 33.0, 32.0, 45.0, 35.0, 30.0, 40.0, 35.0, 35.0, 46.0, 34.0, 31.0, 32.0, 35.0, 26.0, 31.0, 23.0, 31.0, 28.0, 28.0, 22.0, 19.0, 14.0, 14.0, 10.0, 19.0, 9.0, 4.0, 9.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9658203125, -0.9326629638671875, -0.899505615234375, -0.8663482666015625, -0.83319091796875, -0.8000335693359375, -0.766876220703125, -0.7337188720703125, -0.7005615234375, -0.6674041748046875, -0.634246826171875, -0.6010894775390625, -0.56793212890625, -0.5347747802734375, -0.501617431640625, -0.4684600830078125, -0.435302734375, -0.4021453857421875, -0.368988037109375, -0.3358306884765625, -0.30267333984375, -0.2695159912109375, -0.236358642578125, -0.2032012939453125, -0.1700439453125, -0.1368865966796875, -0.103729248046875, -0.0705718994140625, -0.03741455078125, -0.0042572021484375, 0.028900146484375, 0.0620574951171875, 0.09521484375, 0.1283721923828125, 0.161529541015625, 0.1946868896484375, 0.22784423828125, 0.2610015869140625, 0.294158935546875, 0.3273162841796875, 0.3604736328125, 0.3936309814453125, 0.426788330078125, 0.4599456787109375, 0.49310302734375, 0.5262603759765625, 0.559417724609375, 0.5925750732421875, 0.625732421875, 0.6588897705078125, 0.692047119140625, 0.7252044677734375, 0.75836181640625, 0.7915191650390625, 0.824676513671875, 0.8578338623046875, 0.8909912109375, 0.9241485595703125, 0.957305908203125, 0.9904632568359375, 1.02362060546875, 1.0567779541015625, 1.089935302734375, 1.1230926513671875, 1.15625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 7.0, 7.0, 9.0, 19.0, 23.0, 33.0, 57.0, 80.0, 93.0, 138.0, 262.0, 338.0, 502.0, 742.0, 1152.0, 1737.0, 2588.0, 3924.0, 6130.0, 9652.0, 15558.0, 24678.0, 39053.0, 60544.0, 87235.0, 117878.0, 139226.0, 140487.0, 122249.0, 92880.0, 65018.0, 42748.0, 27198.0, 16646.0, 10607.0, 6527.0, 4334.0, 2729.0, 1758.0, 1197.0, 771.0, 547.0, 363.0, 278.0, 179.0, 121.0, 89.0, 46.0, 55.0, 22.0, 18.0, 10.0, 7.0, 5.0, 4.0, 1.0, 3.0, 2.0], "bins": [-0.2056884765625, -0.19947242736816406, -0.19325637817382812, -0.1870403289794922, -0.18082427978515625, -0.1746082305908203, -0.16839218139648438, -0.16217613220214844, -0.1559600830078125, -0.14974403381347656, -0.14352798461914062, -0.1373119354248047, -0.13109588623046875, -0.12487983703613281, -0.11866378784179688, -0.11244773864746094, -0.106231689453125, -0.10001564025878906, -0.09379959106445312, -0.08758354187011719, -0.08136749267578125, -0.07515144348144531, -0.06893539428710938, -0.06271934509277344, -0.0565032958984375, -0.05028724670410156, -0.044071197509765625, -0.03785514831542969, -0.03163909912109375, -0.025423049926757812, -0.019207000732421875, -0.012990951538085938, -0.00677490234375, -0.0005588531494140625, 0.005657196044921875, 0.011873245239257812, 0.01808929443359375, 0.024305343627929688, 0.030521392822265625, 0.03673744201660156, 0.0429534912109375, 0.04916954040527344, 0.055385589599609375, 0.06160163879394531, 0.06781768798828125, 0.07403373718261719, 0.08024978637695312, 0.08646583557128906, 0.092681884765625, 0.09889793395996094, 0.10511398315429688, 0.11133003234863281, 0.11754608154296875, 0.12376213073730469, 0.12997817993164062, 0.13619422912597656, 0.1424102783203125, 0.14862632751464844, 0.15484237670898438, 0.1610584259033203, 0.16727447509765625, 0.1734905242919922, 0.17970657348632812, 0.18592262268066406, 0.192138671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 1.0, 6.0, 4.0, 4.0, 10.0, 12.0, 12.0, 24.0, 30.0, 38.0, 45.0, 51.0, 82.0, 83.0, 100.0, 92.0, 95.0, 78.0, 51.0, 41.0, 30.0, 22.0, 21.0, 20.0, 11.0, 8.0, 11.0, 7.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.243322372436523e-05, -7.983669638633728e-05, -7.724016904830933e-05, -7.464364171028137e-05, -7.204711437225342e-05, -6.945058703422546e-05, -6.685405969619751e-05, -6.425753235816956e-05, -6.16610050201416e-05, -5.906447768211365e-05, -5.646795034408569e-05, -5.387142300605774e-05, -5.1274895668029785e-05, -4.867836833000183e-05, -4.608184099197388e-05, -4.348531365394592e-05, -4.088878631591797e-05, -3.8292258977890015e-05, -3.569573163986206e-05, -3.3099204301834106e-05, -3.0502676963806152e-05, -2.7906149625778198e-05, -2.5309622287750244e-05, -2.271309494972229e-05, -2.0116567611694336e-05, -1.7520040273666382e-05, -1.4923512935638428e-05, -1.2326985597610474e-05, -9.73045825958252e-06, -7.1339309215545654e-06, -4.537403583526611e-06, -1.9408762454986572e-06, 6.556510925292969e-07, 3.252178430557251e-06, 5.848705768585205e-06, 8.44523310661316e-06, 1.1041760444641113e-05, 1.3638287782669067e-05, 1.623481512069702e-05, 1.8831342458724976e-05, 2.142786979675293e-05, 2.4024397134780884e-05, 2.6620924472808838e-05, 2.9217451810836792e-05, 3.1813979148864746e-05, 3.44105064868927e-05, 3.7007033824920654e-05, 3.960356116294861e-05, 4.220008850097656e-05, 4.4796615839004517e-05, 4.739314317703247e-05, 4.9989670515060425e-05, 5.258619785308838e-05, 5.518272519111633e-05, 5.777925252914429e-05, 6.037577986717224e-05, 6.29723072052002e-05, 6.556883454322815e-05, 6.81653618812561e-05, 7.076188921928406e-05, 7.335841655731201e-05, 7.595494389533997e-05, 7.855147123336792e-05, 8.114799857139587e-05, 8.374452590942383e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 5.0, 14.0, 17.0, 25.0, 41.0, 65.0, 138.0, 238.0, 413.0, 794.0, 1484.0, 2918.0, 5932.0, 13249.0, 30159.0, 67553.0, 135779.0, 213356.0, 233029.0, 171118.0, 93386.0, 43045.0, 19033.0, 8412.0, 4079.0, 1979.0, 1069.0, 534.0, 289.0, 174.0, 90.0, 55.0, 24.0, 17.0, 20.0, 10.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.245849609375, -0.23681640625, -0.227783203125, -0.21875, -0.209716796875, -0.20068359375, -0.191650390625, -0.1826171875, -0.173583984375, -0.16455078125, -0.155517578125, -0.146484375, -0.137451171875, -0.12841796875, -0.119384765625, -0.1103515625, -0.101318359375, -0.09228515625, -0.083251953125, -0.07421875, -0.065185546875, -0.05615234375, -0.047119140625, -0.0380859375, -0.029052734375, -0.02001953125, -0.010986328125, -0.001953125, 0.007080078125, 0.01611328125, 0.025146484375, 0.0341796875, 0.043212890625, 0.05224609375, 0.061279296875, 0.0703125, 0.079345703125, 0.08837890625, 0.097412109375, 0.1064453125, 0.115478515625, 0.12451171875, 0.133544921875, 0.142578125, 0.151611328125, 0.16064453125, 0.169677734375, 0.1787109375, 0.187744140625, 0.19677734375, 0.205810546875, 0.21484375, 0.223876953125, 0.23291015625, 0.241943359375, 0.2509765625, 0.260009765625, 0.26904296875, 0.278076171875, 0.287109375, 0.296142578125, 0.30517578125, 0.314208984375, 0.3232421875, 0.332275390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 11.0, 4.0, 4.0, 3.0, 6.0, 11.0, 17.0, 17.0, 22.0, 30.0, 59.0, 42.0, 55.0, 51.0, 59.0, 66.0, 67.0, 64.0, 68.0, 61.0, 53.0, 51.0, 41.0, 33.0, 24.0, 32.0, 13.0, 8.0, 10.0, 6.0, 5.0, 6.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34228515625, -0.3329734802246094, -0.32366180419921875, -0.3143501281738281, -0.3050384521484375, -0.2957267761230469, -0.28641510009765625, -0.2771034240722656, -0.267791748046875, -0.2584800720214844, -0.24916839599609375, -0.23985671997070312, -0.2305450439453125, -0.22123336791992188, -0.21192169189453125, -0.20261001586914062, -0.19329833984375, -0.18398666381835938, -0.17467498779296875, -0.16536331176757812, -0.1560516357421875, -0.14673995971679688, -0.13742828369140625, -0.12811660766601562, -0.118804931640625, -0.10949325561523438, -0.10018157958984375, -0.09086990356445312, -0.0815582275390625, -0.07224655151367188, -0.06293487548828125, -0.053623199462890625, -0.0443115234375, -0.034999847412109375, -0.02568817138671875, -0.016376495361328125, -0.0070648193359375, 0.002246856689453125, 0.01155853271484375, 0.020870208740234375, 0.030181884765625, 0.039493560791015625, 0.04880523681640625, 0.058116912841796875, 0.0674285888671875, 0.07674026489257812, 0.08605194091796875, 0.09536361694335938, 0.10467529296875, 0.11398696899414062, 0.12329864501953125, 0.13261032104492188, 0.1419219970703125, 0.15123367309570312, 0.16054534912109375, 0.16985702514648438, 0.179168701171875, 0.18848037719726562, 0.19779205322265625, 0.20710372924804688, 0.2164154052734375, 0.22572708129882812, 0.23503875732421875, 0.24435043334960938, 0.253662109375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 14.0, 15.0, 35.0, 23.0, 40.0, 49.0, 58.0, 74.0, 75.0, 96.0, 86.0, 81.0, 90.0, 64.0, 47.0, 41.0, 34.0, 30.0, 13.0, 12.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.165337562561035, -5.0510101318359375, -4.936683177947998, -4.8223557472229, -4.708028316497803, -4.593700885772705, -4.479373931884766, -4.365046501159668, -4.25071907043457, -4.136391639709473, -4.022064685821533, -3.9077372550964355, -3.793409824371338, -3.6790826320648193, -3.564755439758301, -3.450428009033203, -3.3361008167266846, -3.221773624420166, -3.1074461936950684, -2.99311900138855, -2.878791570663452, -2.7644643783569336, -2.650136947631836, -2.5358097553253174, -2.421482563018799, -2.3071553707122803, -2.1928279399871826, -2.078500747680664, -1.9641733169555664, -1.8498461246490479, -1.7355188131332397, -1.6211915016174316, -1.506864070892334, -1.3925367593765259, -1.2782094478607178, -1.1638822555541992, -1.0495548248291016, -0.9352275729179382, -0.8209003210067749, -0.7065730094909668, -0.5922456979751587, -0.4779183864593506, -0.36359110474586487, -0.24926382303237915, -0.13493651151657104, -0.02060920000076294, 0.09371805191040039, 0.2080453634262085, 0.3223726749420166, 0.4366999864578247, 0.5510272979736328, 0.6653545498847961, 0.7796818614006042, 0.8940091729164124, 1.0083364248275757, 1.1226637363433838, 1.236991047859192, 1.351318359375, 1.465645670890808, 1.5799729824066162, 1.6943001747131348, 1.8086276054382324, 1.922954797744751, 2.0372819900512695, 2.151609420776367]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 4.0, 7.0, 5.0, 6.0, 10.0, 17.0, 19.0, 16.0, 17.0, 18.0, 18.0, 26.0, 35.0, 31.0, 32.0, 37.0, 41.0, 35.0, 42.0, 44.0, 41.0, 42.0, 38.0, 33.0, 43.0, 28.0, 31.0, 34.0, 19.0, 33.0, 33.0, 34.0, 24.0, 6.0, 11.0, 15.0, 14.0, 18.0, 5.0, 11.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.139646530151367, -3.030673027038574, -2.9216995239257812, -2.8127260208129883, -2.7037525177001953, -2.5947790145874023, -2.4858055114746094, -2.3768320083618164, -2.2678585052490234, -2.1588850021362305, -2.0499114990234375, -1.9409379959106445, -1.8319644927978516, -1.7229909896850586, -1.6140176057815552, -1.5050441026687622, -1.3960707187652588, -1.2870972156524658, -1.1781237125396729, -1.0691502094268799, -0.9601767659187317, -0.8512032628059387, -0.7422298192977905, -0.6332563161849976, -0.5242828130722046, -0.4153093099594116, -0.30633583664894104, -0.19736236333847046, -0.08838886022567749, 0.02058464288711548, 0.12955808639526367, 0.23853158950805664, 0.3475048542022705, 0.4564783573150635, 0.5654518604278564, 0.6744253039360046, 0.7833988070487976, 0.8923723101615906, 1.0013457536697388, 1.1103192567825317, 1.2192927598953247, 1.3282662630081177, 1.4372397661209106, 1.546213150024414, 1.655186653137207, 1.76416015625, 1.873133659362793, 1.982107162475586, 2.091080665588379, 2.200054168701172, 2.309027671813965, 2.418001174926758, 2.526974678039551, 2.6359481811523438, 2.7449216842651367, 2.8538951873779297, 2.9628686904907227, 3.0718421936035156, 3.1808156967163086, 3.2897891998291016, 3.3987627029418945, 3.5077362060546875, 3.6167097091674805, 3.7256832122802734, 3.8346564769744873]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 11.0, 20.0, 14.0, 25.0, 42.0, 65.0, 109.0, 222.0, 414.0, 1007.0, 2819.0, 8744.0, 34391.0, 189913.0, 1406660.0, 2113413.0, 357765.0, 57806.0, 13864.0, 4328.0, 1460.0, 591.0, 258.0, 123.0, 60.0, 39.0, 33.0, 20.0, 18.0, 11.0, 10.0, 6.0, 4.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0654296875, -1.0359649658203125, -1.006500244140625, -0.9770355224609375, -0.94757080078125, -0.9181060791015625, -0.888641357421875, -0.8591766357421875, -0.8297119140625, -0.8002471923828125, -0.770782470703125, -0.7413177490234375, -0.71185302734375, -0.6823883056640625, -0.652923583984375, -0.6234588623046875, -0.593994140625, -0.5645294189453125, -0.535064697265625, -0.5055999755859375, -0.47613525390625, -0.4466705322265625, -0.417205810546875, -0.3877410888671875, -0.3582763671875, -0.3288116455078125, -0.299346923828125, -0.2698822021484375, -0.24041748046875, -0.2109527587890625, -0.181488037109375, -0.1520233154296875, -0.12255859375, -0.0930938720703125, -0.063629150390625, -0.0341644287109375, -0.00469970703125, 0.0247650146484375, 0.054229736328125, 0.0836944580078125, 0.1131591796875, 0.1426239013671875, 0.172088623046875, 0.2015533447265625, 0.23101806640625, 0.2604827880859375, 0.289947509765625, 0.3194122314453125, 0.348876953125, 0.3783416748046875, 0.407806396484375, 0.4372711181640625, 0.46673583984375, 0.4962005615234375, 0.525665283203125, 0.5551300048828125, 0.5845947265625, 0.6140594482421875, 0.643524169921875, 0.6729888916015625, 0.70245361328125, 0.7319183349609375, 0.761383056640625, 0.7908477783203125, 0.8203125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 3.0, 5.0, 7.0, 11.0, 6.0, 23.0, 23.0, 35.0, 33.0, 34.0, 45.0, 48.0, 62.0, 56.0, 60.0, 54.0, 39.0, 60.0, 57.0, 36.0, 42.0, 30.0, 31.0, 37.0, 26.0, 28.0, 25.0, 25.0, 14.0, 8.0, 12.0, 10.0, 5.0, 4.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.6787109375, -0.6614799499511719, -0.6442489624023438, -0.6270179748535156, -0.6097869873046875, -0.5925559997558594, -0.5753250122070312, -0.5580940246582031, -0.540863037109375, -0.5236320495605469, -0.5064010620117188, -0.4891700744628906, -0.4719390869140625, -0.4547080993652344, -0.43747711181640625, -0.4202461242675781, -0.40301513671875, -0.3857841491699219, -0.36855316162109375, -0.3513221740722656, -0.3340911865234375, -0.3168601989746094, -0.29962921142578125, -0.2823982238769531, -0.265167236328125, -0.24793624877929688, -0.23070526123046875, -0.21347427368164062, -0.1962432861328125, -0.17901229858398438, -0.16178131103515625, -0.14455032348632812, -0.1273193359375, -0.11008834838867188, -0.09285736083984375, -0.07562637329101562, -0.0583953857421875, -0.041164398193359375, -0.02393341064453125, -0.006702423095703125, 0.010528564453125, 0.027759552001953125, 0.04499053955078125, 0.062221527099609375, 0.0794525146484375, 0.09668350219726562, 0.11391448974609375, 0.13114547729492188, 0.14837646484375, 0.16560745239257812, 0.18283843994140625, 0.20006942749023438, 0.2173004150390625, 0.23453140258789062, 0.25176239013671875, 0.2689933776855469, 0.286224365234375, 0.3034553527832031, 0.32068634033203125, 0.3379173278808594, 0.3551483154296875, 0.3723793029785156, 0.38961029052734375, 0.4068412780761719, 0.424072265625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 4.0, 12.0, 14.0, 17.0, 17.0, 27.0, 34.0, 68.0, 93.0, 178.0, 329.0, 746.0, 1695.0, 5170.0, 18048.0, 74717.0, 346941.0, 1426956.0, 1715263.0, 469387.0, 100683.0, 23545.0, 6431.0, 2151.0, 822.0, 359.0, 198.0, 134.0, 79.0, 36.0, 29.0, 24.0, 14.0, 16.0, 8.0, 6.0, 12.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8330078125, -0.8062210083007812, -0.7794342041015625, -0.7526473999023438, -0.725860595703125, -0.6990737915039062, -0.6722869873046875, -0.6455001831054688, -0.61871337890625, -0.5919265747070312, -0.5651397705078125, -0.5383529663085938, -0.511566162109375, -0.48477935791015625, -0.4579925537109375, -0.43120574951171875, -0.4044189453125, -0.37763214111328125, -0.3508453369140625, -0.32405853271484375, -0.297271728515625, -0.27048492431640625, -0.2436981201171875, -0.21691131591796875, -0.19012451171875, -0.16333770751953125, -0.1365509033203125, -0.10976409912109375, -0.082977294921875, -0.05619049072265625, -0.0294036865234375, -0.00261688232421875, 0.024169921875, 0.05095672607421875, 0.0777435302734375, 0.10453033447265625, 0.131317138671875, 0.15810394287109375, 0.1848907470703125, 0.21167755126953125, 0.23846435546875, 0.26525115966796875, 0.2920379638671875, 0.31882476806640625, 0.345611572265625, 0.37239837646484375, 0.3991851806640625, 0.42597198486328125, 0.4527587890625, 0.47954559326171875, 0.5063323974609375, 0.5331192016601562, 0.559906005859375, 0.5866928100585938, 0.6134796142578125, 0.6402664184570312, 0.66705322265625, 0.6938400268554688, 0.7206268310546875, 0.7474136352539062, 0.774200439453125, 0.8009872436523438, 0.8277740478515625, 0.8545608520507812, 0.88134765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 11.0, 11.0, 12.0, 24.0, 22.0, 44.0, 69.0, 70.0, 89.0, 117.0, 153.0, 227.0, 263.0, 328.0, 347.0, 438.0, 404.0, 319.0, 279.0, 211.0, 164.0, 113.0, 85.0, 82.0, 51.0, 37.0, 25.0, 24.0, 7.0, 15.0, 6.0, 8.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72021484375, -0.69873046875, -0.67724609375, -0.65576171875, -0.63427734375, -0.61279296875, -0.59130859375, -0.56982421875, -0.54833984375, -0.52685546875, -0.50537109375, -0.48388671875, -0.46240234375, -0.44091796875, -0.41943359375, -0.39794921875, -0.37646484375, -0.35498046875, -0.33349609375, -0.31201171875, -0.29052734375, -0.26904296875, -0.24755859375, -0.22607421875, -0.20458984375, -0.18310546875, -0.16162109375, -0.14013671875, -0.11865234375, -0.09716796875, -0.07568359375, -0.05419921875, -0.03271484375, -0.01123046875, 0.01025390625, 0.03173828125, 0.05322265625, 0.07470703125, 0.09619140625, 0.11767578125, 0.13916015625, 0.16064453125, 0.18212890625, 0.20361328125, 0.22509765625, 0.24658203125, 0.26806640625, 0.28955078125, 0.31103515625, 0.33251953125, 0.35400390625, 0.37548828125, 0.39697265625, 0.41845703125, 0.43994140625, 0.46142578125, 0.48291015625, 0.50439453125, 0.52587890625, 0.54736328125, 0.56884765625, 0.59033203125, 0.61181640625, 0.63330078125, 0.65478515625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 12.0, 13.0, 31.0, 35.0, 38.0, 53.0, 66.0, 95.0, 107.0, 107.0, 102.0, 84.0, 77.0, 58.0, 41.0, 31.0, 22.0, 10.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.374434471130371, -3.2557883262634277, -3.1371421813964844, -3.01849627494812, -2.8998501300811768, -2.7812039852142334, -2.66255784034729, -2.543911933898926, -2.4252657890319824, -2.306619644165039, -2.1879734992980957, -2.0693275928497314, -1.950681447982788, -1.8320353031158447, -1.7133891582489014, -1.5947431325912476, -1.4760969877243042, -1.3574508428573608, -1.238804817199707, -1.1201586723327637, -1.0015126466751099, -0.8828665018081665, -0.7642204165458679, -0.6455743312835693, -0.5269282460212708, -0.40828216075897217, -0.2896360754966736, -0.1709899604320526, -0.05234387516975403, 0.06630223989486694, 0.18494832515716553, 0.3035944104194641, 0.4222404956817627, 0.5408865809440613, 0.6595326662063599, 0.7781788110733032, 0.896824836730957, 1.0154709815979004, 1.1341171264648438, 1.2527631521224976, 1.3714091777801514, 1.4900553226470947, 1.6087013483047485, 1.727347493171692, 1.8459935188293457, 1.964639663696289, 2.0832858085632324, 2.201931953430176, 2.320578098297119, 2.4392242431640625, 2.557870388031006, 2.67651629447937, 2.7951624393463135, 2.913808584213257, 3.0324547290802, 3.1511006355285645, 3.269746780395508, 3.388392925262451, 3.5070390701293945, 3.625684976577759, 3.744331121444702, 3.8629772663116455, 3.981623411178589, 4.100269317626953, 4.2189154624938965]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 7.0, 4.0, 10.0, 13.0, 9.0, 11.0, 14.0, 21.0, 17.0, 26.0, 32.0, 32.0, 25.0, 36.0, 36.0, 33.0, 41.0, 29.0, 37.0, 43.0, 39.0, 50.0, 59.0, 29.0, 39.0, 39.0, 32.0, 38.0, 29.0, 25.0, 21.0, 23.0, 24.0, 12.0, 11.0, 11.0, 9.0, 8.0, 7.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.135352611541748, -2.058927536010742, -1.9825023412704468, -1.9060771465301514, -1.8296520709991455, -1.7532269954681396, -1.6768018007278442, -1.6003766059875488, -1.523951530456543, -1.447526454925537, -1.3711012601852417, -1.2946760654449463, -1.2182509899139404, -1.1418259143829346, -1.0654007196426392, -0.9889755845069885, -0.9125504493713379, -0.8361253142356873, -0.7597001791000366, -0.683275043964386, -0.6068499088287354, -0.5304247736930847, -0.4539996385574341, -0.37757450342178345, -0.3011493682861328, -0.22472423315048218, -0.14829909801483154, -0.07187396287918091, 0.0045511722564697266, 0.08097630739212036, 0.157401442527771, 0.23382657766342163, 0.31025147438049316, 0.3866766095161438, 0.46310174465179443, 0.5395268797874451, 0.6159520149230957, 0.6923771500587463, 0.768802285194397, 0.8452274203300476, 0.9216525554656982, 0.9980776906013489, 1.0745028257369995, 1.150928020477295, 1.2273530960083008, 1.3037781715393066, 1.380203366279602, 1.4566285610198975, 1.5330536365509033, 1.6094787120819092, 1.6859039068222046, 1.7623291015625, 1.8387541770935059, 1.9151792526245117, 1.9916044473648071, 2.0680296421051025, 2.1444547176361084, 2.2208797931671143, 2.297305107116699, 2.373730182647705, 2.450155258178711, 2.526580333709717, 2.6030054092407227, 2.6794307231903076, 2.7558557987213135]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 10.0, 24.0, 33.0, 43.0, 88.0, 125.0, 273.0, 565.0, 1066.0, 2285.0, 4765.0, 9941.0, 22112.0, 49570.0, 112199.0, 223060.0, 278580.0, 185131.0, 87824.0, 38297.0, 17267.0, 7972.0, 3766.0, 1777.0, 848.0, 431.0, 217.0, 106.0, 63.0, 40.0, 31.0, 18.0, 8.0, 5.0, 1.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6357421875, -1.5866851806640625, -1.537628173828125, -1.4885711669921875, -1.43951416015625, -1.3904571533203125, -1.341400146484375, -1.2923431396484375, -1.2432861328125, -1.1942291259765625, -1.145172119140625, -1.0961151123046875, -1.04705810546875, -0.9980010986328125, -0.948944091796875, -0.8998870849609375, -0.850830078125, -0.8017730712890625, -0.752716064453125, -0.7036590576171875, -0.65460205078125, -0.6055450439453125, -0.556488037109375, -0.5074310302734375, -0.4583740234375, -0.4093170166015625, -0.360260009765625, -0.3112030029296875, -0.26214599609375, -0.2130889892578125, -0.164031982421875, -0.1149749755859375, -0.06591796875, -0.0168609619140625, 0.032196044921875, 0.0812530517578125, 0.13031005859375, 0.1793670654296875, 0.228424072265625, 0.2774810791015625, 0.3265380859375, 0.3755950927734375, 0.424652099609375, 0.4737091064453125, 0.52276611328125, 0.5718231201171875, 0.620880126953125, 0.6699371337890625, 0.718994140625, 0.7680511474609375, 0.817108154296875, 0.8661651611328125, 0.91522216796875, 0.9642791748046875, 1.013336181640625, 1.0623931884765625, 1.1114501953125, 1.1605072021484375, 1.209564208984375, 1.2586212158203125, 1.30767822265625, 1.3567352294921875, 1.405792236328125, 1.4548492431640625, 1.50390625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 1.0, 7.0, 6.0, 7.0, 14.0, 24.0, 26.0, 32.0, 30.0, 41.0, 47.0, 46.0, 47.0, 63.0, 62.0, 66.0, 54.0, 51.0, 49.0, 53.0, 41.0, 43.0, 35.0, 29.0, 29.0, 26.0, 13.0, 17.0, 15.0, 11.0, 7.0, 4.0, 3.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.66015625, -0.6427803039550781, -0.6254043579101562, -0.6080284118652344, -0.5906524658203125, -0.5732765197753906, -0.5559005737304688, -0.5385246276855469, -0.521148681640625, -0.5037727355957031, -0.48639678955078125, -0.4690208435058594, -0.4516448974609375, -0.4342689514160156, -0.41689300537109375, -0.3995170593261719, -0.38214111328125, -0.3647651672363281, -0.34738922119140625, -0.3300132751464844, -0.3126373291015625, -0.2952613830566406, -0.27788543701171875, -0.2605094909667969, -0.243133544921875, -0.22575759887695312, -0.20838165283203125, -0.19100570678710938, -0.1736297607421875, -0.15625381469726562, -0.13887786865234375, -0.12150192260742188, -0.1041259765625, -0.08675003051757812, -0.06937408447265625, -0.051998138427734375, -0.0346221923828125, -0.017246246337890625, 0.00012969970703125, 0.017505645751953125, 0.034881591796875, 0.052257537841796875, 0.06963348388671875, 0.08700942993164062, 0.1043853759765625, 0.12176132202148438, 0.13913726806640625, 0.15651321411132812, 0.17388916015625, 0.19126510620117188, 0.20864105224609375, 0.22601699829101562, 0.2433929443359375, 0.2607688903808594, 0.27814483642578125, 0.2955207824707031, 0.312896728515625, 0.3302726745605469, 0.34764862060546875, 0.3650245666503906, 0.3824005126953125, 0.3997764587402344, 0.41715240478515625, 0.4345283508300781, 0.451904296875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 4.0, 3.0, 7.0, 11.0, 13.0, 18.0, 27.0, 37.0, 43.0, 73.0, 117.0, 194.0, 331.0, 659.0, 1304.0, 2969.0, 6975.0, 17119.0, 43483.0, 102824.0, 200784.0, 268836.0, 211113.0, 110832.0, 47871.0, 19165.0, 7584.0, 3144.0, 1380.0, 679.0, 373.0, 192.0, 120.0, 99.0, 62.0, 36.0, 29.0, 16.0, 14.0, 13.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.361328125, -1.3195037841796875, -1.277679443359375, -1.2358551025390625, -1.19403076171875, -1.1522064208984375, -1.110382080078125, -1.0685577392578125, -1.0267333984375, -0.9849090576171875, -0.943084716796875, -0.9012603759765625, -0.85943603515625, -0.8176116943359375, -0.775787353515625, -0.7339630126953125, -0.692138671875, -0.6503143310546875, -0.608489990234375, -0.5666656494140625, -0.52484130859375, -0.4830169677734375, -0.441192626953125, -0.3993682861328125, -0.3575439453125, -0.3157196044921875, -0.273895263671875, -0.2320709228515625, -0.19024658203125, -0.1484222412109375, -0.106597900390625, -0.0647735595703125, -0.02294921875, 0.0188751220703125, 0.060699462890625, 0.1025238037109375, 0.14434814453125, 0.1861724853515625, 0.227996826171875, 0.2698211669921875, 0.3116455078125, 0.3534698486328125, 0.395294189453125, 0.4371185302734375, 0.47894287109375, 0.5207672119140625, 0.562591552734375, 0.6044158935546875, 0.646240234375, 0.6880645751953125, 0.729888916015625, 0.7717132568359375, 0.81353759765625, 0.8553619384765625, 0.897186279296875, 0.9390106201171875, 0.9808349609375, 1.0226593017578125, 1.064483642578125, 1.1063079833984375, 1.14813232421875, 1.1899566650390625, 1.231781005859375, 1.2736053466796875, 1.3154296875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 6.0, 13.0, 15.0, 11.0, 24.0, 18.0, 26.0, 28.0, 35.0, 36.0, 48.0, 38.0, 45.0, 50.0, 51.0, 45.0, 63.0, 56.0, 40.0, 30.0, 46.0, 44.0, 36.0, 30.0, 27.0, 25.0, 23.0, 19.0, 12.0, 9.0, 7.0, 10.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4248046875, -1.38055419921875, -1.3363037109375, -1.29205322265625, -1.247802734375, -1.20355224609375, -1.1593017578125, -1.11505126953125, -1.07080078125, -1.02655029296875, -0.9822998046875, -0.93804931640625, -0.893798828125, -0.84954833984375, -0.8052978515625, -0.76104736328125, -0.716796875, -0.67254638671875, -0.6282958984375, -0.58404541015625, -0.539794921875, -0.49554443359375, -0.4512939453125, -0.40704345703125, -0.36279296875, -0.31854248046875, -0.2742919921875, -0.23004150390625, -0.185791015625, -0.14154052734375, -0.0972900390625, -0.05303955078125, -0.0087890625, 0.03546142578125, 0.0797119140625, 0.12396240234375, 0.168212890625, 0.21246337890625, 0.2567138671875, 0.30096435546875, 0.34521484375, 0.38946533203125, 0.4337158203125, 0.47796630859375, 0.522216796875, 0.56646728515625, 0.6107177734375, 0.65496826171875, 0.69921875, 0.74346923828125, 0.7877197265625, 0.83197021484375, 0.876220703125, 0.92047119140625, 0.9647216796875, 1.00897216796875, 1.05322265625, 1.09747314453125, 1.1417236328125, 1.18597412109375, 1.230224609375, 1.27447509765625, 1.3187255859375, 1.36297607421875, 1.4072265625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 3.0, 7.0, 12.0, 16.0, 24.0, 39.0, 68.0, 107.0, 152.0, 312.0, 489.0, 817.0, 1283.0, 2341.0, 3847.0, 6480.0, 11201.0, 19331.0, 32870.0, 55923.0, 90832.0, 138066.0, 175418.0, 170916.0, 130125.0, 84251.0, 50805.0, 30373.0, 17390.0, 10470.0, 5934.0, 3544.0, 2026.0, 1177.0, 769.0, 458.0, 265.0, 150.0, 89.0, 69.0, 40.0, 18.0, 17.0, 18.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.38623046875, -0.3754768371582031, -0.36472320556640625, -0.3539695739746094, -0.3432159423828125, -0.3324623107910156, -0.32170867919921875, -0.3109550476074219, -0.300201416015625, -0.2894477844238281, -0.27869415283203125, -0.2679405212402344, -0.2571868896484375, -0.24643325805664062, -0.23567962646484375, -0.22492599487304688, -0.21417236328125, -0.20341873168945312, -0.19266510009765625, -0.18191146850585938, -0.1711578369140625, -0.16040420532226562, -0.14965057373046875, -0.13889694213867188, -0.128143310546875, -0.11738967895507812, -0.10663604736328125, -0.09588241577148438, -0.0851287841796875, -0.07437515258789062, -0.06362152099609375, -0.052867889404296875, -0.0421142578125, -0.031360626220703125, -0.02060699462890625, -0.009853363037109375, 0.0009002685546875, 0.011653900146484375, 0.02240753173828125, 0.033161163330078125, 0.043914794921875, 0.054668426513671875, 0.06542205810546875, 0.07617568969726562, 0.0869293212890625, 0.09768295288085938, 0.10843658447265625, 0.11919021606445312, 0.12994384765625, 0.14069747924804688, 0.15145111083984375, 0.16220474243164062, 0.1729583740234375, 0.18371200561523438, 0.19446563720703125, 0.20521926879882812, 0.215972900390625, 0.22672653198242188, 0.23748016357421875, 0.24823379516601562, 0.2589874267578125, 0.2697410583496094, 0.28049468994140625, 0.2912483215332031, 0.302001953125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 7.0, 12.0, 10.0, 18.0, 30.0, 30.0, 45.0, 59.0, 72.0, 85.0, 93.0, 99.0, 103.0, 81.0, 65.0, 36.0, 25.0, 26.0, 16.0, 19.0, 11.0, 8.0, 8.0, 5.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001647472381591797, -0.00016005337238311768, -0.00015535950660705566, -0.00015066564083099365, -0.00014597177505493164, -0.00014127790927886963, -0.00013658404350280762, -0.0001318901777267456, -0.0001271963119506836, -0.00012250244617462158, -0.00011780858039855957, -0.00011311471462249756, -0.00010842084884643555, -0.00010372698307037354, -9.903311729431152e-05, -9.433925151824951e-05, -8.96453857421875e-05, -8.495151996612549e-05, -8.025765419006348e-05, -7.556378841400146e-05, -7.086992263793945e-05, -6.617605686187744e-05, -6.148219108581543e-05, -5.678832530975342e-05, -5.2094459533691406e-05, -4.7400593757629395e-05, -4.270672798156738e-05, -3.801286220550537e-05, -3.331899642944336e-05, -2.8625130653381348e-05, -2.3931264877319336e-05, -1.9237399101257324e-05, -1.4543533325195312e-05, -9.8496675491333e-06, -5.155801773071289e-06, -4.6193599700927734e-07, 4.231929779052734e-06, 8.925795555114746e-06, 1.3619661331176758e-05, 1.831352710723877e-05, 2.300739288330078e-05, 2.7701258659362793e-05, 3.2395124435424805e-05, 3.7088990211486816e-05, 4.178285598754883e-05, 4.647672176361084e-05, 5.117058753967285e-05, 5.586445331573486e-05, 6.0558319091796875e-05, 6.525218486785889e-05, 6.99460506439209e-05, 7.463991641998291e-05, 7.933378219604492e-05, 8.402764797210693e-05, 8.872151374816895e-05, 9.341537952423096e-05, 9.810924530029297e-05, 0.00010280311107635498, 0.00010749697685241699, 0.000112190842628479, 0.00011688470840454102, 0.00012157857418060303, 0.00012627243995666504, 0.00013096630573272705, 0.00013566017150878906]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 9.0, 9.0, 7.0, 8.0, 17.0, 25.0, 41.0, 70.0, 126.0, 198.0, 353.0, 771.0, 1482.0, 3235.0, 7089.0, 16625.0, 40058.0, 97966.0, 216839.0, 304819.0, 203815.0, 90486.0, 36912.0, 15027.0, 6634.0, 2972.0, 1422.0, 736.0, 338.0, 196.0, 97.0, 69.0, 39.0, 21.0, 22.0, 8.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.56396484375, -0.5480575561523438, -0.5321502685546875, -0.5162429809570312, -0.500335693359375, -0.48442840576171875, -0.4685211181640625, -0.45261383056640625, -0.43670654296875, -0.42079925537109375, -0.4048919677734375, -0.38898468017578125, -0.373077392578125, -0.35717010498046875, -0.3412628173828125, -0.32535552978515625, -0.3094482421875, -0.29354095458984375, -0.2776336669921875, -0.26172637939453125, -0.245819091796875, -0.22991180419921875, -0.2140045166015625, -0.19809722900390625, -0.18218994140625, -0.16628265380859375, -0.1503753662109375, -0.13446807861328125, -0.118560791015625, -0.10265350341796875, -0.0867462158203125, -0.07083892822265625, -0.054931640625, -0.03902435302734375, -0.0231170654296875, -0.00720977783203125, 0.008697509765625, 0.02460479736328125, 0.0405120849609375, 0.05641937255859375, 0.07232666015625, 0.08823394775390625, 0.1041412353515625, 0.12004852294921875, 0.135955810546875, 0.15186309814453125, 0.1677703857421875, 0.18367767333984375, 0.1995849609375, 0.21549224853515625, 0.2313995361328125, 0.24730682373046875, 0.263214111328125, 0.27912139892578125, 0.2950286865234375, 0.31093597412109375, 0.32684326171875, 0.34275054931640625, 0.3586578369140625, 0.37456512451171875, 0.390472412109375, 0.40637969970703125, 0.4222869873046875, 0.43819427490234375, 0.4541015625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 6.0, 8.0, 9.0, 12.0, 13.0, 11.0, 13.0, 33.0, 28.0, 38.0, 46.0, 80.0, 61.0, 78.0, 81.0, 78.0, 73.0, 66.0, 51.0, 51.0, 31.0, 32.0, 23.0, 17.0, 10.0, 9.0, 11.0, 6.0, 12.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.368896484375, -0.35562896728515625, -0.3423614501953125, -0.32909393310546875, -0.315826416015625, -0.30255889892578125, -0.2892913818359375, -0.27602386474609375, -0.26275634765625, -0.24948883056640625, -0.2362213134765625, -0.22295379638671875, -0.209686279296875, -0.19641876220703125, -0.1831512451171875, -0.16988372802734375, -0.1566162109375, -0.14334869384765625, -0.1300811767578125, -0.11681365966796875, -0.103546142578125, -0.09027862548828125, -0.0770111083984375, -0.06374359130859375, -0.05047607421875, -0.03720855712890625, -0.0239410400390625, -0.01067352294921875, 0.002593994140625, 0.01586151123046875, 0.0291290283203125, 0.04239654541015625, 0.0556640625, 0.06893157958984375, 0.0821990966796875, 0.09546661376953125, 0.108734130859375, 0.12200164794921875, 0.1352691650390625, 0.14853668212890625, 0.16180419921875, 0.17507171630859375, 0.1883392333984375, 0.20160675048828125, 0.214874267578125, 0.22814178466796875, 0.2414093017578125, 0.25467681884765625, 0.2679443359375, 0.28121185302734375, 0.2944793701171875, 0.30774688720703125, 0.321014404296875, 0.33428192138671875, 0.3475494384765625, 0.36081695556640625, 0.37408447265625, 0.38735198974609375, 0.4006195068359375, 0.41388702392578125, 0.427154541015625, 0.44042205810546875, 0.4536895751953125, 0.46695709228515625, 0.480224609375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 9.0, 17.0, 19.0, 29.0, 50.0, 60.0, 65.0, 96.0, 103.0, 110.0, 108.0, 92.0, 72.0, 56.0, 40.0, 26.0, 27.0, 14.0, 10.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.291038513183594, -8.096464157104492, -7.901888847351074, -7.707314491271973, -7.512739658355713, -7.318164825439453, -7.123589992523193, -6.929015159606934, -6.734440803527832, -6.539865970611572, -6.3452911376953125, -6.150716781616211, -5.956141948699951, -5.761567115783691, -5.566992282867432, -5.372417449951172, -5.177842617034912, -4.983267784118652, -4.788692951202393, -4.594118118286133, -4.399543762207031, -4.2049689292907715, -4.010394096374512, -3.815819263458252, -3.6212446689605713, -3.4266698360443115, -3.232095241546631, -3.037520408630371, -2.8429455757141113, -2.6483709812164307, -2.453796148300171, -2.2592215538024902, -2.0646471977233887, -1.8700724840164185, -1.6754977703094482, -1.4809229373931885, -1.2863482236862183, -1.091773509979248, -0.8971986770629883, -0.7026239633560181, -0.5080492496490479, -0.31347450613975525, -0.11889976263046265, 0.07567501068115234, 0.27024972438812256, 0.4648244380950928, 0.6593992710113525, 0.8539739847183228, 1.048548698425293, 1.2431234121322632, 1.4376981258392334, 1.6322729587554932, 1.8268476724624634, 2.0214223861694336, 2.2159972190856934, 2.410572052001953, 2.605146646499634, 2.7997214794158936, 2.994296073913574, 3.188870906829834, 3.3834457397460938, 3.5780203342437744, 3.772595167160034, 3.967169761657715, 4.161744594573975]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 7.0, 5.0, 12.0, 9.0, 14.0, 12.0, 7.0, 15.0, 26.0, 25.0, 29.0, 25.0, 37.0, 43.0, 42.0, 26.0, 32.0, 34.0, 42.0, 54.0, 53.0, 54.0, 39.0, 42.0, 28.0, 34.0, 34.0, 29.0, 26.0, 26.0, 22.0, 21.0, 18.0, 14.0, 10.0, 10.0, 14.0, 10.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.663191795349121, -4.525661468505859, -4.3881306648254395, -4.250600337982178, -4.113069534301758, -3.975539207458496, -3.8380086421966553, -3.7004780769348145, -3.5629475116729736, -3.425416946411133, -3.287886381149292, -3.150355815887451, -3.0128254890441895, -2.8752946853637695, -2.737764358520508, -2.600233793258667, -2.462703227996826, -2.3251726627349854, -2.1876420974731445, -2.0501115322113037, -1.9125810861587524, -1.7750505208969116, -1.6375200748443604, -1.4999895095825195, -1.3624589443206787, -1.224928379058838, -1.087397813796997, -0.9498673677444458, -0.812336802482605, -0.6748062372207642, -0.5372757315635681, -0.39974522590637207, -0.26221466064453125, -0.12468412518501282, 0.012846410274505615, 0.15037694573402405, 0.2879074811935425, 0.4254380464553833, 0.5629685521125793, 0.7004990577697754, 0.8380296230316162, 0.975560188293457, 1.1130907535552979, 1.2506211996078491, 1.38815176486969, 1.5256823301315308, 1.663212776184082, 1.8007433414459229, 1.9382739067077637, 2.0758044719696045, 2.2133350372314453, 2.350865602493286, 2.488396167755127, 2.6259264945983887, 2.7634570598602295, 2.9009876251220703, 3.038518190383911, 3.176048755645752, 3.3135793209075928, 3.4511098861694336, 3.5886402130126953, 3.7261710166931152, 3.863701343536377, 4.001232147216797, 4.138762474060059]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 7.0, 9.0, 4.0, 18.0, 24.0, 41.0, 48.0, 85.0, 147.0, 255.0, 469.0, 1021.0, 2238.0, 5214.0, 13675.0, 39916.0, 143967.0, 668621.0, 1924416.0, 1069167.0, 233141.0, 59547.0, 19168.0, 7337.0, 2994.0, 1318.0, 661.0, 339.0, 168.0, 95.0, 54.0, 32.0, 31.0, 14.0, 12.0, 9.0, 7.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0], "bins": [-1.0361328125, -1.010009765625, -0.98388671875, -0.957763671875, -0.931640625, -0.905517578125, -0.87939453125, -0.853271484375, -0.8271484375, -0.801025390625, -0.77490234375, -0.748779296875, -0.72265625, -0.696533203125, -0.67041015625, -0.644287109375, -0.6181640625, -0.592041015625, -0.56591796875, -0.539794921875, -0.513671875, -0.487548828125, -0.46142578125, -0.435302734375, -0.4091796875, -0.383056640625, -0.35693359375, -0.330810546875, -0.3046875, -0.278564453125, -0.25244140625, -0.226318359375, -0.2001953125, -0.174072265625, -0.14794921875, -0.121826171875, -0.095703125, -0.069580078125, -0.04345703125, -0.017333984375, 0.0087890625, 0.034912109375, 0.06103515625, 0.087158203125, 0.11328125, 0.139404296875, 0.16552734375, 0.191650390625, 0.2177734375, 0.243896484375, 0.27001953125, 0.296142578125, 0.322265625, 0.348388671875, 0.37451171875, 0.400634765625, 0.4267578125, 0.452880859375, 0.47900390625, 0.505126953125, 0.53125, 0.557373046875, 0.58349609375, 0.609619140625, 0.6357421875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 5.0, 10.0, 15.0, 9.0, 23.0, 26.0, 15.0, 37.0, 47.0, 39.0, 42.0, 43.0, 61.0, 58.0, 62.0, 65.0, 52.0, 54.0, 60.0, 42.0, 39.0, 39.0, 34.0, 32.0, 17.0, 16.0, 22.0, 11.0, 7.0, 7.0, 4.0, 3.0, 1.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76904296875, -0.7471389770507812, -0.7252349853515625, -0.7033309936523438, -0.681427001953125, -0.6595230102539062, -0.6376190185546875, -0.6157150268554688, -0.59381103515625, -0.5719070434570312, -0.5500030517578125, -0.5280990600585938, -0.506195068359375, -0.48429107666015625, -0.4623870849609375, -0.44048309326171875, -0.4185791015625, -0.39667510986328125, -0.3747711181640625, -0.35286712646484375, -0.330963134765625, -0.30905914306640625, -0.2871551513671875, -0.26525115966796875, -0.24334716796875, -0.22144317626953125, -0.1995391845703125, -0.17763519287109375, -0.155731201171875, -0.13382720947265625, -0.1119232177734375, -0.09001922607421875, -0.068115234375, -0.04621124267578125, -0.0243072509765625, -0.00240325927734375, 0.019500732421875, 0.04140472412109375, 0.0633087158203125, 0.08521270751953125, 0.10711669921875, 0.12902069091796875, 0.1509246826171875, 0.17282867431640625, 0.194732666015625, 0.21663665771484375, 0.2385406494140625, 0.26044464111328125, 0.2823486328125, 0.30425262451171875, 0.3261566162109375, 0.34806060791015625, 0.369964599609375, 0.39186859130859375, 0.4137725830078125, 0.43567657470703125, 0.45758056640625, 0.47948455810546875, 0.5013885498046875, 0.5232925415039062, 0.545196533203125, 0.5671005249023438, 0.5890045166015625, 0.6109085083007812, 0.6328125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 11.0, 6.0, 3.0, 11.0, 7.0, 11.0, 30.0, 26.0, 54.0, 68.0, 136.0, 189.0, 353.0, 619.0, 1116.0, 2352.0, 4886.0, 11323.0, 28686.0, 82537.0, 258473.0, 814809.0, 1642971.0, 907873.0, 290665.0, 92175.0, 32022.0, 12299.0, 5225.0, 2450.0, 1249.0, 712.0, 331.0, 215.0, 132.0, 94.0, 52.0, 34.0, 28.0, 19.0, 11.0, 10.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.724609375, -0.7000885009765625, -0.675567626953125, -0.6510467529296875, -0.62652587890625, -0.6020050048828125, -0.577484130859375, -0.5529632568359375, -0.5284423828125, -0.5039215087890625, -0.479400634765625, -0.4548797607421875, -0.43035888671875, -0.4058380126953125, -0.381317138671875, -0.3567962646484375, -0.332275390625, -0.3077545166015625, -0.283233642578125, -0.2587127685546875, -0.23419189453125, -0.2096710205078125, -0.185150146484375, -0.1606292724609375, -0.1361083984375, -0.1115875244140625, -0.087066650390625, -0.0625457763671875, -0.03802490234375, -0.0135040283203125, 0.011016845703125, 0.0355377197265625, 0.06005859375, 0.0845794677734375, 0.109100341796875, 0.1336212158203125, 0.15814208984375, 0.1826629638671875, 0.207183837890625, 0.2317047119140625, 0.2562255859375, 0.2807464599609375, 0.305267333984375, 0.3297882080078125, 0.35430908203125, 0.3788299560546875, 0.403350830078125, 0.4278717041015625, 0.452392578125, 0.4769134521484375, 0.501434326171875, 0.5259552001953125, 0.55047607421875, 0.5749969482421875, 0.599517822265625, 0.6240386962890625, 0.6485595703125, 0.6730804443359375, 0.697601318359375, 0.7221221923828125, 0.74664306640625, 0.7711639404296875, 0.795684814453125, 0.8202056884765625, 0.8447265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 6.0, 11.0, 12.0, 15.0, 16.0, 26.0, 55.0, 74.0, 85.0, 131.0, 171.0, 260.0, 365.0, 448.0, 496.0, 518.0, 376.0, 307.0, 197.0, 163.0, 107.0, 75.0, 59.0, 30.0, 20.0, 11.0, 11.0, 13.0, 7.0, 1.0, 5.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.134765625, -1.10113525390625, -1.0675048828125, -1.03387451171875, -1.000244140625, -0.96661376953125, -0.9329833984375, -0.89935302734375, -0.86572265625, -0.83209228515625, -0.7984619140625, -0.76483154296875, -0.731201171875, -0.69757080078125, -0.6639404296875, -0.63031005859375, -0.5966796875, -0.56304931640625, -0.5294189453125, -0.49578857421875, -0.462158203125, -0.42852783203125, -0.3948974609375, -0.36126708984375, -0.32763671875, -0.29400634765625, -0.2603759765625, -0.22674560546875, -0.193115234375, -0.15948486328125, -0.1258544921875, -0.09222412109375, -0.05859375, -0.02496337890625, 0.0086669921875, 0.04229736328125, 0.075927734375, 0.10955810546875, 0.1431884765625, 0.17681884765625, 0.21044921875, 0.24407958984375, 0.2777099609375, 0.31134033203125, 0.344970703125, 0.37860107421875, 0.4122314453125, 0.44586181640625, 0.4794921875, 0.51312255859375, 0.5467529296875, 0.58038330078125, 0.614013671875, 0.64764404296875, 0.6812744140625, 0.71490478515625, 0.74853515625, 0.78216552734375, 0.8157958984375, 0.84942626953125, 0.883056640625, 0.91668701171875, 0.9503173828125, 0.98394775390625, 1.017578125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 7.0, 3.0, 13.0, 20.0, 23.0, 35.0, 38.0, 42.0, 54.0, 72.0, 78.0, 86.0, 83.0, 86.0, 84.0, 59.0, 55.0, 54.0, 36.0, 19.0, 14.0, 16.0, 16.0, 6.0, 4.0, 7.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.2583112716674805, -2.1259701251983643, -1.993628740310669, -1.8612875938415527, -1.728946328163147, -1.5966050624847412, -1.464263916015625, -1.3319226503372192, -1.1995813846588135, -1.0672401189804077, -0.9348989129066467, -0.8025577068328857, -0.67021644115448, -0.5378751754760742, -0.40553396940231323, -0.27319276332855225, -0.14085149765014648, -0.00851026177406311, 0.12383097410202026, 0.25617220997810364, 0.388513445854187, 0.5208547115325928, 0.6531959176063538, 0.7855371236801147, 0.9178783893585205, 1.0502196550369263, 1.182560920715332, 1.3149020671844482, 1.447243332862854, 1.5795845985412598, 1.711925745010376, 1.8442670106887817, 1.9766082763671875, 2.1089494228363037, 2.241290807723999, 2.3736319541931152, 2.5059733390808105, 2.6383144855499268, 2.770655632019043, 2.9029970169067383, 3.0353381633758545, 3.1676793098449707, 3.300020694732666, 3.4323618412017822, 3.5647029876708984, 3.6970443725585938, 3.82938551902771, 3.961726665496826, 4.0940680503845215, 4.226409435272217, 4.358750343322754, 4.491091728210449, 4.6234331130981445, 4.75577449798584, 4.888115406036377, 5.020456790924072, 5.152797698974609, 5.285139083862305, 5.417479991912842, 5.549821376800537, 5.682162761688232, 5.8145036697387695, 5.946845054626465, 6.07918643951416, 6.2115278244018555]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 6.0, 4.0, 8.0, 8.0, 11.0, 5.0, 14.0, 16.0, 14.0, 16.0, 29.0, 24.0, 25.0, 29.0, 30.0, 48.0, 48.0, 38.0, 44.0, 51.0, 49.0, 50.0, 55.0, 35.0, 44.0, 38.0, 36.0, 48.0, 36.0, 29.0, 21.0, 20.0, 23.0, 3.0, 15.0, 8.0, 6.0, 8.0, 6.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7908551692962646, -3.6747348308563232, -3.558614730834961, -3.4424943923950195, -3.326374053955078, -3.2102537155151367, -3.0941333770751953, -2.978013277053833, -2.8618929386138916, -2.74577260017395, -2.629652500152588, -2.5135321617126465, -2.397411823272705, -2.2812914848327637, -2.1651711463928223, -2.04905104637146, -1.9329307079315186, -1.8168103694915771, -1.7006901502609253, -1.5845699310302734, -1.468449592590332, -1.3523292541503906, -1.2362090349197388, -1.120088815689087, -1.0039684772491455, -0.8878481984138489, -0.7717279195785522, -0.6556076407432556, -0.539487361907959, -0.42336708307266235, -0.3072468042373657, -0.1911265254020691, -0.07500600814819336, 0.04111427068710327, 0.1572345495223999, 0.27335482835769653, 0.38947510719299316, 0.5055953860282898, 0.6217156648635864, 0.7378359436988831, 0.8539562225341797, 0.9700765013694763, 1.086196780204773, 1.2023169994354248, 1.3184373378753662, 1.4345576763153076, 1.5506778955459595, 1.6667981147766113, 1.7829184532165527, 1.8990387916564941, 2.0151591300964355, 2.131279230117798, 2.2473995685577393, 2.3635199069976807, 2.479640007019043, 2.5957603454589844, 2.711880683898926, 2.828001022338867, 2.9441213607788086, 3.060241460800171, 3.1763617992401123, 3.2924821376800537, 3.408602237701416, 3.5247225761413574, 3.640842914581299]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 11.0, 8.0, 16.0, 21.0, 36.0, 35.0, 59.0, 102.0, 135.0, 236.0, 355.0, 625.0, 1072.0, 1939.0, 3261.0, 5729.0, 9774.0, 16690.0, 28914.0, 53039.0, 100637.0, 187754.0, 246169.0, 179182.0, 95997.0, 50368.0, 27819.0, 15870.0, 9493.0, 5531.0, 3143.0, 1802.0, 1138.0, 629.0, 345.0, 228.0, 122.0, 82.0, 55.0, 39.0, 27.0, 28.0, 15.0, 6.0, 10.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.0341796875, -1.0032730102539062, -0.9723663330078125, -0.9414596557617188, -0.910552978515625, -0.8796463012695312, -0.8487396240234375, -0.8178329467773438, -0.78692626953125, -0.7560195922851562, -0.7251129150390625, -0.6942062377929688, -0.663299560546875, -0.6323928833007812, -0.6014862060546875, -0.5705795288085938, -0.5396728515625, -0.5087661743164062, -0.4778594970703125, -0.44695281982421875, -0.416046142578125, -0.38513946533203125, -0.3542327880859375, -0.32332611083984375, -0.29241943359375, -0.26151275634765625, -0.2306060791015625, -0.19969940185546875, -0.168792724609375, -0.13788604736328125, -0.1069793701171875, -0.07607269287109375, -0.045166015625, -0.01425933837890625, 0.0166473388671875, 0.04755401611328125, 0.078460693359375, 0.10936737060546875, 0.1402740478515625, 0.17118072509765625, 0.20208740234375, 0.23299407958984375, 0.2639007568359375, 0.29480743408203125, 0.325714111328125, 0.35662078857421875, 0.3875274658203125, 0.41843414306640625, 0.4493408203125, 0.48024749755859375, 0.5111541748046875, 0.5420608520507812, 0.572967529296875, 0.6038742065429688, 0.6347808837890625, 0.6656875610351562, 0.69659423828125, 0.7275009155273438, 0.7584075927734375, 0.7893142700195312, 0.820220947265625, 0.8511276245117188, 0.8820343017578125, 0.9129409790039062, 0.94384765625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 6.0, 4.0, 4.0, 11.0, 13.0, 22.0, 22.0, 36.0, 36.0, 34.0, 36.0, 55.0, 48.0, 57.0, 68.0, 64.0, 49.0, 58.0, 59.0, 49.0, 44.0, 32.0, 44.0, 29.0, 28.0, 24.0, 14.0, 16.0, 12.0, 12.0, 6.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77783203125, -0.7567977905273438, -0.7357635498046875, -0.7147293090820312, -0.693695068359375, -0.6726608276367188, -0.6516265869140625, -0.6305923461914062, -0.60955810546875, -0.5885238647460938, -0.5674896240234375, -0.5464553833007812, -0.525421142578125, -0.5043869018554688, -0.4833526611328125, -0.46231842041015625, -0.4412841796875, -0.42024993896484375, -0.3992156982421875, -0.37818145751953125, -0.357147216796875, -0.33611297607421875, -0.3150787353515625, -0.29404449462890625, -0.27301025390625, -0.25197601318359375, -0.2309417724609375, -0.20990753173828125, -0.188873291015625, -0.16783905029296875, -0.1468048095703125, -0.12577056884765625, -0.104736328125, -0.08370208740234375, -0.0626678466796875, -0.04163360595703125, -0.020599365234375, 0.00043487548828125, 0.0214691162109375, 0.04250335693359375, 0.06353759765625, 0.08457183837890625, 0.1056060791015625, 0.12664031982421875, 0.147674560546875, 0.16870880126953125, 0.1897430419921875, 0.21077728271484375, 0.2318115234375, 0.25284576416015625, 0.2738800048828125, 0.29491424560546875, 0.315948486328125, 0.33698272705078125, 0.3580169677734375, 0.37905120849609375, 0.40008544921875, 0.42111968994140625, 0.4421539306640625, 0.46318817138671875, 0.484222412109375, 0.5052566528320312, 0.5262908935546875, 0.5473251342773438, 0.568359375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 9.0, 12.0, 7.0, 11.0, 22.0, 24.0, 39.0, 53.0, 87.0, 144.0, 217.0, 372.0, 1025.0, 3637.0, 14996.0, 66855.0, 294094.0, 479627.0, 144600.0, 32259.0, 7266.0, 1840.0, 595.0, 302.0, 168.0, 90.0, 59.0, 39.0, 29.0, 23.0, 17.0, 8.0, 9.0, 7.0, 6.0, 3.0, 3.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.345703125, -2.281005859375, -2.21630859375, -2.151611328125, -2.0869140625, -2.022216796875, -1.95751953125, -1.892822265625, -1.828125, -1.763427734375, -1.69873046875, -1.634033203125, -1.5693359375, -1.504638671875, -1.43994140625, -1.375244140625, -1.310546875, -1.245849609375, -1.18115234375, -1.116455078125, -1.0517578125, -0.987060546875, -0.92236328125, -0.857666015625, -0.79296875, -0.728271484375, -0.66357421875, -0.598876953125, -0.5341796875, -0.469482421875, -0.40478515625, -0.340087890625, -0.275390625, -0.210693359375, -0.14599609375, -0.081298828125, -0.0166015625, 0.048095703125, 0.11279296875, 0.177490234375, 0.2421875, 0.306884765625, 0.37158203125, 0.436279296875, 0.5009765625, 0.565673828125, 0.63037109375, 0.695068359375, 0.759765625, 0.824462890625, 0.88916015625, 0.953857421875, 1.0185546875, 1.083251953125, 1.14794921875, 1.212646484375, 1.27734375, 1.342041015625, 1.40673828125, 1.471435546875, 1.5361328125, 1.600830078125, 1.66552734375, 1.730224609375, 1.794921875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 14.0, 11.0, 12.0, 12.0, 13.0, 23.0, 26.0, 16.0, 30.0, 27.0, 26.0, 39.0, 42.0, 68.0, 42.0, 42.0, 40.0, 27.0, 47.0, 48.0, 46.0, 36.0, 45.0, 35.0, 32.0, 33.0, 31.0, 24.0, 28.0, 14.0, 11.0, 9.0, 11.0, 3.0, 7.0, 6.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.509765625, -1.4622955322265625, -1.414825439453125, -1.3673553466796875, -1.31988525390625, -1.2724151611328125, -1.224945068359375, -1.1774749755859375, -1.1300048828125, -1.0825347900390625, -1.035064697265625, -0.9875946044921875, -0.94012451171875, -0.8926544189453125, -0.845184326171875, -0.7977142333984375, -0.750244140625, -0.7027740478515625, -0.655303955078125, -0.6078338623046875, -0.56036376953125, -0.5128936767578125, -0.465423583984375, -0.4179534912109375, -0.3704833984375, -0.3230133056640625, -0.275543212890625, -0.2280731201171875, -0.18060302734375, -0.1331329345703125, -0.085662841796875, -0.0381927490234375, 0.00927734375, 0.0567474365234375, 0.104217529296875, 0.1516876220703125, 0.19915771484375, 0.2466278076171875, 0.294097900390625, 0.3415679931640625, 0.3890380859375, 0.4365081787109375, 0.483978271484375, 0.5314483642578125, 0.57891845703125, 0.6263885498046875, 0.673858642578125, 0.7213287353515625, 0.768798828125, 0.8162689208984375, 0.863739013671875, 0.9112091064453125, 0.95867919921875, 1.0061492919921875, 1.053619384765625, 1.1010894775390625, 1.1485595703125, 1.1960296630859375, 1.243499755859375, 1.2909698486328125, 1.33843994140625, 1.3859100341796875, 1.433380126953125, 1.4808502197265625, 1.5283203125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 9.0, 6.0, 7.0, 21.0, 20.0, 23.0, 53.0, 63.0, 101.0, 214.0, 335.0, 557.0, 920.0, 1694.0, 2942.0, 5040.0, 8675.0, 15192.0, 25940.0, 46092.0, 85549.0, 157558.0, 228310.0, 202168.0, 119765.0, 64007.0, 35010.0, 20461.0, 11694.0, 6858.0, 3972.0, 2221.0, 1273.0, 740.0, 400.0, 253.0, 140.0, 106.0, 68.0, 33.0, 23.0, 16.0, 10.0, 4.0, 3.0, 3.0, 9.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.430908203125, -0.4173431396484375, -0.403778076171875, -0.3902130126953125, -0.37664794921875, -0.3630828857421875, -0.349517822265625, -0.3359527587890625, -0.3223876953125, -0.3088226318359375, -0.295257568359375, -0.2816925048828125, -0.26812744140625, -0.2545623779296875, -0.240997314453125, -0.2274322509765625, -0.2138671875, -0.2003021240234375, -0.186737060546875, -0.1731719970703125, -0.15960693359375, -0.1460418701171875, -0.132476806640625, -0.1189117431640625, -0.1053466796875, -0.0917816162109375, -0.078216552734375, -0.0646514892578125, -0.05108642578125, -0.0375213623046875, -0.023956298828125, -0.0103912353515625, 0.003173828125, 0.0167388916015625, 0.030303955078125, 0.0438690185546875, 0.05743408203125, 0.0709991455078125, 0.084564208984375, 0.0981292724609375, 0.1116943359375, 0.1252593994140625, 0.138824462890625, 0.1523895263671875, 0.16595458984375, 0.1795196533203125, 0.193084716796875, 0.2066497802734375, 0.22021484375, 0.2337799072265625, 0.247344970703125, 0.2609100341796875, 0.27447509765625, 0.2880401611328125, 0.301605224609375, 0.3151702880859375, 0.3287353515625, 0.3423004150390625, 0.355865478515625, 0.3694305419921875, 0.38299560546875, 0.3965606689453125, 0.410125732421875, 0.4236907958984375, 0.437255859375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 7.0, 2.0, 4.0, 9.0, 6.0, 9.0, 6.0, 18.0, 17.0, 18.0, 23.0, 19.0, 33.0, 48.0, 63.0, 82.0, 93.0, 92.0, 85.0, 76.0, 49.0, 51.0, 34.0, 24.0, 19.0, 14.0, 16.0, 6.0, 10.0, 5.0, 3.0, 8.0, 7.0, 6.0, 3.0, 2.0, 5.0, 3.0, 5.0, 2.0, 4.0, 1.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.28640365600586e-05, -8.959788829088211e-05, -8.633174002170563e-05, -8.306559175252914e-05, -7.979944348335266e-05, -7.653329521417618e-05, -7.32671469449997e-05, -7.000099867582321e-05, -6.673485040664673e-05, -6.346870213747025e-05, -6.020255386829376e-05, -5.693640559911728e-05, -5.3670257329940796e-05, -5.040410906076431e-05, -4.713796079158783e-05, -4.3871812522411346e-05, -4.060566425323486e-05, -3.733951598405838e-05, -3.40733677148819e-05, -3.0807219445705414e-05, -2.754107117652893e-05, -2.4274922907352448e-05, -2.1008774638175964e-05, -1.774262636899948e-05, -1.4476478099822998e-05, -1.1210329830646515e-05, -7.944181561470032e-06, -4.678033292293549e-06, -1.4118850231170654e-06, 1.8542632460594177e-06, 5.120411515235901e-06, 8.386559784412384e-06, 1.1652708053588867e-05, 1.491885632276535e-05, 1.8185004591941833e-05, 2.1451152861118317e-05, 2.47173011302948e-05, 2.7983449399471283e-05, 3.1249597668647766e-05, 3.451574593782425e-05, 3.778189420700073e-05, 4.1048042476177216e-05, 4.43141907453537e-05, 4.758033901453018e-05, 5.0846487283706665e-05, 5.411263555288315e-05, 5.737878382205963e-05, 6.0644932091236115e-05, 6.39110803604126e-05, 6.717722862958908e-05, 7.044337689876556e-05, 7.370952516794205e-05, 7.697567343711853e-05, 8.024182170629501e-05, 8.35079699754715e-05, 8.677411824464798e-05, 9.004026651382446e-05, 9.330641478300095e-05, 9.657256305217743e-05, 9.983871132135391e-05, 0.0001031048595905304, 0.00010637100785970688, 0.00010963715612888336, 0.00011290330439805984, 0.00011616945266723633]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 6.0, 10.0, 12.0, 33.0, 29.0, 55.0, 90.0, 117.0, 208.0, 352.0, 664.0, 1267.0, 2686.0, 5731.0, 13270.0, 29175.0, 68690.0, 187337.0, 363788.0, 228212.0, 83489.0, 34661.0, 15532.0, 6776.0, 3062.0, 1491.0, 745.0, 379.0, 250.0, 140.0, 83.0, 70.0, 45.0, 30.0, 18.0, 15.0, 12.0, 10.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.599609375, -0.5806350708007812, -0.5616607666015625, -0.5426864624023438, -0.523712158203125, -0.5047378540039062, -0.4857635498046875, -0.46678924560546875, -0.44781494140625, -0.42884063720703125, -0.4098663330078125, -0.39089202880859375, -0.371917724609375, -0.35294342041015625, -0.3339691162109375, -0.31499481201171875, -0.2960205078125, -0.27704620361328125, -0.2580718994140625, -0.23909759521484375, -0.220123291015625, -0.20114898681640625, -0.1821746826171875, -0.16320037841796875, -0.14422607421875, -0.12525177001953125, -0.1062774658203125, -0.08730316162109375, -0.068328857421875, -0.04935455322265625, -0.0303802490234375, -0.01140594482421875, 0.007568359375, 0.02654266357421875, 0.0455169677734375, 0.06449127197265625, 0.083465576171875, 0.10243988037109375, 0.1214141845703125, 0.14038848876953125, 0.15936279296875, 0.17833709716796875, 0.1973114013671875, 0.21628570556640625, 0.235260009765625, 0.25423431396484375, 0.2732086181640625, 0.29218292236328125, 0.3111572265625, 0.33013153076171875, 0.3491058349609375, 0.36808013916015625, 0.387054443359375, 0.40602874755859375, 0.4250030517578125, 0.44397735595703125, 0.46295166015625, 0.48192596435546875, 0.5009002685546875, 0.5198745727539062, 0.538848876953125, 0.5578231811523438, 0.5767974853515625, 0.5957717895507812, 0.61474609375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 14.0, 9.0, 7.0, 17.0, 15.0, 17.0, 23.0, 21.0, 22.0, 30.0, 32.0, 55.0, 55.0, 59.0, 58.0, 74.0, 89.0, 72.0, 56.0, 38.0, 41.0, 36.0, 31.0, 28.0, 12.0, 16.0, 15.0, 7.0, 9.0, 4.0, 7.0, 6.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4384765625, -0.42369842529296875, -0.4089202880859375, -0.39414215087890625, -0.379364013671875, -0.36458587646484375, -0.3498077392578125, -0.33502960205078125, -0.32025146484375, -0.30547332763671875, -0.2906951904296875, -0.27591705322265625, -0.261138916015625, -0.24636077880859375, -0.2315826416015625, -0.21680450439453125, -0.2020263671875, -0.18724822998046875, -0.1724700927734375, -0.15769195556640625, -0.142913818359375, -0.12813568115234375, -0.1133575439453125, -0.09857940673828125, -0.08380126953125, -0.06902313232421875, -0.0542449951171875, -0.03946685791015625, -0.024688720703125, -0.00991058349609375, 0.0048675537109375, 0.01964569091796875, 0.034423828125, 0.04920196533203125, 0.0639801025390625, 0.07875823974609375, 0.093536376953125, 0.10831451416015625, 0.1230926513671875, 0.13787078857421875, 0.15264892578125, 0.16742706298828125, 0.1822052001953125, 0.19698333740234375, 0.211761474609375, 0.22653961181640625, 0.2413177490234375, 0.25609588623046875, 0.2708740234375, 0.28565216064453125, 0.3004302978515625, 0.31520843505859375, 0.329986572265625, 0.34476470947265625, 0.3595428466796875, 0.37432098388671875, 0.38909912109375, 0.40387725830078125, 0.4186553955078125, 0.43343353271484375, 0.448211669921875, 0.46298980712890625, 0.4777679443359375, 0.49254608154296875, 0.50732421875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 11.0, 10.0, 25.0, 27.0, 44.0, 63.0, 77.0, 103.0, 106.0, 107.0, 101.0, 98.0, 62.0, 64.0, 27.0, 31.0, 19.0, 5.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.739638328552246, -5.550715923309326, -5.361793518066406, -5.172871112823486, -4.983948707580566, -4.7950263023376465, -4.606103897094727, -4.417181015014648, -4.228259086608887, -4.039336681365967, -3.850414276123047, -3.661491870880127, -3.472569465637207, -3.283647060394287, -3.094724416732788, -2.905802011489868, -2.716879367828369, -2.527956962585449, -2.3390345573425293, -2.1501121520996094, -1.9611896276474, -1.77226722240448, -1.5833446979522705, -1.3944222927093506, -1.2054998874664307, -1.0165774822235107, -0.827655017375946, -0.6387325525283813, -0.4498101472854614, -0.2608877420425415, -0.07196521759033203, 0.11695718765258789, 0.3058795928955078, 0.4948020279407501, 0.6837244629859924, 0.8726469278335571, 1.061569333076477, 1.250491738319397, 1.4394142627716064, 1.6283366680145264, 1.8172590732574463, 2.006181478500366, 2.195103883743286, 2.384026527404785, 2.572948932647705, 2.761871337890625, 2.950793743133545, 3.139716148376465, 3.3286385536193848, 3.5175609588623047, 3.7064833641052246, 3.8954057693481445, 4.0843281745910645, 4.273250579833984, 4.4621734619140625, 4.651095390319824, 4.840018272399902, 5.028940677642822, 5.217863082885742, 5.406785488128662, 5.595707893371582, 5.784630298614502, 5.973552703857422, 6.1624755859375, 6.351397514343262]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 6.0, 4.0, 4.0, 2.0, 8.0, 7.0, 8.0, 8.0, 9.0, 11.0, 21.0, 21.0, 16.0, 19.0, 26.0, 35.0, 23.0, 31.0, 34.0, 27.0, 42.0, 36.0, 31.0, 45.0, 61.0, 39.0, 43.0, 43.0, 27.0, 33.0, 32.0, 37.0, 24.0, 25.0, 21.0, 18.0, 24.0, 21.0, 17.0, 17.0, 10.0, 10.0, 9.0, 10.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.052926540374756, -3.934877395629883, -3.8168282508850098, -3.6987788677215576, -3.5807297229766846, -3.4626805782318115, -3.3446311950683594, -3.2265820503234863, -3.1085329055786133, -2.9904837608337402, -2.872434616088867, -2.754385232925415, -2.636336088180542, -2.518286943435669, -2.400237560272217, -2.2821884155273438, -2.1641392707824707, -2.0460901260375977, -1.928040862083435, -1.8099915981292725, -1.6919424533843994, -1.5738933086395264, -1.4558440446853638, -1.3377947807312012, -1.2197456359863281, -1.101696491241455, -0.9836472272872925, -0.8655980229377747, -0.7475488185882568, -0.629499614238739, -0.5114504098892212, -0.39340120553970337, -0.27535200119018555, -0.15730279684066772, -0.0392535924911499, 0.07879561185836792, 0.19684481620788574, 0.31489402055740356, 0.4329432249069214, 0.5509924292564392, 0.669041633605957, 0.7870908379554749, 0.9051400423049927, 1.0231893062591553, 1.1412384510040283, 1.2592875957489014, 1.377336859703064, 1.4953861236572266, 1.6134352684020996, 1.7314844131469727, 1.8495336771011353, 1.9675829410552979, 2.085632085800171, 2.203681230545044, 2.321730613708496, 2.439779758453369, 2.557828903198242, 2.6758780479431152, 2.7939271926879883, 2.9119765758514404, 3.0300257205963135, 3.1480748653411865, 3.2661242485046387, 3.3841733932495117, 3.5022225379943848]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 11.0, 15.0, 33.0, 49.0, 54.0, 108.0, 164.0, 207.0, 333.0, 594.0, 933.0, 1537.0, 2661.0, 4830.0, 9349.0, 19329.0, 44527.0, 115126.0, 338284.0, 959199.0, 1488951.0, 780827.0, 263371.0, 91706.0, 36715.0, 16459.0, 8219.0, 4379.0, 2460.0, 1391.0, 898.0, 527.0, 329.0, 227.0, 153.0, 127.0, 55.0, 52.0, 22.0, 20.0, 16.0, 8.0, 8.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.66259765625, -0.6427536010742188, -0.6229095458984375, -0.6030654907226562, -0.583221435546875, -0.5633773803710938, -0.5435333251953125, -0.5236892700195312, -0.50384521484375, -0.48400115966796875, -0.4641571044921875, -0.44431304931640625, -0.424468994140625, -0.40462493896484375, -0.3847808837890625, -0.36493682861328125, -0.3450927734375, -0.32524871826171875, -0.3054046630859375, -0.28556060791015625, -0.265716552734375, -0.24587249755859375, -0.2260284423828125, -0.20618438720703125, -0.18634033203125, -0.16649627685546875, -0.1466522216796875, -0.12680816650390625, -0.106964111328125, -0.08712005615234375, -0.0672760009765625, -0.04743194580078125, -0.027587890625, -0.00774383544921875, 0.0121002197265625, 0.03194427490234375, 0.051788330078125, 0.07163238525390625, 0.0914764404296875, 0.11132049560546875, 0.13116455078125, 0.15100860595703125, 0.1708526611328125, 0.19069671630859375, 0.210540771484375, 0.23038482666015625, 0.2502288818359375, 0.27007293701171875, 0.2899169921875, 0.30976104736328125, 0.3296051025390625, 0.34944915771484375, 0.369293212890625, 0.38913726806640625, 0.4089813232421875, 0.42882537841796875, 0.44866943359375, 0.46851348876953125, 0.4883575439453125, 0.5082015991210938, 0.528045654296875, 0.5478897094726562, 0.5677337646484375, 0.5875778198242188, 0.607421875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 6.0, 5.0, 8.0, 14.0, 19.0, 11.0, 19.0, 22.0, 30.0, 38.0, 43.0, 44.0, 34.0, 48.0, 57.0, 40.0, 56.0, 51.0, 42.0, 50.0, 53.0, 45.0, 47.0, 33.0, 35.0, 30.0, 24.0, 15.0, 18.0, 15.0, 10.0, 9.0, 5.0, 5.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.705078125, -0.6855545043945312, -0.6660308837890625, -0.6465072631835938, -0.626983642578125, -0.6074600219726562, -0.5879364013671875, -0.5684127807617188, -0.54888916015625, -0.5293655395507812, -0.5098419189453125, -0.49031829833984375, -0.470794677734375, -0.45127105712890625, -0.4317474365234375, -0.41222381591796875, -0.3927001953125, -0.37317657470703125, -0.3536529541015625, -0.33412933349609375, -0.314605712890625, -0.29508209228515625, -0.2755584716796875, -0.25603485107421875, -0.23651123046875, -0.21698760986328125, -0.1974639892578125, -0.17794036865234375, -0.158416748046875, -0.13889312744140625, -0.1193695068359375, -0.09984588623046875, -0.080322265625, -0.06079864501953125, -0.0412750244140625, -0.02175140380859375, -0.002227783203125, 0.01729583740234375, 0.0368194580078125, 0.05634307861328125, 0.07586669921875, 0.09539031982421875, 0.1149139404296875, 0.13443756103515625, 0.153961181640625, 0.17348480224609375, 0.1930084228515625, 0.21253204345703125, 0.2320556640625, 0.25157928466796875, 0.2711029052734375, 0.29062652587890625, 0.310150146484375, 0.32967376708984375, 0.3491973876953125, 0.36872100830078125, 0.38824462890625, 0.40776824951171875, 0.4272918701171875, 0.44681549072265625, 0.466339111328125, 0.48586273193359375, 0.5053863525390625, 0.5249099731445312, 0.54443359375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 7.0, 7.0, 10.0, 16.0, 24.0, 44.0, 66.0, 105.0, 153.0, 255.0, 478.0, 885.0, 1815.0, 4144.0, 10674.0, 32850.0, 126209.0, 552259.0, 1870336.0, 1210069.0, 284315.0, 67456.0, 19494.0, 6844.0, 2824.0, 1297.0, 677.0, 370.0, 220.0, 138.0, 79.0, 55.0, 37.0, 16.0, 21.0, 6.0, 12.0, 3.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0], "bins": [-1.3857421875, -1.350006103515625, -1.31427001953125, -1.278533935546875, -1.2427978515625, -1.207061767578125, -1.17132568359375, -1.135589599609375, -1.099853515625, -1.064117431640625, -1.02838134765625, -0.992645263671875, -0.9569091796875, -0.921173095703125, -0.88543701171875, -0.849700927734375, -0.81396484375, -0.778228759765625, -0.74249267578125, -0.706756591796875, -0.6710205078125, -0.635284423828125, -0.59954833984375, -0.563812255859375, -0.528076171875, -0.492340087890625, -0.45660400390625, -0.420867919921875, -0.3851318359375, -0.349395751953125, -0.31365966796875, -0.277923583984375, -0.2421875, -0.206451416015625, -0.17071533203125, -0.134979248046875, -0.0992431640625, -0.063507080078125, -0.02777099609375, 0.007965087890625, 0.043701171875, 0.079437255859375, 0.11517333984375, 0.150909423828125, 0.1866455078125, 0.222381591796875, 0.25811767578125, 0.293853759765625, 0.32958984375, 0.365325927734375, 0.40106201171875, 0.436798095703125, 0.4725341796875, 0.508270263671875, 0.54400634765625, 0.579742431640625, 0.615478515625, 0.651214599609375, 0.68695068359375, 0.722686767578125, 0.7584228515625, 0.794158935546875, 0.82989501953125, 0.865631103515625, 0.9013671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 10.0, 8.0, 19.0, 32.0, 43.0, 64.0, 104.0, 168.0, 238.0, 361.0, 540.0, 662.0, 597.0, 413.0, 313.0, 172.0, 111.0, 65.0, 49.0, 37.0, 22.0, 12.0, 9.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8095703125, -1.765045166015625, -1.72052001953125, -1.675994873046875, -1.6314697265625, -1.586944580078125, -1.54241943359375, -1.497894287109375, -1.453369140625, -1.408843994140625, -1.36431884765625, -1.319793701171875, -1.2752685546875, -1.230743408203125, -1.18621826171875, -1.141693115234375, -1.09716796875, -1.052642822265625, -1.00811767578125, -0.963592529296875, -0.9190673828125, -0.874542236328125, -0.83001708984375, -0.785491943359375, -0.740966796875, -0.696441650390625, -0.65191650390625, -0.607391357421875, -0.5628662109375, -0.518341064453125, -0.47381591796875, -0.429290771484375, -0.384765625, -0.340240478515625, -0.29571533203125, -0.251190185546875, -0.2066650390625, -0.162139892578125, -0.11761474609375, -0.073089599609375, -0.028564453125, 0.015960693359375, 0.06048583984375, 0.105010986328125, 0.1495361328125, 0.194061279296875, 0.23858642578125, 0.283111572265625, 0.32763671875, 0.372161865234375, 0.41668701171875, 0.461212158203125, 0.5057373046875, 0.550262451171875, 0.59478759765625, 0.639312744140625, 0.683837890625, 0.728363037109375, 0.77288818359375, 0.817413330078125, 0.8619384765625, 0.906463623046875, 0.95098876953125, 0.995513916015625, 1.0400390625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 5.0, 9.0, 14.0, 16.0, 26.0, 40.0, 41.0, 54.0, 84.0, 80.0, 107.0, 121.0, 84.0, 79.0, 64.0, 45.0, 52.0, 26.0, 19.0, 18.0, 12.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.287752628326416, -3.1130199432373047, -2.9382874965667725, -2.763554811477661, -2.588822364807129, -2.4140896797180176, -2.2393569946289062, -2.064624309539795, -1.8898918628692627, -1.715159296989441, -1.5404267311096191, -1.3656940460205078, -1.190961480140686, -1.0162289142608643, -0.8414962291717529, -0.6667636632919312, -0.4920310974121094, -0.3172985017299652, -0.14256590604782104, 0.03216671943664551, 0.20689928531646729, 0.38163185119628906, 0.5563645362854004, 0.7310971021652222, 0.905829668045044, 1.0805622339248657, 1.2552947998046875, 1.4300274848937988, 1.6047600507736206, 1.7794926166534424, 1.9542253017425537, 2.128957748413086, 2.303689956665039, 2.4784226417541504, 2.6531550884246826, 2.827887773513794, 3.002620220184326, 3.1773529052734375, 3.352085590362549, 3.52681827545166, 3.7015507221221924, 3.8762834072113037, 4.051015853881836, 4.225748538970947, 4.400481224060059, 4.575213432312012, 4.749946594238281, 4.924678802490234, 5.099411487579346, 5.274144172668457, 5.448876857757568, 5.62360954284668, 5.798341751098633, 5.973074436187744, 6.1478071212768555, 6.322539806365967, 6.497272491455078, 6.6720051765441895, 6.846737861633301, 7.021470069885254, 7.196202754974365, 7.370935440063477, 7.545668125152588, 7.720400810241699, 7.895133018493652]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 8.0, 8.0, 7.0, 11.0, 9.0, 14.0, 10.0, 12.0, 18.0, 22.0, 22.0, 34.0, 29.0, 19.0, 46.0, 43.0, 41.0, 43.0, 43.0, 50.0, 56.0, 45.0, 29.0, 41.0, 45.0, 34.0, 33.0, 41.0, 22.0, 28.0, 28.0, 31.0, 16.0, 14.0, 16.0, 8.0, 5.0, 5.0, 4.0, 6.0, 0.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4336986541748047, -3.3201985359191895, -3.206698417663574, -3.09319806098938, -2.9796979427337646, -2.8661978244781494, -2.752697467803955, -2.63919734954834, -2.5256972312927246, -2.4121971130371094, -2.298696994781494, -2.1851966381073, -2.0716965198516846, -1.9581964015960693, -1.8446961641311646, -1.7311959266662598, -1.6176958084106445, -1.5041956901550293, -1.3906954526901245, -1.2771952152252197, -1.1636950969696045, -1.0501949787139893, -0.9366947412490845, -0.8231945633888245, -0.7096943855285645, -0.5961942076683044, -0.48269402980804443, -0.3691938519477844, -0.2556936740875244, -0.1421934962272644, -0.028693318367004395, 0.08480685949325562, 0.19830703735351562, 0.31180721521377563, 0.42530739307403564, 0.5388075709342957, 0.6523077487945557, 0.7658079266548157, 0.8793081045150757, 0.9928082823753357, 1.1063084602355957, 1.219808578491211, 1.3333088159561157, 1.4468090534210205, 1.5603091716766357, 1.673809289932251, 1.7873095273971558, 1.9008097648620605, 2.014309883117676, 2.127810001373291, 2.2413101196289062, 2.3548104763031006, 2.468310594558716, 2.581810712814331, 2.6953110694885254, 2.8088111877441406, 2.922311305999756, 3.035811424255371, 3.1493115425109863, 3.2628118991851807, 3.376312017440796, 3.489812135696411, 3.6033124923706055, 3.7168126106262207, 3.830312728881836]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 8.0, 4.0, 3.0, 17.0, 23.0, 32.0, 49.0, 90.0, 107.0, 224.0, 288.0, 461.0, 663.0, 1086.0, 1769.0, 2825.0, 4553.0, 7685.0, 12724.0, 21234.0, 36425.0, 62915.0, 109410.0, 175936.0, 210226.0, 162963.0, 98424.0, 56644.0, 32968.0, 19339.0, 11334.0, 6848.0, 4289.0, 2565.0, 1578.0, 1012.0, 618.0, 392.0, 299.0, 167.0, 115.0, 76.0, 49.0, 37.0, 31.0, 20.0, 11.0, 7.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.001953125, -0.9710311889648438, -0.9401092529296875, -0.9091873168945312, -0.878265380859375, -0.8473434448242188, -0.8164215087890625, -0.7854995727539062, -0.75457763671875, -0.7236557006835938, -0.6927337646484375, -0.6618118286132812, -0.630889892578125, -0.5999679565429688, -0.5690460205078125, -0.5381240844726562, -0.5072021484375, -0.47628021240234375, -0.4453582763671875, -0.41443634033203125, -0.383514404296875, -0.35259246826171875, -0.3216705322265625, -0.29074859619140625, -0.25982666015625, -0.22890472412109375, -0.1979827880859375, -0.16706085205078125, -0.136138916015625, -0.10521697998046875, -0.0742950439453125, -0.04337310791015625, -0.012451171875, 0.01847076416015625, 0.0493927001953125, 0.08031463623046875, 0.111236572265625, 0.14215850830078125, 0.1730804443359375, 0.20400238037109375, 0.23492431640625, 0.26584625244140625, 0.2967681884765625, 0.32769012451171875, 0.358612060546875, 0.38953399658203125, 0.4204559326171875, 0.45137786865234375, 0.4822998046875, 0.5132217407226562, 0.5441436767578125, 0.5750656127929688, 0.605987548828125, 0.6369094848632812, 0.6678314208984375, 0.6987533569335938, 0.72967529296875, 0.7605972290039062, 0.7915191650390625, 0.8224411010742188, 0.853363037109375, 0.8842849731445312, 0.9152069091796875, 0.9461288452148438, 0.97705078125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 6.0, 14.0, 16.0, 11.0, 21.0, 17.0, 23.0, 28.0, 38.0, 28.0, 46.0, 37.0, 53.0, 43.0, 44.0, 65.0, 47.0, 58.0, 50.0, 34.0, 48.0, 35.0, 31.0, 27.0, 34.0, 29.0, 21.0, 9.0, 13.0, 17.0, 14.0, 8.0, 4.0, 4.0, 7.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.66259765625, -0.6431427001953125, -0.623687744140625, -0.6042327880859375, -0.58477783203125, -0.5653228759765625, -0.545867919921875, -0.5264129638671875, -0.5069580078125, -0.4875030517578125, -0.468048095703125, -0.4485931396484375, -0.42913818359375, -0.4096832275390625, -0.390228271484375, -0.3707733154296875, -0.351318359375, -0.3318634033203125, -0.312408447265625, -0.2929534912109375, -0.27349853515625, -0.2540435791015625, -0.234588623046875, -0.2151336669921875, -0.1956787109375, -0.1762237548828125, -0.156768798828125, -0.1373138427734375, -0.11785888671875, -0.0984039306640625, -0.078948974609375, -0.0594940185546875, -0.0400390625, -0.0205841064453125, -0.001129150390625, 0.0183258056640625, 0.03778076171875, 0.0572357177734375, 0.076690673828125, 0.0961456298828125, 0.1156005859375, 0.1350555419921875, 0.154510498046875, 0.1739654541015625, 0.19342041015625, 0.2128753662109375, 0.232330322265625, 0.2517852783203125, 0.271240234375, 0.2906951904296875, 0.310150146484375, 0.3296051025390625, 0.34906005859375, 0.3685150146484375, 0.387969970703125, 0.4074249267578125, 0.4268798828125, 0.4463348388671875, 0.465789794921875, 0.4852447509765625, 0.50469970703125, 0.5241546630859375, 0.543609619140625, 0.5630645751953125, 0.58251953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 6.0, 6.0, 8.0, 9.0, 6.0, 18.0, 22.0, 40.0, 43.0, 56.0, 78.0, 149.0, 262.0, 567.0, 1455.0, 3550.0, 9838.0, 28513.0, 82114.0, 244122.0, 396558.0, 185347.0, 61792.0, 21482.0, 7579.0, 2725.0, 1059.0, 456.0, 274.0, 131.0, 81.0, 52.0, 49.0, 16.0, 19.0, 18.0, 11.0, 14.0, 3.0, 6.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6591796875, -1.5985565185546875, -1.537933349609375, -1.4773101806640625, -1.41668701171875, -1.3560638427734375, -1.295440673828125, -1.2348175048828125, -1.1741943359375, -1.1135711669921875, -1.052947998046875, -0.9923248291015625, -0.93170166015625, -0.8710784912109375, -0.810455322265625, -0.7498321533203125, -0.689208984375, -0.6285858154296875, -0.567962646484375, -0.5073394775390625, -0.44671630859375, -0.3860931396484375, -0.325469970703125, -0.2648468017578125, -0.2042236328125, -0.1436004638671875, -0.082977294921875, -0.0223541259765625, 0.03826904296875, 0.0988922119140625, 0.159515380859375, 0.2201385498046875, 0.28076171875, 0.3413848876953125, 0.402008056640625, 0.4626312255859375, 0.52325439453125, 0.5838775634765625, 0.644500732421875, 0.7051239013671875, 0.7657470703125, 0.8263702392578125, 0.886993408203125, 0.9476165771484375, 1.00823974609375, 1.0688629150390625, 1.129486083984375, 1.1901092529296875, 1.250732421875, 1.3113555908203125, 1.371978759765625, 1.4326019287109375, 1.49322509765625, 1.5538482666015625, 1.614471435546875, 1.6750946044921875, 1.7357177734375, 1.7963409423828125, 1.856964111328125, 1.9175872802734375, 1.97821044921875, 2.0388336181640625, 2.099456787109375, 2.1600799560546875, 2.220703125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 8.0, 10.0, 6.0, 9.0, 12.0, 12.0, 13.0, 16.0, 19.0, 20.0, 28.0, 22.0, 26.0, 40.0, 34.0, 32.0, 34.0, 39.0, 39.0, 28.0, 45.0, 42.0, 45.0, 40.0, 32.0, 33.0, 35.0, 24.0, 37.0, 20.0, 22.0, 26.0, 23.0, 17.0, 20.0, 12.0, 13.0, 10.0, 10.0, 4.0, 7.0, 9.0, 2.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.58984375, -1.5397186279296875, -1.489593505859375, -1.4394683837890625, -1.38934326171875, -1.3392181396484375, -1.289093017578125, -1.2389678955078125, -1.1888427734375, -1.1387176513671875, -1.088592529296875, -1.0384674072265625, -0.98834228515625, -0.9382171630859375, -0.888092041015625, -0.8379669189453125, -0.787841796875, -0.7377166748046875, -0.687591552734375, -0.6374664306640625, -0.58734130859375, -0.5372161865234375, -0.487091064453125, -0.4369659423828125, -0.3868408203125, -0.3367156982421875, -0.286590576171875, -0.2364654541015625, -0.18634033203125, -0.1362152099609375, -0.086090087890625, -0.0359649658203125, 0.01416015625, 0.0642852783203125, 0.114410400390625, 0.1645355224609375, 0.21466064453125, 0.2647857666015625, 0.314910888671875, 0.3650360107421875, 0.4151611328125, 0.4652862548828125, 0.515411376953125, 0.5655364990234375, 0.61566162109375, 0.6657867431640625, 0.715911865234375, 0.7660369873046875, 0.816162109375, 0.8662872314453125, 0.916412353515625, 0.9665374755859375, 1.01666259765625, 1.0667877197265625, 1.116912841796875, 1.1670379638671875, 1.2171630859375, 1.2672882080078125, 1.317413330078125, 1.3675384521484375, 1.41766357421875, 1.4677886962890625, 1.517913818359375, 1.5680389404296875, 1.6181640625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 3.0, 5.0, 10.0, 20.0, 29.0, 36.0, 47.0, 104.0, 146.0, 243.0, 317.0, 558.0, 890.0, 1412.0, 2525.0, 4081.0, 6706.0, 11210.0, 18629.0, 30892.0, 50507.0, 81846.0, 127121.0, 170456.0, 175321.0, 135562.0, 88917.0, 55479.0, 33775.0, 20387.0, 12412.0, 7417.0, 4589.0, 2674.0, 1660.0, 968.0, 641.0, 358.0, 218.0, 130.0, 110.0, 52.0, 32.0, 23.0, 16.0, 4.0, 6.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.425537109375, -0.4122772216796875, -0.399017333984375, -0.3857574462890625, -0.37249755859375, -0.3592376708984375, -0.345977783203125, -0.3327178955078125, -0.3194580078125, -0.3061981201171875, -0.292938232421875, -0.2796783447265625, -0.26641845703125, -0.2531585693359375, -0.239898681640625, -0.2266387939453125, -0.21337890625, -0.2001190185546875, -0.186859130859375, -0.1735992431640625, -0.16033935546875, -0.1470794677734375, -0.133819580078125, -0.1205596923828125, -0.1072998046875, -0.0940399169921875, -0.080780029296875, -0.0675201416015625, -0.05426025390625, -0.0410003662109375, -0.027740478515625, -0.0144805908203125, -0.001220703125, 0.0120391845703125, 0.025299072265625, 0.0385589599609375, 0.05181884765625, 0.0650787353515625, 0.078338623046875, 0.0915985107421875, 0.1048583984375, 0.1181182861328125, 0.131378173828125, 0.1446380615234375, 0.15789794921875, 0.1711578369140625, 0.184417724609375, 0.1976776123046875, 0.2109375, 0.2241973876953125, 0.237457275390625, 0.2507171630859375, 0.26397705078125, 0.2772369384765625, 0.290496826171875, 0.3037567138671875, 0.3170166015625, 0.3302764892578125, 0.343536376953125, 0.3567962646484375, 0.37005615234375, 0.3833160400390625, 0.396575927734375, 0.4098358154296875, 0.423095703125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 6.0, 7.0, 10.0, 5.0, 10.0, 9.0, 18.0, 18.0, 19.0, 27.0, 34.0, 32.0, 58.0, 60.0, 76.0, 79.0, 84.0, 72.0, 71.0, 47.0, 42.0, 37.0, 33.0, 28.0, 25.0, 15.0, 16.0, 4.0, 9.0, 13.0, 9.0, 1.0, 6.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013327598571777344, -0.0001289844512939453, -0.0001246929168701172, -0.00012040138244628906, -0.00011610984802246094, -0.00011181831359863281, -0.00010752677917480469, -0.00010323524475097656, -9.894371032714844e-05, -9.465217590332031e-05, -9.036064147949219e-05, -8.606910705566406e-05, -8.177757263183594e-05, -7.748603820800781e-05, -7.319450378417969e-05, -6.890296936035156e-05, -6.461143493652344e-05, -6.031990051269531e-05, -5.602836608886719e-05, -5.173683166503906e-05, -4.744529724121094e-05, -4.315376281738281e-05, -3.886222839355469e-05, -3.457069396972656e-05, -3.0279159545898438e-05, -2.5987625122070312e-05, -2.1696090698242188e-05, -1.7404556274414062e-05, -1.3113021850585938e-05, -8.821487426757812e-06, -4.5299530029296875e-06, -2.384185791015625e-07, 4.0531158447265625e-06, 8.344650268554688e-06, 1.2636184692382812e-05, 1.6927719116210938e-05, 2.1219253540039062e-05, 2.5510787963867188e-05, 2.9802322387695312e-05, 3.409385681152344e-05, 3.838539123535156e-05, 4.267692565917969e-05, 4.696846008300781e-05, 5.125999450683594e-05, 5.555152893066406e-05, 5.984306335449219e-05, 6.413459777832031e-05, 6.842613220214844e-05, 7.271766662597656e-05, 7.700920104980469e-05, 8.130073547363281e-05, 8.559226989746094e-05, 8.988380432128906e-05, 9.417533874511719e-05, 9.846687316894531e-05, 0.00010275840759277344, 0.00010704994201660156, 0.00011134147644042969, 0.00011563301086425781, 0.00011992454528808594, 0.00012421607971191406, 0.0001285076141357422, 0.0001327991485595703, 0.00013709068298339844, 0.00014138221740722656]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 5.0, 1.0, 9.0, 18.0, 8.0, 17.0, 27.0, 35.0, 51.0, 76.0, 100.0, 172.0, 296.0, 429.0, 664.0, 1157.0, 1937.0, 3445.0, 6132.0, 10679.0, 19762.0, 35942.0, 66699.0, 121483.0, 194455.0, 218700.0, 160817.0, 93170.0, 50782.0, 26894.0, 15169.0, 8343.0, 4661.0, 2596.0, 1465.0, 887.0, 523.0, 324.0, 231.0, 131.0, 89.0, 55.0, 43.0, 25.0, 22.0, 6.0, 7.0, 7.0, 10.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.441162109375, -0.4260902404785156, -0.41101837158203125, -0.3959465026855469, -0.3808746337890625, -0.3658027648925781, -0.35073089599609375, -0.3356590270996094, -0.320587158203125, -0.3055152893066406, -0.29044342041015625, -0.2753715515136719, -0.2602996826171875, -0.24522781372070312, -0.23015594482421875, -0.21508407592773438, -0.20001220703125, -0.18494033813476562, -0.16986846923828125, -0.15479660034179688, -0.1397247314453125, -0.12465286254882812, -0.10958099365234375, -0.09450912475585938, -0.079437255859375, -0.06436538696289062, -0.04929351806640625, -0.034221649169921875, -0.0191497802734375, -0.004077911376953125, 0.01099395751953125, 0.026065826416015625, 0.0411376953125, 0.056209564208984375, 0.07128143310546875, 0.08635330200195312, 0.1014251708984375, 0.11649703979492188, 0.13156890869140625, 0.14664077758789062, 0.161712646484375, 0.17678451538085938, 0.19185638427734375, 0.20692825317382812, 0.2220001220703125, 0.23707199096679688, 0.25214385986328125, 0.2672157287597656, 0.28228759765625, 0.2973594665527344, 0.31243133544921875, 0.3275032043457031, 0.3425750732421875, 0.3576469421386719, 0.37271881103515625, 0.3877906799316406, 0.402862548828125, 0.4179344177246094, 0.43300628662109375, 0.4480781555175781, 0.4631500244140625, 0.4782218933105469, 0.49329376220703125, 0.5083656311035156, 0.5234375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 7.0, 4.0, 9.0, 7.0, 5.0, 9.0, 6.0, 14.0, 18.0, 19.0, 25.0, 36.0, 28.0, 32.0, 51.0, 51.0, 56.0, 55.0, 55.0, 67.0, 67.0, 63.0, 35.0, 51.0, 29.0, 35.0, 23.0, 24.0, 12.0, 16.0, 19.0, 10.0, 12.0, 8.0, 9.0, 6.0, 5.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.428466796875, -0.4132575988769531, -0.39804840087890625, -0.3828392028808594, -0.3676300048828125, -0.3524208068847656, -0.33721160888671875, -0.3220024108886719, -0.306793212890625, -0.2915840148925781, -0.27637481689453125, -0.2611656188964844, -0.2459564208984375, -0.23074722290039062, -0.21553802490234375, -0.20032882690429688, -0.18511962890625, -0.16991043090820312, -0.15470123291015625, -0.13949203491210938, -0.1242828369140625, -0.10907363891601562, -0.09386444091796875, -0.07865524291992188, -0.063446044921875, -0.048236846923828125, -0.03302764892578125, -0.017818450927734375, -0.0026092529296875, 0.012599945068359375, 0.02780914306640625, 0.043018341064453125, 0.0582275390625, 0.07343673706054688, 0.08864593505859375, 0.10385513305664062, 0.1190643310546875, 0.13427352905273438, 0.14948272705078125, 0.16469192504882812, 0.179901123046875, 0.19511032104492188, 0.21031951904296875, 0.22552871704101562, 0.2407379150390625, 0.2559471130371094, 0.27115631103515625, 0.2863655090332031, 0.30157470703125, 0.3167839050292969, 0.33199310302734375, 0.3472023010253906, 0.3624114990234375, 0.3776206970214844, 0.39282989501953125, 0.4080390930175781, 0.423248291015625, 0.4384574890136719, 0.45366668701171875, 0.4688758850097656, 0.4840850830078125, 0.4992942810058594, 0.5145034790039062, 0.5297126770019531, 0.544921875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 9.0, 18.0, 25.0, 54.0, 109.0, 160.0, 166.0, 191.0, 120.0, 76.0, 45.0, 18.0, 12.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.12574577331543, -6.730582237243652, -6.335419178009033, -5.940255641937256, -5.545092582702637, -5.149929046630859, -4.754765510559082, -4.359602451324463, -3.9644391536712646, -3.5692758560180664, -3.174112558364868, -2.77894926071167, -2.3837857246398926, -1.9886225461959839, -1.593459129333496, -1.1982958316802979, -0.8031325340270996, -0.407969206571579, -0.01280587911605835, 0.38235747814178467, 0.7775207757949829, 1.1726840734481812, 1.567847490310669, 1.9630107879638672, 2.3581740856170654, 2.7533373832702637, 3.148500680923462, 3.54366397857666, 3.9388275146484375, 4.333990573883057, 4.729154109954834, 5.124317169189453, 5.5194807052612305, 5.914644241333008, 6.309807300567627, 6.704970836639404, 7.100133895874023, 7.495297431945801, 7.890460968017578, 8.285623550415039, 8.680787086486816, 9.075950622558594, 9.471114158630371, 9.866276741027832, 10.26144027709961, 10.656603813171387, 11.051767349243164, 11.446929931640625, 11.842094421386719, 12.237257957458496, 12.632421493530273, 13.027584075927734, 13.422747611999512, 13.817911148071289, 14.213074684143066, 14.608238220214844, 15.003400802612305, 15.398564338684082, 15.79372787475586, 16.18889045715332, 16.584054946899414, 16.979217529296875, 17.374380111694336, 17.76954460144043, 18.16470718383789]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 6.0, 11.0, 3.0, 7.0, 9.0, 8.0, 9.0, 7.0, 16.0, 12.0, 21.0, 21.0, 20.0, 30.0, 33.0, 32.0, 33.0, 44.0, 33.0, 50.0, 48.0, 36.0, 43.0, 44.0, 38.0, 37.0, 33.0, 34.0, 30.0, 23.0, 27.0, 33.0, 20.0, 31.0, 16.0, 18.0, 7.0, 17.0, 11.0, 18.0, 7.0, 9.0, 2.0, 6.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.15986442565918, -4.025243759155273, -3.890622615814209, -3.7560017108917236, -3.6213808059692383, -3.486760139465332, -3.3521392345428467, -3.2175183296203613, -3.082897424697876, -2.9482765197753906, -2.8136556148529053, -2.67903470993042, -2.5444140434265137, -2.409792900085449, -2.275172233581543, -2.1405513286590576, -2.0059304237365723, -1.871309518814087, -1.7366886138916016, -1.6020678281784058, -1.4674469232559204, -1.332826018333435, -1.1982052326202393, -1.063584327697754, -0.9289634227752686, -0.7943425178527832, -0.6597216725349426, -0.525100827217102, -0.3904799222946167, -0.25585901737213135, -0.12123817205429077, 0.013382673263549805, 0.14800405502319336, 0.2826249301433563, 0.4172458052635193, 0.5518666505813599, 0.6864875555038452, 0.8211084604263306, 0.9557293057441711, 1.0903501510620117, 1.224971055984497, 1.3595919609069824, 1.4942128658294678, 1.6288336515426636, 1.763454556465149, 1.8980754613876343, 2.03269624710083, 2.1673171520233154, 2.301938056945801, 2.436558961868286, 2.5711798667907715, 2.705800771713257, 2.840421676635742, 2.9750423431396484, 3.109663248062134, 3.244284152984619, 3.3789050579071045, 3.51352596282959, 3.648146867752075, 3.7827677726745605, 3.917388439178467, 4.052009582519531, 4.1866302490234375, 4.321250915527344, 4.455872058868408]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 7.0, 12.0, 14.0, 18.0, 26.0, 52.0, 82.0, 127.0, 291.0, 473.0, 1024.0, 2474.0, 5996.0, 16252.0, 49047.0, 172269.0, 693818.0, 2025447.0, 909561.0, 223102.0, 61417.0, 20080.0, 7068.0, 2940.0, 1280.0, 602.0, 324.0, 166.0, 108.0, 57.0, 35.0, 30.0, 19.0, 18.0, 8.0, 5.0, 2.0, 6.0, 4.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.142578125, -1.1104812622070312, -1.0783843994140625, -1.0462875366210938, -1.014190673828125, -0.9820938110351562, -0.9499969482421875, -0.9179000854492188, -0.88580322265625, -0.8537063598632812, -0.8216094970703125, -0.7895126342773438, -0.757415771484375, -0.7253189086914062, -0.6932220458984375, -0.6611251831054688, -0.6290283203125, -0.5969314575195312, -0.5648345947265625, -0.5327377319335938, -0.500640869140625, -0.46854400634765625, -0.4364471435546875, -0.40435028076171875, -0.37225341796875, -0.34015655517578125, -0.3080596923828125, -0.27596282958984375, -0.243865966796875, -0.21176910400390625, -0.1796722412109375, -0.14757537841796875, -0.115478515625, -0.08338165283203125, -0.0512847900390625, -0.01918792724609375, 0.012908935546875, 0.04500579833984375, 0.0771026611328125, 0.10919952392578125, 0.14129638671875, 0.17339324951171875, 0.2054901123046875, 0.23758697509765625, 0.269683837890625, 0.30178070068359375, 0.3338775634765625, 0.36597442626953125, 0.3980712890625, 0.43016815185546875, 0.4622650146484375, 0.49436187744140625, 0.526458740234375, 0.5585556030273438, 0.5906524658203125, 0.6227493286132812, 0.65484619140625, 0.6869430541992188, 0.7190399169921875, 0.7511367797851562, 0.783233642578125, 0.8153305053710938, 0.8474273681640625, 0.8795242309570312, 0.91162109375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 11.0, 8.0, 4.0, 10.0, 23.0, 13.0, 17.0, 21.0, 25.0, 26.0, 30.0, 42.0, 36.0, 39.0, 44.0, 31.0, 46.0, 46.0, 44.0, 40.0, 45.0, 36.0, 35.0, 35.0, 45.0, 37.0, 36.0, 24.0, 28.0, 21.0, 16.0, 13.0, 13.0, 15.0, 10.0, 7.0, 3.0, 10.0, 5.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.66259765625, -0.642822265625, -0.623046875, -0.603271484375, -0.58349609375, -0.563720703125, -0.5439453125, -0.524169921875, -0.50439453125, -0.484619140625, -0.46484375, -0.445068359375, -0.42529296875, -0.405517578125, -0.3857421875, -0.365966796875, -0.34619140625, -0.326416015625, -0.306640625, -0.286865234375, -0.26708984375, -0.247314453125, -0.2275390625, -0.207763671875, -0.18798828125, -0.168212890625, -0.1484375, -0.128662109375, -0.10888671875, -0.089111328125, -0.0693359375, -0.049560546875, -0.02978515625, -0.010009765625, 0.009765625, 0.029541015625, 0.04931640625, 0.069091796875, 0.0888671875, 0.108642578125, 0.12841796875, 0.148193359375, 0.16796875, 0.187744140625, 0.20751953125, 0.227294921875, 0.2470703125, 0.266845703125, 0.28662109375, 0.306396484375, 0.326171875, 0.345947265625, 0.36572265625, 0.385498046875, 0.4052734375, 0.425048828125, 0.44482421875, 0.464599609375, 0.484375, 0.504150390625, 0.52392578125, 0.543701171875, 0.5634765625, 0.583251953125, 0.60302734375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 7.0, 3.0, 9.0, 13.0, 26.0, 17.0, 19.0, 42.0, 56.0, 74.0, 120.0, 186.0, 337.0, 551.0, 1132.0, 2458.0, 6087.0, 19666.0, 80063.0, 418327.0, 2036870.0, 1321659.0, 236668.0, 48612.0, 12856.0, 4457.0, 1823.0, 873.0, 470.0, 262.0, 154.0, 116.0, 77.0, 43.0, 37.0, 21.0, 19.0, 19.0, 14.0, 7.0, 5.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.8740234375, -1.815155029296875, -1.75628662109375, -1.697418212890625, -1.6385498046875, -1.579681396484375, -1.52081298828125, -1.461944580078125, -1.403076171875, -1.344207763671875, -1.28533935546875, -1.226470947265625, -1.1676025390625, -1.108734130859375, -1.04986572265625, -0.990997314453125, -0.93212890625, -0.873260498046875, -0.81439208984375, -0.755523681640625, -0.6966552734375, -0.637786865234375, -0.57891845703125, -0.520050048828125, -0.461181640625, -0.402313232421875, -0.34344482421875, -0.284576416015625, -0.2257080078125, -0.166839599609375, -0.10797119140625, -0.049102783203125, 0.009765625, 0.068634033203125, 0.12750244140625, 0.186370849609375, 0.2452392578125, 0.304107666015625, 0.36297607421875, 0.421844482421875, 0.480712890625, 0.539581298828125, 0.59844970703125, 0.657318115234375, 0.7161865234375, 0.775054931640625, 0.83392333984375, 0.892791748046875, 0.95166015625, 1.010528564453125, 1.06939697265625, 1.128265380859375, 1.1871337890625, 1.246002197265625, 1.30487060546875, 1.363739013671875, 1.422607421875, 1.481475830078125, 1.54034423828125, 1.599212646484375, 1.6580810546875, 1.716949462890625, 1.77581787109375, 1.834686279296875, 1.8935546875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 6.0, 13.0, 27.0, 38.0, 42.0, 83.0, 115.0, 185.0, 239.0, 374.0, 546.0, 631.0, 585.0, 375.0, 288.0, 172.0, 118.0, 71.0, 64.0, 31.0, 22.0, 9.0, 8.0, 9.0, 1.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.001953125, -1.9502410888671875, -1.898529052734375, -1.8468170166015625, -1.79510498046875, -1.7433929443359375, -1.691680908203125, -1.6399688720703125, -1.5882568359375, -1.5365447998046875, -1.484832763671875, -1.4331207275390625, -1.38140869140625, -1.3296966552734375, -1.277984619140625, -1.2262725830078125, -1.174560546875, -1.1228485107421875, -1.071136474609375, -1.0194244384765625, -0.96771240234375, -0.9160003662109375, -0.864288330078125, -0.8125762939453125, -0.7608642578125, -0.7091522216796875, -0.657440185546875, -0.6057281494140625, -0.55401611328125, -0.5023040771484375, -0.450592041015625, -0.3988800048828125, -0.34716796875, -0.2954559326171875, -0.243743896484375, -0.1920318603515625, -0.14031982421875, -0.0886077880859375, -0.036895751953125, 0.0148162841796875, 0.0665283203125, 0.1182403564453125, 0.169952392578125, 0.2216644287109375, 0.27337646484375, 0.3250885009765625, 0.376800537109375, 0.4285125732421875, 0.480224609375, 0.5319366455078125, 0.583648681640625, 0.6353607177734375, 0.68707275390625, 0.7387847900390625, 0.790496826171875, 0.8422088623046875, 0.8939208984375, 0.9456329345703125, 0.997344970703125, 1.0490570068359375, 1.10076904296875, 1.1524810791015625, 1.204193115234375, 1.2559051513671875, 1.3076171875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 7.0, 12.0, 11.0, 11.0, 21.0, 29.0, 42.0, 60.0, 75.0, 96.0, 97.0, 78.0, 87.0, 88.0, 87.0, 59.0, 37.0, 38.0, 25.0, 16.0, 11.0, 7.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.661835670471191, -4.454137802124023, -4.2464399337768555, -4.0387420654296875, -3.8310444355010986, -3.6233468055725098, -3.415648937225342, -3.207951068878174, -3.000253200531006, -2.792555332183838, -2.584857702255249, -2.377159833908081, -2.169461965560913, -1.9617642164230347, -1.7540664672851562, -1.5463685989379883, -1.3386709690093994, -1.130973219871521, -0.923275351524353, -0.7155776023864746, -0.5078797936439514, -0.3001819849014282, -0.0924842357635498, 0.11521363258361816, 0.3229113817214966, 0.5306091904640198, 0.738306999206543, 0.9460047483444214, 1.1537024974822998, 1.3614003658294678, 1.5690981149673462, 1.7767959833145142, 1.9844937324523926, 2.1921916007995605, 2.3998892307281494, 2.6075870990753174, 2.8152849674224854, 3.022982597351074, 3.230680465698242, 3.43837833404541, 3.646076202392578, 3.853774070739746, 4.061471939086914, 4.269169807434082, 4.476867198944092, 4.68456506729126, 4.892262935638428, 5.099960803985596, 5.3076581954956055, 5.515356063842773, 5.723053932189941, 5.930751800537109, 6.138449192047119, 6.346147060394287, 6.553844928741455, 6.761542797088623, 6.969240665435791, 7.176938533782959, 7.384636402130127, 7.592333793640137, 7.800031661987305, 8.007729530334473, 8.21542739868164, 8.423125267028809, 8.630823135375977]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 10.0, 5.0, 9.0, 5.0, 9.0, 11.0, 16.0, 17.0, 19.0, 16.0, 33.0, 32.0, 19.0, 33.0, 30.0, 41.0, 51.0, 37.0, 40.0, 44.0, 40.0, 39.0, 42.0, 32.0, 52.0, 34.0, 28.0, 33.0, 26.0, 38.0, 24.0, 22.0, 21.0, 8.0, 16.0, 7.0, 13.0, 5.0, 12.0, 11.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-4.264338493347168, -4.136053562164307, -4.007768154144287, -3.879483222961426, -3.7511980533599854, -3.622912883758545, -3.4946279525756836, -3.366342782974243, -3.2380576133728027, -3.1097724437713623, -2.981487274169922, -2.8532023429870605, -2.72491717338562, -2.5966320037841797, -2.4683470726013184, -2.340061902999878, -2.2117767333984375, -2.083491563796997, -1.9552065134048462, -1.8269214630126953, -1.6986362934112549, -1.5703511238098145, -1.4420660734176636, -1.3137810230255127, -1.1854958534240723, -1.0572106838226318, -0.928925633430481, -0.8006405234336853, -0.6723554134368896, -0.544070303440094, -0.41578519344329834, -0.2875000834465027, -0.15921473503112793, -0.030929625034332275, 0.09735548496246338, 0.22564059495925903, 0.3539257049560547, 0.48221081495285034, 0.610495924949646, 0.7387810349464417, 0.8670661449432373, 0.995351254940033, 1.1236363649368286, 1.2519214153289795, 1.38020658493042, 1.5084917545318604, 1.6367768049240112, 1.765061855316162, 1.8933470249176025, 2.021632194519043, 2.1499171257019043, 2.2782022953033447, 2.406487464904785, 2.5347726345062256, 2.663057804107666, 2.7913427352905273, 2.9196279048919678, 3.047913074493408, 3.1761980056762695, 3.30448317527771, 3.4327683448791504, 3.561053514480591, 3.6893386840820312, 3.8176236152648926, 3.945908784866333]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 5.0, 7.0, 4.0, 9.0, 15.0, 22.0, 30.0, 45.0, 82.0, 122.0, 148.0, 259.0, 384.0, 624.0, 970.0, 1424.0, 2155.0, 3316.0, 4830.0, 7367.0, 10750.0, 16048.0, 24094.0, 37921.0, 63248.0, 111664.0, 179352.0, 203765.0, 149855.0, 87051.0, 50432.0, 31073.0, 20370.0, 13813.0, 9248.0, 6062.0, 4075.0, 2727.0, 1787.0, 1177.0, 795.0, 506.0, 338.0, 204.0, 140.0, 96.0, 51.0, 37.0, 23.0, 17.0, 14.0, 6.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7197265625, -0.6959609985351562, -0.6721954345703125, -0.6484298706054688, -0.624664306640625, -0.6008987426757812, -0.5771331787109375, -0.5533676147460938, -0.52960205078125, -0.5058364868164062, -0.4820709228515625, -0.45830535888671875, -0.434539794921875, -0.41077423095703125, -0.3870086669921875, -0.36324310302734375, -0.3394775390625, -0.31571197509765625, -0.2919464111328125, -0.26818084716796875, -0.244415283203125, -0.22064971923828125, -0.1968841552734375, -0.17311859130859375, -0.14935302734375, -0.12558746337890625, -0.1018218994140625, -0.07805633544921875, -0.054290771484375, -0.03052520751953125, -0.0067596435546875, 0.01700592041015625, 0.040771484375, 0.06453704833984375, 0.0883026123046875, 0.11206817626953125, 0.135833740234375, 0.15959930419921875, 0.1833648681640625, 0.20713043212890625, 0.23089599609375, 0.25466156005859375, 0.2784271240234375, 0.30219268798828125, 0.325958251953125, 0.34972381591796875, 0.3734893798828125, 0.39725494384765625, 0.4210205078125, 0.44478607177734375, 0.4685516357421875, 0.49231719970703125, 0.516082763671875, 0.5398483276367188, 0.5636138916015625, 0.5873794555664062, 0.61114501953125, 0.6349105834960938, 0.6586761474609375, 0.6824417114257812, 0.706207275390625, 0.7299728393554688, 0.7537384033203125, 0.7775039672851562, 0.80126953125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 8.0, 12.0, 4.0, 11.0, 13.0, 22.0, 12.0, 16.0, 25.0, 39.0, 41.0, 31.0, 29.0, 26.0, 45.0, 43.0, 35.0, 33.0, 43.0, 45.0, 41.0, 38.0, 43.0, 34.0, 29.0, 34.0, 39.0, 26.0, 23.0, 23.0, 17.0, 23.0, 12.0, 7.0, 21.0, 7.0, 11.0, 8.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0], "bins": [-0.69580078125, -0.6762924194335938, -0.6567840576171875, -0.6372756958007812, -0.617767333984375, -0.5982589721679688, -0.5787506103515625, -0.5592422485351562, -0.53973388671875, -0.5202255249023438, -0.5007171630859375, -0.48120880126953125, -0.461700439453125, -0.44219207763671875, -0.4226837158203125, -0.40317535400390625, -0.3836669921875, -0.36415863037109375, -0.3446502685546875, -0.32514190673828125, -0.305633544921875, -0.28612518310546875, -0.2666168212890625, -0.24710845947265625, -0.22760009765625, -0.20809173583984375, -0.1885833740234375, -0.16907501220703125, -0.149566650390625, -0.13005828857421875, -0.1105499267578125, -0.09104156494140625, -0.071533203125, -0.05202484130859375, -0.0325164794921875, -0.01300811767578125, 0.006500244140625, 0.02600860595703125, 0.0455169677734375, 0.06502532958984375, 0.08453369140625, 0.10404205322265625, 0.1235504150390625, 0.14305877685546875, 0.162567138671875, 0.18207550048828125, 0.2015838623046875, 0.22109222412109375, 0.2406005859375, 0.26010894775390625, 0.2796173095703125, 0.29912567138671875, 0.318634033203125, 0.33814239501953125, 0.3576507568359375, 0.37715911865234375, 0.39666748046875, 0.41617584228515625, 0.4356842041015625, 0.45519256591796875, 0.474700927734375, 0.49420928955078125, 0.5137176513671875, 0.5332260131835938, 0.552734375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 4.0, 11.0, 14.0, 19.0, 22.0, 30.0, 26.0, 48.0, 70.0, 110.0, 266.0, 637.0, 1739.0, 5315.0, 16099.0, 53728.0, 244382.0, 544961.0, 130736.0, 33901.0, 10566.0, 3615.0, 1239.0, 462.0, 209.0, 117.0, 64.0, 42.0, 22.0, 25.0, 23.0, 14.0, 8.0, 9.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.6171875, -2.540924072265625, -2.46466064453125, -2.388397216796875, -2.3121337890625, -2.235870361328125, -2.15960693359375, -2.083343505859375, -2.007080078125, -1.930816650390625, -1.85455322265625, -1.778289794921875, -1.7020263671875, -1.625762939453125, -1.54949951171875, -1.473236083984375, -1.39697265625, -1.320709228515625, -1.24444580078125, -1.168182373046875, -1.0919189453125, -1.015655517578125, -0.93939208984375, -0.863128662109375, -0.786865234375, -0.710601806640625, -0.63433837890625, -0.558074951171875, -0.4818115234375, -0.405548095703125, -0.32928466796875, -0.253021240234375, -0.1767578125, -0.100494384765625, -0.02423095703125, 0.052032470703125, 0.1282958984375, 0.204559326171875, 0.28082275390625, 0.357086181640625, 0.433349609375, 0.509613037109375, 0.58587646484375, 0.662139892578125, 0.7384033203125, 0.814666748046875, 0.89093017578125, 0.967193603515625, 1.04345703125, 1.119720458984375, 1.19598388671875, 1.272247314453125, 1.3485107421875, 1.424774169921875, 1.50103759765625, 1.577301025390625, 1.653564453125, 1.729827880859375, 1.80609130859375, 1.882354736328125, 1.9586181640625, 2.034881591796875, 2.11114501953125, 2.187408447265625, 2.263671875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 7.0, 7.0, 6.0, 13.0, 16.0, 9.0, 18.0, 21.0, 26.0, 31.0, 32.0, 38.0, 55.0, 56.0, 38.0, 44.0, 42.0, 45.0, 60.0, 54.0, 45.0, 41.0, 48.0, 37.0, 35.0, 28.0, 20.0, 22.0, 23.0, 20.0, 15.0, 10.0, 11.0, 5.0, 6.0, 1.0, 1.0, 5.0, 0.0, 1.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.078125, -2.00494384765625, -1.9317626953125, -1.85858154296875, -1.785400390625, -1.71221923828125, -1.6390380859375, -1.56585693359375, -1.49267578125, -1.41949462890625, -1.3463134765625, -1.27313232421875, -1.199951171875, -1.12677001953125, -1.0535888671875, -0.98040771484375, -0.9072265625, -0.83404541015625, -0.7608642578125, -0.68768310546875, -0.614501953125, -0.54132080078125, -0.4681396484375, -0.39495849609375, -0.32177734375, -0.24859619140625, -0.1754150390625, -0.10223388671875, -0.029052734375, 0.04412841796875, 0.1173095703125, 0.19049072265625, 0.263671875, 0.33685302734375, 0.4100341796875, 0.48321533203125, 0.556396484375, 0.62957763671875, 0.7027587890625, 0.77593994140625, 0.84912109375, 0.92230224609375, 0.9954833984375, 1.06866455078125, 1.141845703125, 1.21502685546875, 1.2882080078125, 1.36138916015625, 1.4345703125, 1.50775146484375, 1.5809326171875, 1.65411376953125, 1.727294921875, 1.80047607421875, 1.8736572265625, 1.94683837890625, 2.02001953125, 2.09320068359375, 2.1663818359375, 2.23956298828125, 2.312744140625, 2.38592529296875, 2.4591064453125, 2.53228759765625, 2.60546875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 0.0, 7.0, 4.0, 4.0, 5.0, 14.0, 21.0, 18.0, 31.0, 44.0, 83.0, 141.0, 203.0, 348.0, 638.0, 1031.0, 1738.0, 2928.0, 5043.0, 8804.0, 15078.0, 26171.0, 46661.0, 90145.0, 193206.0, 288317.0, 180248.0, 84722.0, 43483.0, 24746.0, 14245.0, 8482.0, 4859.0, 2932.0, 1609.0, 1003.0, 609.0, 330.0, 238.0, 137.0, 87.0, 51.0, 26.0, 21.0, 18.0, 9.0, 8.0, 4.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.564453125, -0.5452880859375, -0.526123046875, -0.5069580078125, -0.48779296875, -0.4686279296875, -0.449462890625, -0.4302978515625, -0.4111328125, -0.3919677734375, -0.372802734375, -0.3536376953125, -0.33447265625, -0.3153076171875, -0.296142578125, -0.2769775390625, -0.2578125, -0.2386474609375, -0.219482421875, -0.2003173828125, -0.18115234375, -0.1619873046875, -0.142822265625, -0.1236572265625, -0.1044921875, -0.0853271484375, -0.066162109375, -0.0469970703125, -0.02783203125, -0.0086669921875, 0.010498046875, 0.0296630859375, 0.048828125, 0.0679931640625, 0.087158203125, 0.1063232421875, 0.12548828125, 0.1446533203125, 0.163818359375, 0.1829833984375, 0.2021484375, 0.2213134765625, 0.240478515625, 0.2596435546875, 0.27880859375, 0.2979736328125, 0.317138671875, 0.3363037109375, 0.35546875, 0.3746337890625, 0.393798828125, 0.4129638671875, 0.43212890625, 0.4512939453125, 0.470458984375, 0.4896240234375, 0.5087890625, 0.5279541015625, 0.547119140625, 0.5662841796875, 0.58544921875, 0.6046142578125, 0.623779296875, 0.6429443359375, 0.662109375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 3.0, 4.0, 10.0, 9.0, 9.0, 14.0, 13.0, 17.0, 17.0, 29.0, 41.0, 84.0, 121.0, 149.0, 131.0, 77.0, 71.0, 47.0, 32.0, 25.0, 26.0, 13.0, 9.0, 4.0, 6.0, 9.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017189979553222656, -0.00016592629253864288, -0.0001599527895450592, -0.00015397928655147552, -0.00014800578355789185, -0.00014203228056430817, -0.0001360587775707245, -0.0001300852745771408, -0.00012411177158355713, -0.00011813826858997345, -0.00011216476559638977, -0.00010619126260280609, -0.00010021775960922241, -9.424425661563873e-05, -8.827075362205505e-05, -8.229725062847137e-05, -7.63237476348877e-05, -7.035024464130402e-05, -6.437674164772034e-05, -5.840323865413666e-05, -5.242973566055298e-05, -4.64562326669693e-05, -4.048272967338562e-05, -3.450922667980194e-05, -2.8535723686218262e-05, -2.2562220692634583e-05, -1.6588717699050903e-05, -1.0615214705467224e-05, -4.641711711883545e-06, 1.3317912817001343e-06, 7.3052942752838135e-06, 1.3278797268867493e-05, 1.9252300262451172e-05, 2.522580325603485e-05, 3.119930624961853e-05, 3.717280924320221e-05, 4.314631223678589e-05, 4.911981523036957e-05, 5.509331822395325e-05, 6.106682121753693e-05, 6.70403242111206e-05, 7.301382720470428e-05, 7.898733019828796e-05, 8.496083319187164e-05, 9.093433618545532e-05, 9.6907839179039e-05, 0.00010288134217262268, 0.00010885484516620636, 0.00011482834815979004, 0.00012080185115337372, 0.0001267753541469574, 0.00013274885714054108, 0.00013872236013412476, 0.00014469586312770844, 0.00015066936612129211, 0.0001566428691148758, 0.00016261637210845947, 0.00016858987510204315, 0.00017456337809562683, 0.0001805368810892105, 0.0001865103840827942, 0.00019248388707637787, 0.00019845739006996155, 0.00020443089306354523, 0.0002104043960571289]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 9.0, 20.0, 33.0, 37.0, 66.0, 101.0, 177.0, 304.0, 653.0, 1231.0, 2453.0, 5321.0, 11963.0, 26482.0, 59394.0, 148174.0, 366104.0, 258005.0, 94123.0, 40392.0, 17962.0, 8027.0, 3795.0, 1780.0, 901.0, 454.0, 255.0, 135.0, 87.0, 42.0, 32.0, 13.0, 10.0, 10.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.015625, -0.9887313842773438, -0.9618377685546875, -0.9349441528320312, -0.908050537109375, -0.8811569213867188, -0.8542633056640625, -0.8273696899414062, -0.80047607421875, -0.7735824584960938, -0.7466888427734375, -0.7197952270507812, -0.692901611328125, -0.6660079956054688, -0.6391143798828125, -0.6122207641601562, -0.5853271484375, -0.5584335327148438, -0.5315399169921875, -0.5046463012695312, -0.477752685546875, -0.45085906982421875, -0.4239654541015625, -0.39707183837890625, -0.37017822265625, -0.34328460693359375, -0.3163909912109375, -0.28949737548828125, -0.262603759765625, -0.23571014404296875, -0.2088165283203125, -0.18192291259765625, -0.155029296875, -0.12813568115234375, -0.1012420654296875, -0.07434844970703125, -0.047454833984375, -0.02056121826171875, 0.0063323974609375, 0.03322601318359375, 0.06011962890625, 0.08701324462890625, 0.1139068603515625, 0.14080047607421875, 0.167694091796875, 0.19458770751953125, 0.2214813232421875, 0.24837493896484375, 0.2752685546875, 0.30216217041015625, 0.3290557861328125, 0.35594940185546875, 0.382843017578125, 0.40973663330078125, 0.4366302490234375, 0.46352386474609375, 0.49041748046875, 0.5173110961914062, 0.5442047119140625, 0.5710983276367188, 0.597991943359375, 0.6248855590820312, 0.6517791748046875, 0.6786727905273438, 0.70556640625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 6.0, 9.0, 8.0, 10.0, 17.0, 26.0, 23.0, 43.0, 51.0, 69.0, 94.0, 147.0, 143.0, 109.0, 56.0, 52.0, 38.0, 32.0, 13.0, 16.0, 12.0, 5.0, 7.0, 7.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.966796875, -0.9295501708984375, -0.892303466796875, -0.8550567626953125, -0.81781005859375, -0.7805633544921875, -0.743316650390625, -0.7060699462890625, -0.6688232421875, -0.6315765380859375, -0.594329833984375, -0.5570831298828125, -0.51983642578125, -0.4825897216796875, -0.445343017578125, -0.4080963134765625, -0.370849609375, -0.3336029052734375, -0.296356201171875, -0.2591094970703125, -0.22186279296875, -0.1846160888671875, -0.147369384765625, -0.1101226806640625, -0.0728759765625, -0.0356292724609375, 0.001617431640625, 0.0388641357421875, 0.07611083984375, 0.1133575439453125, 0.150604248046875, 0.1878509521484375, 0.22509765625, 0.2623443603515625, 0.299591064453125, 0.3368377685546875, 0.37408447265625, 0.4113311767578125, 0.448577880859375, 0.4858245849609375, 0.5230712890625, 0.5603179931640625, 0.597564697265625, 0.6348114013671875, 0.67205810546875, 0.7093048095703125, 0.746551513671875, 0.7837982177734375, 0.821044921875, 0.8582916259765625, 0.895538330078125, 0.9327850341796875, 0.97003173828125, 1.0072784423828125, 1.044525146484375, 1.0817718505859375, 1.1190185546875, 1.1562652587890625, 1.193511962890625, 1.2307586669921875, 1.26800537109375, 1.3052520751953125, 1.342498779296875, 1.3797454833984375, 1.4169921875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 6.0, 6.0, 18.0, 17.0, 37.0, 60.0, 65.0, 79.0, 84.0, 111.0, 107.0, 110.0, 62.0, 68.0, 48.0, 47.0, 26.0, 17.0, 10.0, 11.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.965401649475098, -5.720076084136963, -5.474750518798828, -5.229424953460693, -4.984099388122559, -4.738774299621582, -4.493448257446289, -4.2481231689453125, -4.002797603607178, -3.757472038269043, -3.512146472930908, -3.2668209075927734, -3.0214955806732178, -2.776170015335083, -2.5308444499969482, -2.2855191230773926, -2.0401933193206787, -1.794867753982544, -1.5495423078536987, -1.304216742515564, -1.0588912963867188, -0.813565731048584, -0.5682401657104492, -0.322914719581604, -0.07758915424346924, 0.16773636639118195, 0.41306188702583313, 0.6583874225616455, 0.9037129282951355, 1.1490384340286255, 1.3943639993667603, 1.6396894454956055, 1.8850150108337402, 2.130340576171875, 2.3756661415100098, 2.6209917068481445, 2.8663170337677, 3.111642599105835, 3.3569681644439697, 3.6022934913635254, 3.84761905670166, 4.092944622039795, 4.33827018737793, 4.5835957527160645, 4.828921318054199, 5.074246406555176, 5.319572448730469, 5.564897537231445, 5.810223579406738, 6.055549144744873, 6.300874710083008, 6.546200275421143, 6.791525840759277, 7.036850929260254, 7.282176971435547, 7.527502059936523, 7.772827625274658, 8.018153190612793, 8.26347827911377, 8.508804321289062, 8.754129409790039, 8.999455451965332, 9.244780540466309, 9.490106582641602, 9.735431671142578]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 4.0, 9.0, 5.0, 11.0, 11.0, 14.0, 20.0, 29.0, 16.0, 19.0, 23.0, 24.0, 34.0, 31.0, 40.0, 30.0, 40.0, 38.0, 37.0, 48.0, 42.0, 32.0, 44.0, 36.0, 32.0, 26.0, 24.0, 38.0, 39.0, 28.0, 29.0, 29.0, 17.0, 17.0, 14.0, 10.0, 10.0, 9.0, 7.0, 1.0, 7.0, 1.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-6.395018100738525, -6.217862129211426, -6.040706634521484, -5.863550662994385, -5.686394691467285, -5.509239196777344, -5.332083225250244, -5.1549272537231445, -4.977771759033203, -4.8006157875061035, -4.623460292816162, -4.4463043212890625, -4.269148826599121, -4.0919928550720215, -3.914836883544922, -3.7376811504364014, -3.560525417327881, -3.3833696842193604, -3.20621395111084, -3.0290579795837402, -2.8519022464752197, -2.674746513366699, -2.4975905418395996, -2.320434808731079, -2.1432790756225586, -1.966123342514038, -1.788967490196228, -1.611811637878418, -1.4346559047698975, -1.257500171661377, -1.080344319343567, -0.9031884670257568, -0.7260322570800781, -0.5488764643669128, -0.37172067165374756, -0.19456487894058228, -0.017409086227416992, 0.1597467064857483, 0.3369024991989136, 0.5140583515167236, 0.6912140846252441, 0.8683698773384094, 1.0455256700515747, 1.2226815223693848, 1.3998372554779053, 1.5769929885864258, 1.7541488409042358, 1.931304693222046, 2.1084604263305664, 2.285616159439087, 2.4627718925476074, 2.639927864074707, 2.8170835971832275, 2.994239330291748, 3.1713953018188477, 3.348551034927368, 3.5257067680358887, 3.702862501144409, 3.8800182342529297, 4.057174205780029, 4.234330177307129, 4.41148567199707, 4.58864164352417, 4.7657976150512695, 4.942953109741211]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 4.0, 4.0, 7.0, 12.0, 13.0, 19.0, 42.0, 40.0, 62.0, 78.0, 148.0, 190.0, 378.0, 663.0, 1179.0, 2360.0, 4792.0, 10827.0, 25762.0, 67460.0, 198690.0, 688308.0, 2076133.0, 769288.0, 223409.0, 74652.0, 27884.0, 11476.0, 5002.0, 2456.0, 1222.0, 624.0, 421.0, 239.0, 152.0, 81.0, 66.0, 39.0, 39.0, 17.0, 13.0, 12.0, 5.0, 9.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.125, -1.091461181640625, -1.05792236328125, -1.024383544921875, -0.9908447265625, -0.957305908203125, -0.92376708984375, -0.890228271484375, -0.856689453125, -0.823150634765625, -0.78961181640625, -0.756072998046875, -0.7225341796875, -0.688995361328125, -0.65545654296875, -0.621917724609375, -0.58837890625, -0.554840087890625, -0.52130126953125, -0.487762451171875, -0.4542236328125, -0.420684814453125, -0.38714599609375, -0.353607177734375, -0.320068359375, -0.286529541015625, -0.25299072265625, -0.219451904296875, -0.1859130859375, -0.152374267578125, -0.11883544921875, -0.085296630859375, -0.0517578125, -0.018218994140625, 0.01531982421875, 0.048858642578125, 0.0823974609375, 0.115936279296875, 0.14947509765625, 0.183013916015625, 0.216552734375, 0.250091552734375, 0.28363037109375, 0.317169189453125, 0.3507080078125, 0.384246826171875, 0.41778564453125, 0.451324462890625, 0.48486328125, 0.518402099609375, 0.55194091796875, 0.585479736328125, 0.6190185546875, 0.652557373046875, 0.68609619140625, 0.719635009765625, 0.753173828125, 0.786712646484375, 0.82025146484375, 0.853790283203125, 0.8873291015625, 0.920867919921875, 0.95440673828125, 0.987945556640625, 1.021484375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 7.0, 6.0, 9.0, 14.0, 17.0, 16.0, 22.0, 14.0, 22.0, 23.0, 28.0, 30.0, 33.0, 30.0, 39.0, 50.0, 34.0, 43.0, 44.0, 49.0, 52.0, 57.0, 45.0, 25.0, 37.0, 27.0, 30.0, 26.0, 26.0, 22.0, 21.0, 18.0, 17.0, 12.0, 9.0, 7.0, 7.0, 5.0, 4.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.83544921875, -0.812042236328125, -0.78863525390625, -0.765228271484375, -0.7418212890625, -0.718414306640625, -0.69500732421875, -0.671600341796875, -0.648193359375, -0.624786376953125, -0.60137939453125, -0.577972412109375, -0.5545654296875, -0.531158447265625, -0.50775146484375, -0.484344482421875, -0.4609375, -0.437530517578125, -0.41412353515625, -0.390716552734375, -0.3673095703125, -0.343902587890625, -0.32049560546875, -0.297088623046875, -0.273681640625, -0.250274658203125, -0.22686767578125, -0.203460693359375, -0.1800537109375, -0.156646728515625, -0.13323974609375, -0.109832763671875, -0.08642578125, -0.063018798828125, -0.03961181640625, -0.016204833984375, 0.0072021484375, 0.030609130859375, 0.05401611328125, 0.077423095703125, 0.100830078125, 0.124237060546875, 0.14764404296875, 0.171051025390625, 0.1944580078125, 0.217864990234375, 0.24127197265625, 0.264678955078125, 0.2880859375, 0.311492919921875, 0.33489990234375, 0.358306884765625, 0.3817138671875, 0.405120849609375, 0.42852783203125, 0.451934814453125, 0.475341796875, 0.498748779296875, 0.52215576171875, 0.545562744140625, 0.5689697265625, 0.592376708984375, 0.61578369140625, 0.639190673828125, 0.66259765625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 13.0, 10.0, 14.0, 16.0, 25.0, 34.0, 37.0, 62.0, 87.0, 105.0, 153.0, 207.0, 273.0, 498.0, 758.0, 1265.0, 2223.0, 4032.0, 8368.0, 18044.0, 43115.0, 115751.0, 341609.0, 1115450.0, 1693881.0, 554893.0, 179525.0, 64290.0, 25662.0, 11309.0, 5299.0, 2860.0, 1575.0, 1021.0, 598.0, 369.0, 231.0, 183.0, 122.0, 95.0, 62.0, 38.0, 33.0, 30.0, 15.0, 11.0, 12.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.50390625, -1.455718994140625, -1.40753173828125, -1.359344482421875, -1.3111572265625, -1.262969970703125, -1.21478271484375, -1.166595458984375, -1.118408203125, -1.070220947265625, -1.02203369140625, -0.973846435546875, -0.9256591796875, -0.877471923828125, -0.82928466796875, -0.781097412109375, -0.73291015625, -0.684722900390625, -0.63653564453125, -0.588348388671875, -0.5401611328125, -0.491973876953125, -0.44378662109375, -0.395599365234375, -0.347412109375, -0.299224853515625, -0.25103759765625, -0.202850341796875, -0.1546630859375, -0.106475830078125, -0.05828857421875, -0.010101318359375, 0.0380859375, 0.086273193359375, 0.13446044921875, 0.182647705078125, 0.2308349609375, 0.279022216796875, 0.32720947265625, 0.375396728515625, 0.423583984375, 0.471771240234375, 0.51995849609375, 0.568145751953125, 0.6163330078125, 0.664520263671875, 0.71270751953125, 0.760894775390625, 0.80908203125, 0.857269287109375, 0.90545654296875, 0.953643798828125, 1.0018310546875, 1.050018310546875, 1.09820556640625, 1.146392822265625, 1.194580078125, 1.242767333984375, 1.29095458984375, 1.339141845703125, 1.3873291015625, 1.435516357421875, 1.48370361328125, 1.531890869140625, 1.580078125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 8.0, 11.0, 22.0, 32.0, 38.0, 63.0, 96.0, 141.0, 229.0, 357.0, 514.0, 739.0, 602.0, 445.0, 240.0, 163.0, 116.0, 73.0, 67.0, 43.0, 29.0, 13.0, 10.0, 7.0, 8.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.40625, -2.348724365234375, -2.29119873046875, -2.233673095703125, -2.1761474609375, -2.118621826171875, -2.06109619140625, -2.003570556640625, -1.946044921875, -1.888519287109375, -1.83099365234375, -1.773468017578125, -1.7159423828125, -1.658416748046875, -1.60089111328125, -1.543365478515625, -1.48583984375, -1.428314208984375, -1.37078857421875, -1.313262939453125, -1.2557373046875, -1.198211669921875, -1.14068603515625, -1.083160400390625, -1.025634765625, -0.968109130859375, -0.91058349609375, -0.853057861328125, -0.7955322265625, -0.738006591796875, -0.68048095703125, -0.622955322265625, -0.5654296875, -0.507904052734375, -0.45037841796875, -0.392852783203125, -0.3353271484375, -0.277801513671875, -0.22027587890625, -0.162750244140625, -0.105224609375, -0.047698974609375, 0.00982666015625, 0.067352294921875, 0.1248779296875, 0.182403564453125, 0.23992919921875, 0.297454833984375, 0.35498046875, 0.412506103515625, 0.47003173828125, 0.527557373046875, 0.5850830078125, 0.642608642578125, 0.70013427734375, 0.757659912109375, 0.815185546875, 0.872711181640625, 0.93023681640625, 0.987762451171875, 1.0452880859375, 1.102813720703125, 1.16033935546875, 1.217864990234375, 1.275390625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 9.0, 14.0, 20.0, 44.0, 62.0, 90.0, 117.0, 137.0, 119.0, 116.0, 102.0, 79.0, 41.0, 28.0, 14.0, 13.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.906071186065674, -3.575515031814575, -3.2449588775634766, -2.914402961730957, -2.5838468074798584, -2.2532906532287598, -1.9227346181869507, -1.5921785831451416, -1.261622428894043, -0.9310663342475891, -0.6005102396011353, -0.2699541449546814, 0.06060194969177246, 0.3911581039428711, 0.7217141389846802, 1.0522701740264893, 1.382826328277588, 1.7133824825286865, 2.043938636779785, 2.3744945526123047, 2.7050507068634033, 3.035606861114502, 3.3661627769470215, 3.69671893119812, 4.027275085449219, 4.357831001281738, 4.688387393951416, 5.0189433097839355, 5.349499702453613, 5.680055618286133, 6.010611534118652, 6.341167449951172, 6.671724319458008, 7.002280235290527, 7.332836627960205, 7.663392543792725, 7.993948936462402, 8.324504852294922, 8.655060768127441, 8.985616683959961, 9.316173553466797, 9.646729469299316, 9.977285385131836, 10.307842254638672, 10.638398170471191, 10.968954086303711, 11.29951000213623, 11.63006591796875, 11.96062183380127, 12.291177749633789, 12.621733665466309, 12.952290534973145, 13.282846450805664, 13.613402366638184, 13.943958282470703, 14.274514198303223, 14.605070114135742, 14.935626029968262, 15.266181945800781, 15.596738815307617, 15.927294731140137, 16.257850646972656, 16.588407516479492, 16.918962478637695, 17.24951934814453]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 9.0, 11.0, 9.0, 10.0, 16.0, 20.0, 23.0, 39.0, 36.0, 48.0, 44.0, 35.0, 48.0, 46.0, 35.0, 68.0, 54.0, 50.0, 52.0, 55.0, 54.0, 41.0, 37.0, 38.0, 32.0, 26.0, 17.0, 17.0, 13.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.272446632385254, -6.095283508300781, -5.918120384216309, -5.740957260131836, -5.563794136047363, -5.386631011962891, -5.209467887878418, -5.032304763793945, -4.855141639709473, -4.677978515625, -4.500815391540527, -4.323652267456055, -4.146489143371582, -3.9693260192871094, -3.7921626567840576, -3.614999532699585, -3.437836170196533, -3.2606730461120605, -3.083509922027588, -2.9063467979431152, -2.7291836738586426, -2.55202054977417, -2.374857187271118, -2.1976940631866455, -2.020530939102173, -1.8433678150177002, -1.6662046909332275, -1.4890414476394653, -1.3118783235549927, -1.13471519947052, -0.9575519561767578, -0.7803888320922852, -0.6032257080078125, -0.42606255412101746, -0.2488994002342224, -0.07173621654510498, 0.10542690753936768, 0.28259003162384033, 0.45975327491760254, 0.6369163990020752, 0.8140795230865479, 0.9912426471710205, 1.1684057712554932, 1.3455690145492554, 1.522732138633728, 1.6998952627182007, 1.877058506011963, 2.0542216300964355, 2.231384754180908, 2.408547878265381, 2.5857110023498535, 2.762874126434326, 2.940037250518799, 3.1172003746032715, 3.2943637371063232, 3.471526861190796, 3.6486899852752686, 3.825853109359741, 4.003016471862793, 4.180179595947266, 4.357342720031738, 4.534505844116211, 4.711668968200684, 4.888832092285156, 5.065995216369629]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 8.0, 12.0, 13.0, 28.0, 53.0, 70.0, 108.0, 165.0, 240.0, 378.0, 620.0, 853.0, 1407.0, 2110.0, 2978.0, 4575.0, 6588.0, 9924.0, 14362.0, 20907.0, 31729.0, 50976.0, 93053.0, 184802.0, 244715.0, 161901.0, 81446.0, 45420.0, 28870.0, 19270.0, 13246.0, 8804.0, 6298.0, 4225.0, 2772.0, 1930.0, 1243.0, 824.0, 582.0, 367.0, 269.0, 158.0, 95.0, 63.0, 41.0, 31.0, 15.0, 10.0, 3.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.8603515625, -0.8360443115234375, -0.811737060546875, -0.7874298095703125, -0.76312255859375, -0.7388153076171875, -0.714508056640625, -0.6902008056640625, -0.6658935546875, -0.6415863037109375, -0.617279052734375, -0.5929718017578125, -0.56866455078125, -0.5443572998046875, -0.520050048828125, -0.4957427978515625, -0.471435546875, -0.4471282958984375, -0.422821044921875, -0.3985137939453125, -0.37420654296875, -0.3498992919921875, -0.325592041015625, -0.3012847900390625, -0.2769775390625, -0.2526702880859375, -0.228363037109375, -0.2040557861328125, -0.17974853515625, -0.1554412841796875, -0.131134033203125, -0.1068267822265625, -0.08251953125, -0.0582122802734375, -0.033905029296875, -0.0095977783203125, 0.01470947265625, 0.0390167236328125, 0.063323974609375, 0.0876312255859375, 0.1119384765625, 0.1362457275390625, 0.160552978515625, 0.1848602294921875, 0.20916748046875, 0.2334747314453125, 0.257781982421875, 0.2820892333984375, 0.306396484375, 0.3307037353515625, 0.355010986328125, 0.3793182373046875, 0.40362548828125, 0.4279327392578125, 0.452239990234375, 0.4765472412109375, 0.5008544921875, 0.5251617431640625, 0.549468994140625, 0.5737762451171875, 0.59808349609375, 0.6223907470703125, 0.646697998046875, 0.6710052490234375, 0.6953125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 9.0, 7.0, 10.0, 10.0, 8.0, 17.0, 16.0, 25.0, 29.0, 23.0, 26.0, 25.0, 36.0, 24.0, 46.0, 52.0, 40.0, 55.0, 50.0, 48.0, 41.0, 51.0, 40.0, 33.0, 31.0, 25.0, 37.0, 33.0, 23.0, 24.0, 17.0, 18.0, 19.0, 12.0, 6.0, 7.0, 7.0, 5.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8740234375, -0.8477783203125, -0.821533203125, -0.7952880859375, -0.76904296875, -0.7427978515625, -0.716552734375, -0.6903076171875, -0.6640625, -0.6378173828125, -0.611572265625, -0.5853271484375, -0.55908203125, -0.5328369140625, -0.506591796875, -0.4803466796875, -0.4541015625, -0.4278564453125, -0.401611328125, -0.3753662109375, -0.34912109375, -0.3228759765625, -0.296630859375, -0.2703857421875, -0.244140625, -0.2178955078125, -0.191650390625, -0.1654052734375, -0.13916015625, -0.1129150390625, -0.086669921875, -0.0604248046875, -0.0341796875, -0.0079345703125, 0.018310546875, 0.0445556640625, 0.07080078125, 0.0970458984375, 0.123291015625, 0.1495361328125, 0.17578125, 0.2020263671875, 0.228271484375, 0.2545166015625, 0.28076171875, 0.3070068359375, 0.333251953125, 0.3594970703125, 0.3857421875, 0.4119873046875, 0.438232421875, 0.4644775390625, 0.49072265625, 0.5169677734375, 0.543212890625, 0.5694580078125, 0.595703125, 0.6219482421875, 0.648193359375, 0.6744384765625, 0.70068359375, 0.7269287109375, 0.753173828125, 0.7794189453125, 0.8056640625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 7.0, 3.0, 6.0, 5.0, 13.0, 14.0, 28.0, 33.0, 49.0, 69.0, 103.0, 171.0, 413.0, 1602.0, 9211.0, 49594.0, 437355.0, 483976.0, 53335.0, 10027.0, 1676.0, 390.0, 159.0, 108.0, 54.0, 50.0, 34.0, 20.0, 13.0, 15.0, 7.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.375, -4.2535400390625, -4.132080078125, -4.0106201171875, -3.88916015625, -3.7677001953125, -3.646240234375, -3.5247802734375, -3.4033203125, -3.2818603515625, -3.160400390625, -3.0389404296875, -2.91748046875, -2.7960205078125, -2.674560546875, -2.5531005859375, -2.431640625, -2.3101806640625, -2.188720703125, -2.0672607421875, -1.94580078125, -1.8243408203125, -1.702880859375, -1.5814208984375, -1.4599609375, -1.3385009765625, -1.217041015625, -1.0955810546875, -0.97412109375, -0.8526611328125, -0.731201171875, -0.6097412109375, -0.48828125, -0.3668212890625, -0.245361328125, -0.1239013671875, -0.00244140625, 0.1190185546875, 0.240478515625, 0.3619384765625, 0.4833984375, 0.6048583984375, 0.726318359375, 0.8477783203125, 0.96923828125, 1.0906982421875, 1.212158203125, 1.3336181640625, 1.455078125, 1.5765380859375, 1.697998046875, 1.8194580078125, 1.94091796875, 2.0623779296875, 2.183837890625, 2.3052978515625, 2.4267578125, 2.5482177734375, 2.669677734375, 2.7911376953125, 2.91259765625, 3.0340576171875, 3.155517578125, 3.2769775390625, 3.3984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 4.0, 5.0, 2.0, 9.0, 8.0, 15.0, 17.0, 35.0, 33.0, 25.0, 55.0, 48.0, 56.0, 59.0, 62.0, 70.0, 61.0, 57.0, 41.0, 52.0, 58.0, 39.0, 40.0, 29.0, 26.0, 24.0, 11.0, 9.0, 14.0, 8.0, 2.0, 5.0, 6.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.142578125, -3.0377197265625, -2.932861328125, -2.8280029296875, -2.72314453125, -2.6182861328125, -2.513427734375, -2.4085693359375, -2.3037109375, -2.1988525390625, -2.093994140625, -1.9891357421875, -1.88427734375, -1.7794189453125, -1.674560546875, -1.5697021484375, -1.46484375, -1.3599853515625, -1.255126953125, -1.1502685546875, -1.04541015625, -0.9405517578125, -0.835693359375, -0.7308349609375, -0.6259765625, -0.5211181640625, -0.416259765625, -0.3114013671875, -0.20654296875, -0.1016845703125, 0.003173828125, 0.1080322265625, 0.212890625, 0.3177490234375, 0.422607421875, 0.5274658203125, 0.63232421875, 0.7371826171875, 0.842041015625, 0.9468994140625, 1.0517578125, 1.1566162109375, 1.261474609375, 1.3663330078125, 1.47119140625, 1.5760498046875, 1.680908203125, 1.7857666015625, 1.890625, 1.9954833984375, 2.100341796875, 2.2052001953125, 2.31005859375, 2.4149169921875, 2.519775390625, 2.6246337890625, 2.7294921875, 2.8343505859375, 2.939208984375, 3.0440673828125, 3.14892578125, 3.2537841796875, 3.358642578125, 3.4635009765625, 3.568359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 9.0, 8.0, 12.0, 16.0, 25.0, 41.0, 100.0, 180.0, 322.0, 650.0, 1509.0, 3295.0, 7614.0, 17634.0, 43852.0, 166192.0, 598051.0, 139430.0, 40794.0, 16351.0, 6975.0, 2852.0, 1376.0, 613.0, 299.0, 150.0, 86.0, 44.0, 28.0, 20.0, 13.0, 4.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0732421875, -1.0326690673828125, -0.992095947265625, -0.9515228271484375, -0.91094970703125, -0.8703765869140625, -0.829803466796875, -0.7892303466796875, -0.7486572265625, -0.7080841064453125, -0.667510986328125, -0.6269378662109375, -0.58636474609375, -0.5457916259765625, -0.505218505859375, -0.4646453857421875, -0.424072265625, -0.3834991455078125, -0.342926025390625, -0.3023529052734375, -0.26177978515625, -0.2212066650390625, -0.180633544921875, -0.1400604248046875, -0.0994873046875, -0.0589141845703125, -0.018341064453125, 0.0222320556640625, 0.06280517578125, 0.1033782958984375, 0.143951416015625, 0.1845245361328125, 0.22509765625, 0.2656707763671875, 0.306243896484375, 0.3468170166015625, 0.38739013671875, 0.4279632568359375, 0.468536376953125, 0.5091094970703125, 0.5496826171875, 0.5902557373046875, 0.630828857421875, 0.6714019775390625, 0.71197509765625, 0.7525482177734375, 0.793121337890625, 0.8336944580078125, 0.874267578125, 0.9148406982421875, 0.955413818359375, 0.9959869384765625, 1.03656005859375, 1.0771331787109375, 1.117706298828125, 1.1582794189453125, 1.1988525390625, 1.2394256591796875, 1.279998779296875, 1.3205718994140625, 1.36114501953125, 1.4017181396484375, 1.442291259765625, 1.4828643798828125, 1.5234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 7.0, 3.0, 5.0, 4.0, 6.0, 10.0, 6.0, 6.0, 6.0, 8.0, 16.0, 22.0, 23.0, 34.0, 54.0, 81.0, 123.0, 152.0, 131.0, 77.0, 55.0, 31.0, 25.0, 15.0, 11.0, 13.0, 12.0, 7.0, 11.0, 10.0, 5.0, 1.0, 7.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013971328735351562, -0.00013494864106178284, -0.00013018399477005005, -0.00012541934847831726, -0.00012065470218658447, -0.00011589005589485168, -0.0001111254096031189, -0.00010636076331138611, -0.00010159611701965332, -9.683147072792053e-05, -9.206682443618774e-05, -8.730217814445496e-05, -8.253753185272217e-05, -7.777288556098938e-05, -7.300823926925659e-05, -6.82435929775238e-05, -6.347894668579102e-05, -5.871430039405823e-05, -5.394965410232544e-05, -4.918500781059265e-05, -4.442036151885986e-05, -3.9655715227127075e-05, -3.489106893539429e-05, -3.01264226436615e-05, -2.536177635192871e-05, -2.0597130060195923e-05, -1.5832483768463135e-05, -1.1067837476730347e-05, -6.303191184997559e-06, -1.5385448932647705e-06, 3.2261013984680176e-06, 7.990747690200806e-06, 1.2755393981933594e-05, 1.7520040273666382e-05, 2.228468656539917e-05, 2.7049332857131958e-05, 3.1813979148864746e-05, 3.6578625440597534e-05, 4.134327173233032e-05, 4.610791802406311e-05, 5.08725643157959e-05, 5.5637210607528687e-05, 6.0401856899261475e-05, 6.516650319099426e-05, 6.993114948272705e-05, 7.469579577445984e-05, 7.946044206619263e-05, 8.422508835792542e-05, 8.89897346496582e-05, 9.375438094139099e-05, 9.851902723312378e-05, 0.00010328367352485657, 0.00010804831981658936, 0.00011281296610832214, 0.00011757761240005493, 0.00012234225869178772, 0.0001271069049835205, 0.0001318715512752533, 0.00013663619756698608, 0.00014140084385871887, 0.00014616549015045166, 0.00015093013644218445, 0.00015569478273391724, 0.00016045942902565002, 0.0001652240753173828]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 10.0, 10.0, 11.0, 18.0, 17.0, 25.0, 45.0, 73.0, 127.0, 222.0, 371.0, 773.0, 1858.0, 4443.0, 11864.0, 30698.0, 93321.0, 487006.0, 312688.0, 65893.0, 23988.0, 8730.0, 3372.0, 1424.0, 666.0, 341.0, 191.0, 109.0, 86.0, 50.0, 37.0, 24.0, 22.0, 10.0, 12.0, 7.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.025299072265625, -0.98712158203125, -0.948944091796875, -0.9107666015625, -0.872589111328125, -0.83441162109375, -0.796234130859375, -0.758056640625, -0.719879150390625, -0.68170166015625, -0.643524169921875, -0.6053466796875, -0.567169189453125, -0.52899169921875, -0.490814208984375, -0.45263671875, -0.414459228515625, -0.37628173828125, -0.338104248046875, -0.2999267578125, -0.261749267578125, -0.22357177734375, -0.185394287109375, -0.147216796875, -0.109039306640625, -0.07086181640625, -0.032684326171875, 0.0054931640625, 0.043670654296875, 0.08184814453125, 0.120025634765625, 0.158203125, 0.196380615234375, 0.23455810546875, 0.272735595703125, 0.3109130859375, 0.349090576171875, 0.38726806640625, 0.425445556640625, 0.463623046875, 0.501800537109375, 0.53997802734375, 0.578155517578125, 0.6163330078125, 0.654510498046875, 0.69268798828125, 0.730865478515625, 0.76904296875, 0.807220458984375, 0.84539794921875, 0.883575439453125, 0.9217529296875, 0.959930419921875, 0.99810791015625, 1.036285400390625, 1.074462890625, 1.112640380859375, 1.15081787109375, 1.188995361328125, 1.2271728515625, 1.265350341796875, 1.30352783203125, 1.341705322265625, 1.3798828125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 8.0, 6.0, 15.0, 22.0, 31.0, 55.0, 63.0, 144.0, 199.0, 190.0, 100.0, 57.0, 27.0, 16.0, 10.0, 17.0, 9.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0], "bins": [-2.201171875, -2.1529998779296875, -2.104827880859375, -2.0566558837890625, -2.00848388671875, -1.9603118896484375, -1.912139892578125, -1.8639678955078125, -1.8157958984375, -1.7676239013671875, -1.719451904296875, -1.6712799072265625, -1.62310791015625, -1.5749359130859375, -1.526763916015625, -1.4785919189453125, -1.430419921875, -1.3822479248046875, -1.334075927734375, -1.2859039306640625, -1.23773193359375, -1.1895599365234375, -1.141387939453125, -1.0932159423828125, -1.0450439453125, -0.9968719482421875, -0.948699951171875, -0.9005279541015625, -0.85235595703125, -0.8041839599609375, -0.756011962890625, -0.7078399658203125, -0.65966796875, -0.6114959716796875, -0.563323974609375, -0.5151519775390625, -0.46697998046875, -0.4188079833984375, -0.370635986328125, -0.3224639892578125, -0.2742919921875, -0.2261199951171875, -0.177947998046875, -0.1297760009765625, -0.08160400390625, -0.0334320068359375, 0.014739990234375, 0.0629119873046875, 0.111083984375, 0.1592559814453125, 0.207427978515625, 0.2555999755859375, 0.30377197265625, 0.3519439697265625, 0.400115966796875, 0.4482879638671875, 0.4964599609375, 0.5446319580078125, 0.592803955078125, 0.6409759521484375, 0.68914794921875, 0.7373199462890625, 0.785491943359375, 0.8336639404296875, 0.8818359375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 15.0, 47.0, 50.0, 90.0, 108.0, 130.0, 143.0, 122.0, 99.0, 70.0, 49.0, 33.0, 17.0, 8.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.25293731689453, -16.902162551879883, -16.551387786865234, -16.200611114501953, -15.849837303161621, -15.499061584472656, -15.148286819458008, -14.79751205444336, -14.446737289428711, -14.095962524414062, -13.745186805725098, -13.39441204071045, -13.0436372756958, -12.692861557006836, -12.342086791992188, -11.991312026977539, -11.640536308288574, -11.289761543273926, -10.938985824584961, -10.588211059570312, -10.237436294555664, -9.886661529541016, -9.53588581085205, -9.185111045837402, -8.834335327148438, -8.483560562133789, -8.132784843444824, -7.782010078430176, -7.431235313415527, -7.080460071563721, -6.729684829711914, -6.378910064697266, -6.028134346008301, -5.677359104156494, -5.326584339141846, -4.975809097290039, -4.625034332275391, -4.274259090423584, -3.9234838485717773, -3.57270884513855, -3.2219338417053223, -2.8711588382720947, -2.520383834838867, -2.1696085929870605, -1.818833589553833, -1.4680585861206055, -1.1172833442687988, -0.7665083408355713, -0.41573333740234375, -0.06495827436447144, 0.2858167886734009, 0.636591911315918, 0.9873669147491455, 1.338141918182373, 1.6889171600341797, 2.0396921634674072, 2.3904671669006348, 2.7412421703338623, 3.09201717376709, 3.4427924156188965, 3.793567419052124, 4.144342422485352, 4.495117664337158, 4.845892906188965, 5.196667671203613]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 0.0, 2.0, 9.0, 7.0, 10.0, 5.0, 5.0, 8.0, 15.0, 16.0, 6.0, 24.0, 20.0, 21.0, 30.0, 25.0, 20.0, 27.0, 29.0, 33.0, 42.0, 29.0, 41.0, 41.0, 36.0, 44.0, 42.0, 47.0, 35.0, 34.0, 40.0, 32.0, 19.0, 27.0, 30.0, 19.0, 17.0, 20.0, 22.0, 16.0, 11.0, 13.0, 5.0, 8.0, 9.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8177313804626465, -6.612051963806152, -6.406372547149658, -6.200693130493164, -5.99501371383667, -5.789334297180176, -5.58365535736084, -5.3779754638671875, -5.172296524047852, -4.966617107391357, -4.760937690734863, -4.555258274078369, -4.349578857421875, -4.143899440765381, -3.938220262527466, -3.7325408458709717, -3.5268611907958984, -3.3211817741394043, -3.11550235748291, -2.909822940826416, -2.704143524169922, -2.4984641075134277, -2.2927849292755127, -2.0871055126190186, -1.8814260959625244, -1.6757466793060303, -1.4700672626495361, -1.2643879652023315, -1.0587085485458374, -0.8530291318893433, -0.6473498344421387, -0.44167041778564453, -0.2359914779663086, -0.03031209111213684, 0.1753672957420349, 0.3810466527938843, 0.5867260694503784, 0.7924054861068726, 0.9980847835540771, 1.2037642002105713, 1.4094436168670654, 1.6151230335235596, 1.8208024501800537, 2.0264816284179688, 2.232161045074463, 2.437840461730957, 2.643519878387451, 2.8491992950439453, 3.0548787117004395, 3.2605581283569336, 3.4662375450134277, 3.671916961669922, 3.877596378326416, 4.08327579498291, 4.288954734802246, 4.494634628295898, 4.700313568115234, 4.9059929847717285, 5.111672401428223, 5.317351818084717, 5.523031234741211, 5.728710651397705, 5.934390068054199, 6.140069007873535, 6.3457489013671875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 8.0, 11.0, 13.0, 9.0, 17.0, 30.0, 46.0, 56.0, 63.0, 112.0, 175.0, 243.0, 367.0, 610.0, 959.0, 1721.0, 3005.0, 5387.0, 10419.0, 21345.0, 45890.0, 104719.0, 264935.0, 810122.0, 1974973.0, 582749.0, 205775.0, 84750.0, 37867.0, 17728.0, 8987.0, 4778.0, 2509.0, 1506.0, 807.0, 528.0, 330.0, 198.0, 161.0, 110.0, 79.0, 47.0, 41.0, 22.0, 19.0, 16.0, 13.0, 8.0, 5.0, 3.0, 7.0, 1.0, 7.0], "bins": [-1.185546875, -1.1520309448242188, -1.1185150146484375, -1.0849990844726562, -1.051483154296875, -1.0179672241210938, -0.9844512939453125, -0.9509353637695312, -0.91741943359375, -0.8839035034179688, -0.8503875732421875, -0.8168716430664062, -0.783355712890625, -0.7498397827148438, -0.7163238525390625, -0.6828079223632812, -0.6492919921875, -0.6157760620117188, -0.5822601318359375, -0.5487442016601562, -0.515228271484375, -0.48171234130859375, -0.4481964111328125, -0.41468048095703125, -0.38116455078125, -0.34764862060546875, -0.3141326904296875, -0.28061676025390625, -0.247100830078125, -0.21358489990234375, -0.1800689697265625, -0.14655303955078125, -0.113037109375, -0.07952117919921875, -0.0460052490234375, -0.01248931884765625, 0.021026611328125, 0.05454254150390625, 0.0880584716796875, 0.12157440185546875, 0.15509033203125, 0.18860626220703125, 0.2221221923828125, 0.25563812255859375, 0.289154052734375, 0.32266998291015625, 0.3561859130859375, 0.38970184326171875, 0.4232177734375, 0.45673370361328125, 0.4902496337890625, 0.5237655639648438, 0.557281494140625, 0.5907974243164062, 0.6243133544921875, 0.6578292846679688, 0.69134521484375, 0.7248611450195312, 0.7583770751953125, 0.7918930053710938, 0.825408935546875, 0.8589248657226562, 0.8924407958984375, 0.9259567260742188, 0.95947265625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 7.0, 3.0, 5.0, 7.0, 5.0, 5.0, 9.0, 7.0, 12.0, 20.0, 28.0, 17.0, 24.0, 19.0, 18.0, 22.0, 34.0, 36.0, 24.0, 52.0, 31.0, 45.0, 41.0, 44.0, 40.0, 37.0, 29.0, 43.0, 38.0, 38.0, 34.0, 24.0, 22.0, 29.0, 26.0, 25.0, 16.0, 18.0, 13.0, 14.0, 11.0, 7.0, 9.0, 8.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7978515625, -0.7718048095703125, -0.745758056640625, -0.7197113037109375, -0.69366455078125, -0.6676177978515625, -0.641571044921875, -0.6155242919921875, -0.5894775390625, -0.5634307861328125, -0.537384033203125, -0.5113372802734375, -0.48529052734375, -0.4592437744140625, -0.433197021484375, -0.4071502685546875, -0.381103515625, -0.3550567626953125, -0.329010009765625, -0.3029632568359375, -0.27691650390625, -0.2508697509765625, -0.224822998046875, -0.1987762451171875, -0.1727294921875, -0.1466827392578125, -0.120635986328125, -0.0945892333984375, -0.06854248046875, -0.0424957275390625, -0.016448974609375, 0.0095977783203125, 0.03564453125, 0.0616912841796875, 0.087738037109375, 0.1137847900390625, 0.13983154296875, 0.1658782958984375, 0.191925048828125, 0.2179718017578125, 0.2440185546875, 0.2700653076171875, 0.296112060546875, 0.3221588134765625, 0.34820556640625, 0.3742523193359375, 0.400299072265625, 0.4263458251953125, 0.452392578125, 0.4784393310546875, 0.504486083984375, 0.5305328369140625, 0.55657958984375, 0.5826263427734375, 0.608673095703125, 0.6347198486328125, 0.6607666015625, 0.6868133544921875, 0.712860107421875, 0.7389068603515625, 0.76495361328125, 0.7910003662109375, 0.817047119140625, 0.8430938720703125, 0.869140625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 10.0, 19.0, 27.0, 29.0, 58.0, 71.0, 101.0, 178.0, 295.0, 525.0, 1024.0, 2234.0, 5255.0, 14852.0, 53542.0, 258373.0, 1939640.0, 1620926.0, 226115.0, 48037.0, 13672.0, 4927.0, 2160.0, 992.0, 506.0, 235.0, 150.0, 96.0, 76.0, 37.0, 26.0, 22.0, 19.0, 10.0, 12.0, 6.0, 7.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.841796875, -2.7469482421875, -2.652099609375, -2.5572509765625, -2.46240234375, -2.3675537109375, -2.272705078125, -2.1778564453125, -2.0830078125, -1.9881591796875, -1.893310546875, -1.7984619140625, -1.70361328125, -1.6087646484375, -1.513916015625, -1.4190673828125, -1.32421875, -1.2293701171875, -1.134521484375, -1.0396728515625, -0.94482421875, -0.8499755859375, -0.755126953125, -0.6602783203125, -0.5654296875, -0.4705810546875, -0.375732421875, -0.2808837890625, -0.18603515625, -0.0911865234375, 0.003662109375, 0.0985107421875, 0.193359375, 0.2882080078125, 0.383056640625, 0.4779052734375, 0.57275390625, 0.6676025390625, 0.762451171875, 0.8572998046875, 0.9521484375, 1.0469970703125, 1.141845703125, 1.2366943359375, 1.33154296875, 1.4263916015625, 1.521240234375, 1.6160888671875, 1.7109375, 1.8057861328125, 1.900634765625, 1.9954833984375, 2.09033203125, 2.1851806640625, 2.280029296875, 2.3748779296875, 2.4697265625, 2.5645751953125, 2.659423828125, 2.7542724609375, 2.84912109375, 2.9439697265625, 3.038818359375, 3.1336669921875, 3.228515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 9.0, 10.0, 26.0, 41.0, 86.0, 131.0, 214.0, 394.0, 812.0, 1060.0, 561.0, 305.0, 171.0, 95.0, 62.0, 29.0, 23.0, 12.0, 11.0, 6.0, 4.0, 8.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.857421875, -3.7684783935546875, -3.679534912109375, -3.5905914306640625, -3.50164794921875, -3.4127044677734375, -3.323760986328125, -3.2348175048828125, -3.1458740234375, -3.0569305419921875, -2.967987060546875, -2.8790435791015625, -2.79010009765625, -2.7011566162109375, -2.612213134765625, -2.5232696533203125, -2.434326171875, -2.3453826904296875, -2.256439208984375, -2.1674957275390625, -2.07855224609375, -1.9896087646484375, -1.900665283203125, -1.8117218017578125, -1.7227783203125, -1.6338348388671875, -1.544891357421875, -1.4559478759765625, -1.36700439453125, -1.2780609130859375, -1.189117431640625, -1.1001739501953125, -1.01123046875, -0.9222869873046875, -0.833343505859375, -0.7444000244140625, -0.65545654296875, -0.5665130615234375, -0.477569580078125, -0.3886260986328125, -0.2996826171875, -0.2107391357421875, -0.121795654296875, -0.0328521728515625, 0.05609130859375, 0.1450347900390625, 0.233978271484375, 0.3229217529296875, 0.411865234375, 0.5008087158203125, 0.589752197265625, 0.6786956787109375, 0.76763916015625, 0.8565826416015625, 0.945526123046875, 1.0344696044921875, 1.1234130859375, 1.2123565673828125, 1.301300048828125, 1.3902435302734375, 1.47918701171875, 1.5681304931640625, 1.657073974609375, 1.7460174560546875, 1.8349609375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 9.0, 6.0, 25.0, 56.0, 81.0, 166.0, 177.0, 171.0, 134.0, 83.0, 64.0, 19.0, 12.0, 3.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.150348663330078, -5.626521110534668, -5.1026930809021, -4.578865051269531, -4.055037498474121, -3.531209707260132, -3.0073819160461426, -2.4835541248321533, -1.959726333618164, -1.4358985424041748, -0.9120707511901855, -0.3882429599761963, 0.13558483123779297, 0.6594126224517822, 1.1832404136657715, 1.7070682048797607, 2.23089599609375, 2.7547237873077393, 3.2785515785217285, 3.8023793697357178, 4.326207160949707, 4.850034713745117, 5.3738627433776855, 5.897690773010254, 6.421518325805664, 6.945345878601074, 7.469173908233643, 7.993001937866211, 8.516829490661621, 9.040657043457031, 9.564485549926758, 10.088313102722168, 10.612140655517578, 11.135968208312988, 11.659795761108398, 12.183624267578125, 12.707451820373535, 13.231279373168945, 13.755107879638672, 14.278935432434082, 14.802762985229492, 15.326590538024902, 15.850418090820312, 16.37424659729004, 16.898075103759766, 17.42190170288086, 17.945730209350586, 18.46955680847168, 18.993385314941406, 19.517213821411133, 20.041040420532227, 20.564868927001953, 21.088695526123047, 21.612524032592773, 22.1363525390625, 22.660179138183594, 23.18400764465332, 23.707836151123047, 24.23166275024414, 24.755491256713867, 25.279319763183594, 25.803146362304688, 26.326974868774414, 26.850801467895508, 27.374629974365234]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 9.0, 2.0, 2.0, 10.0, 9.0, 10.0, 11.0, 13.0, 21.0, 27.0, 17.0, 28.0, 31.0, 29.0, 31.0, 26.0, 31.0, 47.0, 52.0, 51.0, 44.0, 38.0, 45.0, 39.0, 37.0, 29.0, 32.0, 32.0, 31.0, 32.0, 27.0, 26.0, 25.0, 20.0, 18.0, 22.0, 10.0, 5.0, 8.0, 8.0, 7.0, 4.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.409483432769775, -5.241763591766357, -5.0740437507629395, -4.90632438659668, -4.738604545593262, -4.570884704589844, -4.403164863586426, -4.235445022583008, -4.06772518157959, -3.900005340576172, -3.732285737991333, -3.564565896987915, -3.396846294403076, -3.229126453399658, -3.0614066123962402, -2.8936867713928223, -2.7259674072265625, -2.5582475662231445, -2.3905279636383057, -2.2228081226348877, -2.055088520050049, -1.8873686790466309, -1.719648838043213, -1.5519291162490845, -1.384209394454956, -1.2164896726608276, -1.0487699508666992, -0.8810501098632812, -0.7133303880691528, -0.5456106662750244, -0.37789082527160645, -0.21017110347747803, -0.04245138168334961, 0.1252683699131012, 0.292988121509552, 0.4607079029083252, 0.6284276247024536, 0.796147346496582, 0.9638671875, 1.1315869092941284, 1.2993066310882568, 1.4670263528823853, 1.6347460746765137, 1.8024659156799316, 1.97018563747406, 2.1379053592681885, 2.3056252002716064, 2.4733448028564453, 2.6410646438598633, 2.8087844848632812, 2.97650408744812, 3.144223928451538, 3.311943531036377, 3.479663372039795, 3.647383213043213, 3.815103054046631, 3.9828226566314697, 4.150542259216309, 4.318262100219727, 4.4859819412231445, 4.6537017822265625, 4.8214216232299805, 4.989141464233398, 5.156860828399658, 5.324580669403076]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 13.0, 11.0, 16.0, 44.0, 54.0, 95.0, 182.0, 290.0, 574.0, 989.0, 1739.0, 3210.0, 5587.0, 9669.0, 17455.0, 30570.0, 54326.0, 106869.0, 224570.0, 278024.0, 150919.0, 72431.0, 39346.0, 22321.0, 12697.0, 7171.0, 4095.0, 2266.0, 1292.0, 734.0, 418.0, 224.0, 135.0, 102.0, 43.0, 30.0, 22.0, 10.0, 7.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.982421875, -0.9488067626953125, -0.915191650390625, -0.8815765380859375, -0.84796142578125, -0.8143463134765625, -0.780731201171875, -0.7471160888671875, -0.7135009765625, -0.6798858642578125, -0.646270751953125, -0.6126556396484375, -0.57904052734375, -0.5454254150390625, -0.511810302734375, -0.4781951904296875, -0.444580078125, -0.4109649658203125, -0.377349853515625, -0.3437347412109375, -0.31011962890625, -0.2765045166015625, -0.242889404296875, -0.2092742919921875, -0.1756591796875, -0.1420440673828125, -0.108428955078125, -0.0748138427734375, -0.04119873046875, -0.0075836181640625, 0.026031494140625, 0.0596466064453125, 0.09326171875, 0.1268768310546875, 0.160491943359375, 0.1941070556640625, 0.22772216796875, 0.2613372802734375, 0.294952392578125, 0.3285675048828125, 0.3621826171875, 0.3957977294921875, 0.429412841796875, 0.4630279541015625, 0.49664306640625, 0.5302581787109375, 0.563873291015625, 0.5974884033203125, 0.631103515625, 0.6647186279296875, 0.698333740234375, 0.7319488525390625, 0.76556396484375, 0.7991790771484375, 0.832794189453125, 0.8664093017578125, 0.9000244140625, 0.9336395263671875, 0.967254638671875, 1.0008697509765625, 1.03448486328125, 1.0680999755859375, 1.101715087890625, 1.1353302001953125, 1.1689453125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 6.0, 4.0, 4.0, 7.0, 6.0, 3.0, 11.0, 12.0, 17.0, 19.0, 9.0, 13.0, 21.0, 27.0, 28.0, 26.0, 29.0, 50.0, 45.0, 37.0, 30.0, 41.0, 33.0, 33.0, 34.0, 43.0, 44.0, 47.0, 44.0, 34.0, 28.0, 32.0, 31.0, 11.0, 21.0, 15.0, 11.0, 16.0, 11.0, 12.0, 14.0, 11.0, 8.0, 6.0, 9.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.892578125, -0.8651199340820312, -0.8376617431640625, -0.8102035522460938, -0.782745361328125, -0.7552871704101562, -0.7278289794921875, -0.7003707885742188, -0.67291259765625, -0.6454544067382812, -0.6179962158203125, -0.5905380249023438, -0.563079833984375, -0.5356216430664062, -0.5081634521484375, -0.48070526123046875, -0.4532470703125, -0.42578887939453125, -0.3983306884765625, -0.37087249755859375, -0.343414306640625, -0.31595611572265625, -0.2884979248046875, -0.26103973388671875, -0.23358154296875, -0.20612335205078125, -0.1786651611328125, -0.15120697021484375, -0.123748779296875, -0.09629058837890625, -0.0688323974609375, -0.04137420654296875, -0.013916015625, 0.01354217529296875, 0.0410003662109375, 0.06845855712890625, 0.095916748046875, 0.12337493896484375, 0.1508331298828125, 0.17829132080078125, 0.20574951171875, 0.23320770263671875, 0.2606658935546875, 0.28812408447265625, 0.315582275390625, 0.34304046630859375, 0.3704986572265625, 0.39795684814453125, 0.4254150390625, 0.45287322998046875, 0.4803314208984375, 0.5077896118164062, 0.535247802734375, 0.5627059936523438, 0.5901641845703125, 0.6176223754882812, 0.64508056640625, 0.6725387573242188, 0.6999969482421875, 0.7274551391601562, 0.754913330078125, 0.7823715209960938, 0.8098297119140625, 0.8372879028320312, 0.86474609375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 2.0, 1.0, 4.0, 3.0, 8.0, 11.0, 7.0, 14.0, 14.0, 17.0, 20.0, 23.0, 25.0, 29.0, 34.0, 43.0, 82.0, 141.0, 364.0, 1328.0, 6189.0, 35253.0, 250720.0, 637767.0, 96711.0, 15558.0, 2866.0, 706.0, 228.0, 117.0, 63.0, 41.0, 30.0, 24.0, 25.0, 16.0, 17.0, 10.0, 13.0, 9.0, 6.0, 2.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.96875, -3.856231689453125, -3.74371337890625, -3.631195068359375, -3.5186767578125, -3.406158447265625, -3.29364013671875, -3.181121826171875, -3.068603515625, -2.956085205078125, -2.84356689453125, -2.731048583984375, -2.6185302734375, -2.506011962890625, -2.39349365234375, -2.280975341796875, -2.16845703125, -2.055938720703125, -1.94342041015625, -1.830902099609375, -1.7183837890625, -1.605865478515625, -1.49334716796875, -1.380828857421875, -1.268310546875, -1.155792236328125, -1.04327392578125, -0.930755615234375, -0.8182373046875, -0.705718994140625, -0.59320068359375, -0.480682373046875, -0.3681640625, -0.255645751953125, -0.14312744140625, -0.030609130859375, 0.0819091796875, 0.194427490234375, 0.30694580078125, 0.419464111328125, 0.531982421875, 0.644500732421875, 0.75701904296875, 0.869537353515625, 0.9820556640625, 1.094573974609375, 1.20709228515625, 1.319610595703125, 1.43212890625, 1.544647216796875, 1.65716552734375, 1.769683837890625, 1.8822021484375, 1.994720458984375, 2.10723876953125, 2.219757080078125, 2.332275390625, 2.444793701171875, 2.55731201171875, 2.669830322265625, 2.7823486328125, 2.894866943359375, 3.00738525390625, 3.119903564453125, 3.232421875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 5.0, 12.0, 12.0, 17.0, 12.0, 14.0, 15.0, 18.0, 27.0, 29.0, 31.0, 33.0, 45.0, 45.0, 45.0, 41.0, 37.0, 39.0, 40.0, 53.0, 43.0, 45.0, 48.0, 25.0, 34.0, 30.0, 26.0, 31.0, 28.0, 15.0, 14.0, 20.0, 14.0, 14.0, 11.0, 7.0, 8.0, 3.0, 3.0, 3.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.06640625, -2.973236083984375, -2.88006591796875, -2.786895751953125, -2.6937255859375, -2.600555419921875, -2.50738525390625, -2.414215087890625, -2.321044921875, -2.227874755859375, -2.13470458984375, -2.041534423828125, -1.9483642578125, -1.855194091796875, -1.76202392578125, -1.668853759765625, -1.57568359375, -1.482513427734375, -1.38934326171875, -1.296173095703125, -1.2030029296875, -1.109832763671875, -1.01666259765625, -0.923492431640625, -0.830322265625, -0.737152099609375, -0.64398193359375, -0.550811767578125, -0.4576416015625, -0.364471435546875, -0.27130126953125, -0.178131103515625, -0.0849609375, 0.008209228515625, 0.10137939453125, 0.194549560546875, 0.2877197265625, 0.380889892578125, 0.47406005859375, 0.567230224609375, 0.660400390625, 0.753570556640625, 0.84674072265625, 0.939910888671875, 1.0330810546875, 1.126251220703125, 1.21942138671875, 1.312591552734375, 1.40576171875, 1.498931884765625, 1.59210205078125, 1.685272216796875, 1.7784423828125, 1.871612548828125, 1.96478271484375, 2.057952880859375, 2.151123046875, 2.244293212890625, 2.33746337890625, 2.430633544921875, 2.5238037109375, 2.616973876953125, 2.71014404296875, 2.803314208984375, 2.896484375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 7.0, 14.0, 20.0, 34.0, 44.0, 88.0, 176.0, 322.0, 530.0, 1113.0, 2369.0, 5348.0, 12938.0, 31692.0, 80580.0, 252195.0, 416658.0, 152529.0, 54095.0, 21678.0, 8836.0, 3715.0, 1665.0, 893.0, 462.0, 225.0, 143.0, 74.0, 39.0, 26.0, 21.0, 6.0, 9.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74267578125, -0.7133102416992188, -0.6839447021484375, -0.6545791625976562, -0.625213623046875, -0.5958480834960938, -0.5664825439453125, -0.5371170043945312, -0.50775146484375, -0.47838592529296875, -0.4490203857421875, -0.41965484619140625, -0.390289306640625, -0.36092376708984375, -0.3315582275390625, -0.30219268798828125, -0.2728271484375, -0.24346160888671875, -0.2140960693359375, -0.18473052978515625, -0.155364990234375, -0.12599945068359375, -0.0966339111328125, -0.06726837158203125, -0.03790283203125, -0.00853729248046875, 0.0208282470703125, 0.05019378662109375, 0.079559326171875, 0.10892486572265625, 0.1382904052734375, 0.16765594482421875, 0.197021484375, 0.22638702392578125, 0.2557525634765625, 0.28511810302734375, 0.314483642578125, 0.34384918212890625, 0.3732147216796875, 0.40258026123046875, 0.43194580078125, 0.46131134033203125, 0.4906768798828125, 0.5200424194335938, 0.549407958984375, 0.5787734985351562, 0.6081390380859375, 0.6375045776367188, 0.6668701171875, 0.6962356567382812, 0.7256011962890625, 0.7549667358398438, 0.784332275390625, 0.8136978149414062, 0.8430633544921875, 0.8724288940429688, 0.90179443359375, 0.9311599731445312, 0.9605255126953125, 0.9898910522460938, 1.019256591796875, 1.0486221313476562, 1.0779876708984375, 1.1073532104492188, 1.13671875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 6.0, 3.0, 5.0, 6.0, 10.0, 5.0, 16.0, 13.0, 16.0, 23.0, 27.0, 37.0, 37.0, 59.0, 83.0, 90.0, 119.0, 96.0, 81.0, 57.0, 46.0, 33.0, 22.0, 23.0, 18.0, 13.0, 8.0, 12.0, 14.0, 6.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00017058849334716797, -0.00016604457050561905, -0.00016150064766407013, -0.0001569567248225212, -0.0001524128019809723, -0.00014786887913942337, -0.00014332495629787445, -0.00013878103345632553, -0.0001342371106147766, -0.0001296931877732277, -0.00012514926493167877, -0.00012060534209012985, -0.00011606141924858093, -0.00011151749640703201, -0.0001069735735654831, -0.00010242965072393417, -9.788572788238525e-05, -9.334180504083633e-05, -8.879788219928741e-05, -8.42539593577385e-05, -7.971003651618958e-05, -7.516611367464066e-05, -7.062219083309174e-05, -6.607826799154282e-05, -6.15343451499939e-05, -5.699042230844498e-05, -5.244649946689606e-05, -4.790257662534714e-05, -4.335865378379822e-05, -3.88147309422493e-05, -3.427080810070038e-05, -2.972688525915146e-05, -2.518296241760254e-05, -2.063903957605362e-05, -1.60951167345047e-05, -1.155119389295578e-05, -7.00727105140686e-06, -2.4633482098579407e-06, 2.080574631690979e-06, 6.624497473239899e-06, 1.1168420314788818e-05, 1.5712343156337738e-05, 2.0256265997886658e-05, 2.4800188839435577e-05, 2.9344111680984497e-05, 3.388803452253342e-05, 3.8431957364082336e-05, 4.2975880205631256e-05, 4.7519803047180176e-05, 5.2063725888729095e-05, 5.6607648730278015e-05, 6.115157157182693e-05, 6.569549441337585e-05, 7.023941725492477e-05, 7.47833400964737e-05, 7.932726293802261e-05, 8.387118577957153e-05, 8.841510862112045e-05, 9.295903146266937e-05, 9.750295430421829e-05, 0.00010204687714576721, 0.00010659079998731613, 0.00011113472282886505, 0.00011567864567041397, 0.00012022256851196289]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 10.0, 5.0, 11.0, 13.0, 14.0, 17.0, 14.0, 25.0, 37.0, 43.0, 68.0, 106.0, 193.0, 357.0, 747.0, 2052.0, 6434.0, 23431.0, 90937.0, 411455.0, 393599.0, 86623.0, 22638.0, 6202.0, 1895.0, 756.0, 318.0, 173.0, 122.0, 69.0, 52.0, 31.0, 25.0, 29.0, 16.0, 12.0, 3.0, 7.0, 12.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.23828125, -1.195556640625, -1.15283203125, -1.110107421875, -1.0673828125, -1.024658203125, -0.98193359375, -0.939208984375, -0.896484375, -0.853759765625, -0.81103515625, -0.768310546875, -0.7255859375, -0.682861328125, -0.64013671875, -0.597412109375, -0.5546875, -0.511962890625, -0.46923828125, -0.426513671875, -0.3837890625, -0.341064453125, -0.29833984375, -0.255615234375, -0.212890625, -0.170166015625, -0.12744140625, -0.084716796875, -0.0419921875, 0.000732421875, 0.04345703125, 0.086181640625, 0.12890625, 0.171630859375, 0.21435546875, 0.257080078125, 0.2998046875, 0.342529296875, 0.38525390625, 0.427978515625, 0.470703125, 0.513427734375, 0.55615234375, 0.598876953125, 0.6416015625, 0.684326171875, 0.72705078125, 0.769775390625, 0.8125, 0.855224609375, 0.89794921875, 0.940673828125, 0.9833984375, 1.026123046875, 1.06884765625, 1.111572265625, 1.154296875, 1.197021484375, 1.23974609375, 1.282470703125, 1.3251953125, 1.367919921875, 1.41064453125, 1.453369140625, 1.49609375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 8.0, 9.0, 10.0, 16.0, 14.0, 20.0, 30.0, 23.0, 37.0, 58.0, 75.0, 82.0, 93.0, 112.0, 90.0, 63.0, 55.0, 35.0, 30.0, 30.0, 25.0, 21.0, 21.0, 16.0, 7.0, 5.0, 5.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.892578125, -0.8648834228515625, -0.837188720703125, -0.8094940185546875, -0.78179931640625, -0.7541046142578125, -0.726409912109375, -0.6987152099609375, -0.6710205078125, -0.6433258056640625, -0.615631103515625, -0.5879364013671875, -0.56024169921875, -0.5325469970703125, -0.504852294921875, -0.4771575927734375, -0.449462890625, -0.4217681884765625, -0.394073486328125, -0.3663787841796875, -0.33868408203125, -0.3109893798828125, -0.283294677734375, -0.2555999755859375, -0.2279052734375, -0.2002105712890625, -0.172515869140625, -0.1448211669921875, -0.11712646484375, -0.0894317626953125, -0.061737060546875, -0.0340423583984375, -0.00634765625, 0.0213470458984375, 0.049041748046875, 0.0767364501953125, 0.10443115234375, 0.1321258544921875, 0.159820556640625, 0.1875152587890625, 0.2152099609375, 0.2429046630859375, 0.270599365234375, 0.2982940673828125, 0.32598876953125, 0.3536834716796875, 0.381378173828125, 0.4090728759765625, 0.436767578125, 0.4644622802734375, 0.492156982421875, 0.5198516845703125, 0.54754638671875, 0.5752410888671875, 0.602935791015625, 0.6306304931640625, 0.6583251953125, 0.6860198974609375, 0.713714599609375, 0.7414093017578125, 0.76910400390625, 0.7967987060546875, 0.824493408203125, 0.8521881103515625, 0.8798828125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 7.0, 25.0, 60.0, 173.0, 287.0, 253.0, 141.0, 51.0, 13.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.589248180389404, -6.825368404388428, -6.061488628387451, -5.297608375549316, -4.53372859954834, -3.7698490619659424, -3.0059690475463867, -2.24208927154541, -1.4782094955444336, -0.7143296599388123, 0.04955017566680908, 0.8134300708770752, 1.5773098468780518, 2.3411896228790283, 3.105069637298584, 3.8689494132995605, 4.632829189300537, 5.396708965301514, 6.16058874130249, 6.924468994140625, 7.688348770141602, 8.452228546142578, 9.216108322143555, 9.979988098144531, 10.743867874145508, 11.507747650146484, 12.271627426147461, 13.035507202148438, 13.799386978149414, 14.56326675415039, 15.327146530151367, 16.091026306152344, 16.85490608215332, 17.618785858154297, 18.382665634155273, 19.14654541015625, 19.910425186157227, 20.674304962158203, 21.43818473815918, 22.202064514160156, 22.965944290161133, 23.72982406616211, 24.493703842163086, 25.257583618164062, 26.02146339416504, 26.785343170166016, 27.549222946166992, 28.31310272216797, 29.076984405517578, 29.840864181518555, 30.60474395751953, 31.368623733520508, 32.132503509521484, 32.896385192871094, 33.66026306152344, 34.42414474487305, 35.18802261352539, 35.951904296875, 36.715782165527344, 37.47966384887695, 38.2435417175293, 39.007423400878906, 39.77130126953125, 40.53518295288086, 41.2990608215332]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 10.0, 11.0, 13.0, 11.0, 18.0, 16.0, 18.0, 20.0, 28.0, 26.0, 24.0, 18.0, 41.0, 45.0, 56.0, 45.0, 43.0, 41.0, 53.0, 43.0, 50.0, 40.0, 48.0, 42.0, 23.0, 37.0, 25.0, 35.0, 24.0, 16.0, 11.0, 9.0, 12.0, 14.0, 15.0, 2.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.313058853149414, -8.069992065429688, -7.826924800872803, -7.583857536315918, -7.340790748596191, -7.097723484039307, -6.854656219482422, -6.611589431762695, -6.368522644042969, -6.125455379486084, -5.882388591766357, -5.639321327209473, -5.396254539489746, -5.153187274932861, -4.910120010375977, -4.66705322265625, -4.423985958099365, -4.1809186935424805, -3.937851905822754, -3.694784641265869, -3.4517178535461426, -3.208650588989258, -2.965583562850952, -2.7225165367126465, -2.479449510574341, -2.236382484436035, -1.9933154582977295, -1.7502483129501343, -1.5071812868118286, -1.264114260673523, -1.0210471153259277, -0.7779800891876221, -0.5349125862121582, -0.29184553027153015, -0.0487784743309021, 0.19428861141204834, 0.437355637550354, 0.6804226636886597, 0.9234898090362549, 1.1665568351745605, 1.4096238613128662, 1.6526908874511719, 1.8957579135894775, 2.138824939727783, 2.381892204284668, 2.6249589920043945, 2.8680262565612793, 3.111093282699585, 3.3541603088378906, 3.5972273349761963, 3.840294361114502, 4.083361625671387, 4.326428413391113, 4.569495677947998, 4.812562942504883, 5.055629730224609, 5.298696517944336, 5.541763782501221, 5.784830570220947, 6.027897834777832, 6.270964622497559, 6.514031887054443, 6.757099151611328, 7.000165939331055, 7.2432332038879395]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 0.0, 7.0, 3.0, 8.0, 10.0, 18.0, 30.0, 38.0, 41.0, 67.0, 76.0, 138.0, 217.0, 289.0, 473.0, 670.0, 999.0, 1550.0, 2479.0, 3997.0, 6678.0, 11599.0, 21448.0, 41078.0, 85952.0, 198569.0, 530699.0, 1626626.0, 1043730.0, 342995.0, 138143.0, 63089.0, 31611.0, 16617.0, 9416.0, 5459.0, 3348.0, 2155.0, 1271.0, 859.0, 594.0, 385.0, 257.0, 167.0, 126.0, 90.0, 62.0, 42.0, 43.0, 16.0, 23.0, 15.0, 8.0, 4.0, 5.0, 0.0, 2.0, 4.0, 0.0, 2.0], "bins": [-1.1181640625, -1.0829925537109375, -1.047821044921875, -1.0126495361328125, -0.97747802734375, -0.9423065185546875, -0.907135009765625, -0.8719635009765625, -0.8367919921875, -0.8016204833984375, -0.766448974609375, -0.7312774658203125, -0.69610595703125, -0.6609344482421875, -0.625762939453125, -0.5905914306640625, -0.555419921875, -0.5202484130859375, -0.485076904296875, -0.4499053955078125, -0.41473388671875, -0.3795623779296875, -0.344390869140625, -0.3092193603515625, -0.2740478515625, -0.2388763427734375, -0.203704833984375, -0.1685333251953125, -0.13336181640625, -0.0981903076171875, -0.063018798828125, -0.0278472900390625, 0.00732421875, 0.0424957275390625, 0.077667236328125, 0.1128387451171875, 0.14801025390625, 0.1831817626953125, 0.218353271484375, 0.2535247802734375, 0.2886962890625, 0.3238677978515625, 0.359039306640625, 0.3942108154296875, 0.42938232421875, 0.4645538330078125, 0.499725341796875, 0.5348968505859375, 0.570068359375, 0.6052398681640625, 0.640411376953125, 0.6755828857421875, 0.71075439453125, 0.7459259033203125, 0.781097412109375, 0.8162689208984375, 0.8514404296875, 0.8866119384765625, 0.921783447265625, 0.9569549560546875, 0.99212646484375, 1.0272979736328125, 1.062469482421875, 1.0976409912109375, 1.1328125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 2.0, 7.0, 4.0, 6.0, 6.0, 12.0, 14.0, 12.0, 18.0, 25.0, 20.0, 20.0, 32.0, 25.0, 37.0, 19.0, 36.0, 40.0, 34.0, 58.0, 47.0, 40.0, 50.0, 45.0, 38.0, 43.0, 39.0, 39.0, 28.0, 34.0, 27.0, 22.0, 26.0, 12.0, 10.0, 12.0, 11.0, 15.0, 9.0, 6.0, 7.0, 1.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80859375, -0.77886962890625, -0.7491455078125, -0.71942138671875, -0.689697265625, -0.65997314453125, -0.6302490234375, -0.60052490234375, -0.57080078125, -0.54107666015625, -0.5113525390625, -0.48162841796875, -0.451904296875, -0.42218017578125, -0.3924560546875, -0.36273193359375, -0.3330078125, -0.30328369140625, -0.2735595703125, -0.24383544921875, -0.214111328125, -0.18438720703125, -0.1546630859375, -0.12493896484375, -0.09521484375, -0.06549072265625, -0.0357666015625, -0.00604248046875, 0.023681640625, 0.05340576171875, 0.0831298828125, 0.11285400390625, 0.142578125, 0.17230224609375, 0.2020263671875, 0.23175048828125, 0.261474609375, 0.29119873046875, 0.3209228515625, 0.35064697265625, 0.38037109375, 0.41009521484375, 0.4398193359375, 0.46954345703125, 0.499267578125, 0.52899169921875, 0.5587158203125, 0.58843994140625, 0.6181640625, 0.64788818359375, 0.6776123046875, 0.70733642578125, 0.737060546875, 0.76678466796875, 0.7965087890625, 0.82623291015625, 0.85595703125, 0.88568115234375, 0.9154052734375, 0.94512939453125, 0.974853515625, 1.00457763671875, 1.0343017578125, 1.06402587890625, 1.09375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 6.0, 5.0, 7.0, 9.0, 8.0, 12.0, 12.0, 18.0, 25.0, 29.0, 57.0, 44.0, 98.0, 203.0, 422.0, 864.0, 2037.0, 5423.0, 16801.0, 65041.0, 352684.0, 2663890.0, 911675.0, 131129.0, 29575.0, 8699.0, 3091.0, 1161.0, 544.0, 287.0, 145.0, 92.0, 34.0, 39.0, 34.0, 20.0, 13.0, 13.0, 8.0, 8.0, 4.0, 12.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-3.8046875, -3.69818115234375, -3.5916748046875, -3.48516845703125, -3.378662109375, -3.27215576171875, -3.1656494140625, -3.05914306640625, -2.95263671875, -2.84613037109375, -2.7396240234375, -2.63311767578125, -2.526611328125, -2.42010498046875, -2.3135986328125, -2.20709228515625, -2.1005859375, -1.99407958984375, -1.8875732421875, -1.78106689453125, -1.674560546875, -1.56805419921875, -1.4615478515625, -1.35504150390625, -1.24853515625, -1.14202880859375, -1.0355224609375, -0.92901611328125, -0.822509765625, -0.71600341796875, -0.6094970703125, -0.50299072265625, -0.396484375, -0.28997802734375, -0.1834716796875, -0.07696533203125, 0.029541015625, 0.13604736328125, 0.2425537109375, 0.34906005859375, 0.45556640625, 0.56207275390625, 0.6685791015625, 0.77508544921875, 0.881591796875, 0.98809814453125, 1.0946044921875, 1.20111083984375, 1.3076171875, 1.41412353515625, 1.5206298828125, 1.62713623046875, 1.733642578125, 1.84014892578125, 1.9466552734375, 2.05316162109375, 2.15966796875, 2.26617431640625, 2.3726806640625, 2.47918701171875, 2.585693359375, 2.69219970703125, 2.7987060546875, 2.90521240234375, 3.01171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 7.0, 5.0, 15.0, 17.0, 49.0, 74.0, 104.0, 189.0, 404.0, 891.0, 1137.0, 581.0, 259.0, 135.0, 89.0, 43.0, 31.0, 20.0, 10.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.265625, -5.140869140625, -5.01611328125, -4.891357421875, -4.7666015625, -4.641845703125, -4.51708984375, -4.392333984375, -4.267578125, -4.142822265625, -4.01806640625, -3.893310546875, -3.7685546875, -3.643798828125, -3.51904296875, -3.394287109375, -3.26953125, -3.144775390625, -3.02001953125, -2.895263671875, -2.7705078125, -2.645751953125, -2.52099609375, -2.396240234375, -2.271484375, -2.146728515625, -2.02197265625, -1.897216796875, -1.7724609375, -1.647705078125, -1.52294921875, -1.398193359375, -1.2734375, -1.148681640625, -1.02392578125, -0.899169921875, -0.7744140625, -0.649658203125, -0.52490234375, -0.400146484375, -0.275390625, -0.150634765625, -0.02587890625, 0.098876953125, 0.2236328125, 0.348388671875, 0.47314453125, 0.597900390625, 0.72265625, 0.847412109375, 0.97216796875, 1.096923828125, 1.2216796875, 1.346435546875, 1.47119140625, 1.595947265625, 1.720703125, 1.845458984375, 1.97021484375, 2.094970703125, 2.2197265625, 2.344482421875, 2.46923828125, 2.593994140625, 2.71875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 4.0, 5.0, 11.0, 11.0, 23.0, 27.0, 69.0, 69.0, 93.0, 99.0, 115.0, 122.0, 111.0, 99.0, 53.0, 41.0, 25.0, 20.0, 11.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.118927955627441, -5.69596529006958, -5.273002624511719, -4.850040435791016, -4.427077293395996, -4.004115104675293, -3.5811524391174316, -3.1581897735595703, -2.735227108001709, -2.3122644424438477, -1.8893018960952759, -1.466339349746704, -1.0433766841888428, -0.6204140186309814, -0.19745159149169922, 0.2255110740661621, 0.6484737396240234, 1.0714364051818848, 1.4943989515304565, 1.9173614978790283, 2.3403241634368896, 2.763286828994751, 3.186249256134033, 3.6092119216918945, 4.032174587249756, 4.455137252807617, 4.8780999183654785, 5.30106258392334, 5.724024772644043, 6.1469879150390625, 6.569950103759766, 6.992912769317627, 7.415874481201172, 7.838837146759033, 8.261799812316895, 8.684762001037598, 9.107725143432617, 9.53068733215332, 9.953649520874023, 10.376612663269043, 10.799575805664062, 11.222537994384766, 11.645501136779785, 12.068463325500488, 12.491426467895508, 12.914388656616211, 13.337350845336914, 13.760313987731934, 14.183276176452637, 14.60623836517334, 15.02920150756836, 15.452163696289062, 15.875126838684082, 16.2980899810791, 16.721052169799805, 17.144014358520508, 17.56697654724121, 17.989938735961914, 18.412900924682617, 18.835865020751953, 19.258827209472656, 19.68178939819336, 20.104751586914062, 20.527713775634766, 20.9506778717041]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 11.0, 6.0, 8.0, 16.0, 12.0, 22.0, 25.0, 27.0, 34.0, 41.0, 28.0, 46.0, 36.0, 57.0, 40.0, 50.0, 41.0, 42.0, 43.0, 49.0, 51.0, 32.0, 37.0, 36.0, 33.0, 27.0, 40.0, 22.0, 10.0, 16.0, 13.0, 7.0, 15.0, 5.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.546659469604492, -7.3150715827941895, -7.0834832191467285, -6.851895332336426, -6.620306968688965, -6.388719081878662, -6.157131195068359, -5.925542831420898, -5.6939544677734375, -5.462366580963135, -5.230778217315674, -4.999190330505371, -4.76760196685791, -4.536014080047607, -4.304426193237305, -4.072837829589844, -3.841249942779541, -3.609661817550659, -3.3780736923217773, -3.1464858055114746, -2.9148974418640137, -2.683309555053711, -2.451721429824829, -2.2201333045959473, -1.9885451793670654, -1.7569570541381836, -1.5253689289093018, -1.2937809228897095, -1.0621927976608276, -0.8306046724319458, -0.5990166664123535, -0.3674285411834717, -0.13584041595458984, 0.0957476794719696, 0.32733577489852905, 0.5589238405227661, 0.790511965751648, 1.0221000909805298, 1.253688097000122, 1.485276222229004, 1.7168643474578857, 1.9484524726867676, 2.1800405979156494, 2.4116287231445312, 2.643216609954834, 2.874804973602295, 3.1063928604125977, 3.3379809856414795, 3.5695691108703613, 3.801157236099243, 4.032745361328125, 4.264333248138428, 4.495921611785889, 4.727509498596191, 4.959097862243652, 5.190685749053955, 5.422273635864258, 5.6538615226745605, 5.8854498863220215, 6.117037773132324, 6.348626136779785, 6.580214023590088, 6.811801910400391, 7.043390274047852, 7.2749786376953125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 11.0, 22.0, 28.0, 39.0, 40.0, 88.0, 104.0, 198.0, 295.0, 492.0, 827.0, 1305.0, 2131.0, 3441.0, 5700.0, 9732.0, 16613.0, 28299.0, 51382.0, 101532.0, 212589.0, 283475.0, 157299.0, 77052.0, 40012.0, 22562.0, 13210.0, 7932.0, 4792.0, 2825.0, 1710.0, 1081.0, 630.0, 400.0, 243.0, 159.0, 98.0, 65.0, 47.0, 25.0, 23.0, 25.0, 11.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.326171875, -1.277587890625, -1.22900390625, -1.180419921875, -1.1318359375, -1.083251953125, -1.03466796875, -0.986083984375, -0.9375, -0.888916015625, -0.84033203125, -0.791748046875, -0.7431640625, -0.694580078125, -0.64599609375, -0.597412109375, -0.548828125, -0.500244140625, -0.45166015625, -0.403076171875, -0.3544921875, -0.305908203125, -0.25732421875, -0.208740234375, -0.16015625, -0.111572265625, -0.06298828125, -0.014404296875, 0.0341796875, 0.082763671875, 0.13134765625, 0.179931640625, 0.228515625, 0.277099609375, 0.32568359375, 0.374267578125, 0.4228515625, 0.471435546875, 0.52001953125, 0.568603515625, 0.6171875, 0.665771484375, 0.71435546875, 0.762939453125, 0.8115234375, 0.860107421875, 0.90869140625, 0.957275390625, 1.005859375, 1.054443359375, 1.10302734375, 1.151611328125, 1.2001953125, 1.248779296875, 1.29736328125, 1.345947265625, 1.39453125, 1.443115234375, 1.49169921875, 1.540283203125, 1.5888671875, 1.637451171875, 1.68603515625, 1.734619140625, 1.783203125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 8.0, 9.0, 15.0, 12.0, 11.0, 18.0, 17.0, 28.0, 31.0, 22.0, 35.0, 41.0, 36.0, 49.0, 32.0, 60.0, 45.0, 54.0, 47.0, 42.0, 45.0, 42.0, 43.0, 35.0, 23.0, 40.0, 31.0, 24.0, 21.0, 17.0, 16.0, 12.0, 5.0, 8.0, 11.0, 7.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9775390625, -0.9420013427734375, -0.906463623046875, -0.8709259033203125, -0.83538818359375, -0.7998504638671875, -0.764312744140625, -0.7287750244140625, -0.6932373046875, -0.6576995849609375, -0.622161865234375, -0.5866241455078125, -0.55108642578125, -0.5155487060546875, -0.480010986328125, -0.4444732666015625, -0.408935546875, -0.3733978271484375, -0.337860107421875, -0.3023223876953125, -0.26678466796875, -0.2312469482421875, -0.195709228515625, -0.1601715087890625, -0.1246337890625, -0.0890960693359375, -0.053558349609375, -0.0180206298828125, 0.01751708984375, 0.0530548095703125, 0.088592529296875, 0.1241302490234375, 0.15966796875, 0.1952056884765625, 0.230743408203125, 0.2662811279296875, 0.30181884765625, 0.3373565673828125, 0.372894287109375, 0.4084320068359375, 0.4439697265625, 0.4795074462890625, 0.515045166015625, 0.5505828857421875, 0.58612060546875, 0.6216583251953125, 0.657196044921875, 0.6927337646484375, 0.728271484375, 0.7638092041015625, 0.799346923828125, 0.8348846435546875, 0.87042236328125, 0.9059600830078125, 0.941497802734375, 0.9770355224609375, 1.0125732421875, 1.0481109619140625, 1.083648681640625, 1.1191864013671875, 1.15472412109375, 1.1902618408203125, 1.225799560546875, 1.2613372802734375, 1.296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 11.0, 8.0, 9.0, 21.0, 34.0, 40.0, 53.0, 81.0, 124.0, 219.0, 358.0, 916.0, 2466.0, 8482.0, 30249.0, 111641.0, 469583.0, 320013.0, 74520.0, 20452.0, 5937.0, 1866.0, 658.0, 293.0, 162.0, 111.0, 75.0, 61.0, 42.0, 23.0, 15.0, 11.0, 8.0, 8.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.845703125, -3.7353515625, -3.625, -3.5146484375, -3.404296875, -3.2939453125, -3.18359375, -3.0732421875, -2.962890625, -2.8525390625, -2.7421875, -2.6318359375, -2.521484375, -2.4111328125, -2.30078125, -2.1904296875, -2.080078125, -1.9697265625, -1.859375, -1.7490234375, -1.638671875, -1.5283203125, -1.41796875, -1.3076171875, -1.197265625, -1.0869140625, -0.9765625, -0.8662109375, -0.755859375, -0.6455078125, -0.53515625, -0.4248046875, -0.314453125, -0.2041015625, -0.09375, 0.0166015625, 0.126953125, 0.2373046875, 0.34765625, 0.4580078125, 0.568359375, 0.6787109375, 0.7890625, 0.8994140625, 1.009765625, 1.1201171875, 1.23046875, 1.3408203125, 1.451171875, 1.5615234375, 1.671875, 1.7822265625, 1.892578125, 2.0029296875, 2.11328125, 2.2236328125, 2.333984375, 2.4443359375, 2.5546875, 2.6650390625, 2.775390625, 2.8857421875, 2.99609375, 3.1064453125, 3.216796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 5.0, 8.0, 6.0, 4.0, 12.0, 10.0, 9.0, 13.0, 19.0, 18.0, 27.0, 24.0, 19.0, 38.0, 45.0, 36.0, 34.0, 43.0, 56.0, 44.0, 41.0, 52.0, 46.0, 43.0, 41.0, 42.0, 36.0, 24.0, 27.0, 28.0, 28.0, 19.0, 14.0, 14.0, 13.0, 9.0, 13.0, 12.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.673828125, -3.559539794921875, -3.44525146484375, -3.330963134765625, -3.2166748046875, -3.102386474609375, -2.98809814453125, -2.873809814453125, -2.759521484375, -2.645233154296875, -2.53094482421875, -2.416656494140625, -2.3023681640625, -2.188079833984375, -2.07379150390625, -1.959503173828125, -1.84521484375, -1.730926513671875, -1.61663818359375, -1.502349853515625, -1.3880615234375, -1.273773193359375, -1.15948486328125, -1.045196533203125, -0.930908203125, -0.816619873046875, -0.70233154296875, -0.588043212890625, -0.4737548828125, -0.359466552734375, -0.24517822265625, -0.130889892578125, -0.0166015625, 0.097686767578125, 0.21197509765625, 0.326263427734375, 0.4405517578125, 0.554840087890625, 0.66912841796875, 0.783416748046875, 0.897705078125, 1.011993408203125, 1.12628173828125, 1.240570068359375, 1.3548583984375, 1.469146728515625, 1.58343505859375, 1.697723388671875, 1.81201171875, 1.926300048828125, 2.04058837890625, 2.154876708984375, 2.2691650390625, 2.383453369140625, 2.49774169921875, 2.612030029296875, 2.726318359375, 2.840606689453125, 2.95489501953125, 3.069183349609375, 3.1834716796875, 3.297760009765625, 3.41204833984375, 3.526336669921875, 3.640625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 7.0, 5.0, 8.0, 10.0, 11.0, 8.0, 14.0, 25.0, 31.0, 60.0, 84.0, 134.0, 271.0, 486.0, 1139.0, 2806.0, 7630.0, 22199.0, 67440.0, 236362.0, 482792.0, 154421.0, 47282.0, 15781.0, 5639.0, 2092.0, 860.0, 398.0, 181.0, 127.0, 70.0, 53.0, 34.0, 29.0, 20.0, 9.0, 12.0, 14.0, 5.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3779296875, -1.33251953125, -1.287109375, -1.24169921875, -1.1962890625, -1.15087890625, -1.10546875, -1.06005859375, -1.0146484375, -0.96923828125, -0.923828125, -0.87841796875, -0.8330078125, -0.78759765625, -0.7421875, -0.69677734375, -0.6513671875, -0.60595703125, -0.560546875, -0.51513671875, -0.4697265625, -0.42431640625, -0.37890625, -0.33349609375, -0.2880859375, -0.24267578125, -0.197265625, -0.15185546875, -0.1064453125, -0.06103515625, -0.015625, 0.02978515625, 0.0751953125, 0.12060546875, 0.166015625, 0.21142578125, 0.2568359375, 0.30224609375, 0.34765625, 0.39306640625, 0.4384765625, 0.48388671875, 0.529296875, 0.57470703125, 0.6201171875, 0.66552734375, 0.7109375, 0.75634765625, 0.8017578125, 0.84716796875, 0.892578125, 0.93798828125, 0.9833984375, 1.02880859375, 1.07421875, 1.11962890625, 1.1650390625, 1.21044921875, 1.255859375, 1.30126953125, 1.3466796875, 1.39208984375, 1.4375, 1.48291015625, 1.5283203125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 8.0, 7.0, 8.0, 13.0, 7.0, 12.0, 21.0, 21.0, 14.0, 33.0, 38.0, 81.0, 113.0, 148.0, 117.0, 95.0, 69.0, 45.0, 34.0, 18.0, 19.0, 19.0, 15.0, 11.0, 5.0, 4.0, 6.0, 4.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003037452697753906, -0.0002957247197628021, -0.0002877041697502136, -0.0002796836197376251, -0.0002716630697250366, -0.0002636425197124481, -0.0002556219696998596, -0.0002476014196872711, -0.00023958086967468262, -0.00023156031966209412, -0.00022353976964950562, -0.00021551921963691711, -0.0002074986696243286, -0.0001994781196117401, -0.0001914575695991516, -0.0001834370195865631, -0.0001754164695739746, -0.0001673959195613861, -0.0001593753695487976, -0.0001513548195362091, -0.0001433342695236206, -0.0001353137195110321, -0.0001272931694984436, -0.0001192726194858551, -0.0001112520694732666, -0.0001032315194606781, -9.52109694480896e-05, -8.71904194355011e-05, -7.91698694229126e-05, -7.11493194103241e-05, -6.31287693977356e-05, -5.5108219385147095e-05, -4.7087669372558594e-05, -3.906711935997009e-05, -3.104656934738159e-05, -2.302601933479309e-05, -1.500546932220459e-05, -6.984919309616089e-06, 1.0356307029724121e-06, 9.056180715560913e-06, 1.7076730728149414e-05, 2.5097280740737915e-05, 3.3117830753326416e-05, 4.113838076591492e-05, 4.915893077850342e-05, 5.717948079109192e-05, 6.520003080368042e-05, 7.322058081626892e-05, 8.124113082885742e-05, 8.926168084144592e-05, 9.728223085403442e-05, 0.00010530278086662292, 0.00011332333087921143, 0.00012134388089179993, 0.00012936443090438843, 0.00013738498091697693, 0.00014540553092956543, 0.00015342608094215393, 0.00016144663095474243, 0.00016946718096733093, 0.00017748773097991943, 0.00018550828099250793, 0.00019352883100509644, 0.00020154938101768494, 0.00020956993103027344]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 8.0, 3.0, 8.0, 4.0, 15.0, 7.0, 20.0, 19.0, 51.0, 60.0, 103.0, 131.0, 210.0, 443.0, 679.0, 1260.0, 2483.0, 5019.0, 10256.0, 22571.0, 49255.0, 113987.0, 279533.0, 317650.0, 136923.0, 57796.0, 25914.0, 12070.0, 5744.0, 2885.0, 1455.0, 792.0, 466.0, 251.0, 152.0, 107.0, 70.0, 39.0, 33.0, 19.0, 16.0, 16.0, 18.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.015625, -0.9849395751953125, -0.954254150390625, -0.9235687255859375, -0.89288330078125, -0.8621978759765625, -0.831512451171875, -0.8008270263671875, -0.7701416015625, -0.7394561767578125, -0.708770751953125, -0.6780853271484375, -0.64739990234375, -0.6167144775390625, -0.586029052734375, -0.5553436279296875, -0.524658203125, -0.4939727783203125, -0.463287353515625, -0.4326019287109375, -0.40191650390625, -0.3712310791015625, -0.340545654296875, -0.3098602294921875, -0.2791748046875, -0.2484893798828125, -0.217803955078125, -0.1871185302734375, -0.15643310546875, -0.1257476806640625, -0.095062255859375, -0.0643768310546875, -0.03369140625, -0.0030059814453125, 0.027679443359375, 0.0583648681640625, 0.08905029296875, 0.1197357177734375, 0.150421142578125, 0.1811065673828125, 0.2117919921875, 0.2424774169921875, 0.273162841796875, 0.3038482666015625, 0.33453369140625, 0.3652191162109375, 0.395904541015625, 0.4265899658203125, 0.457275390625, 0.4879608154296875, 0.518646240234375, 0.5493316650390625, 0.58001708984375, 0.6107025146484375, 0.641387939453125, 0.6720733642578125, 0.7027587890625, 0.7334442138671875, 0.764129638671875, 0.7948150634765625, 0.82550048828125, 0.8561859130859375, 0.886871337890625, 0.9175567626953125, 0.9482421875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 4.0, 10.0, 8.0, 6.0, 10.0, 9.0, 9.0, 17.0, 14.0, 24.0, 19.0, 24.0, 38.0, 32.0, 40.0, 49.0, 82.0, 81.0, 81.0, 68.0, 43.0, 63.0, 54.0, 37.0, 25.0, 24.0, 24.0, 19.0, 13.0, 11.0, 9.0, 10.0, 2.0, 4.0, 6.0, 8.0, 5.0, 1.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0], "bins": [-1.025390625, -0.9938735961914062, -0.9623565673828125, -0.9308395385742188, -0.899322509765625, -0.8678054809570312, -0.8362884521484375, -0.8047714233398438, -0.77325439453125, -0.7417373657226562, -0.7102203369140625, -0.6787033081054688, -0.647186279296875, -0.6156692504882812, -0.5841522216796875, -0.5526351928710938, -0.5211181640625, -0.48960113525390625, -0.4580841064453125, -0.42656707763671875, -0.395050048828125, -0.36353302001953125, -0.3320159912109375, -0.30049896240234375, -0.26898193359375, -0.23746490478515625, -0.2059478759765625, -0.17443084716796875, -0.142913818359375, -0.11139678955078125, -0.0798797607421875, -0.04836273193359375, -0.016845703125, 0.01467132568359375, 0.0461883544921875, 0.07770538330078125, 0.109222412109375, 0.14073944091796875, 0.1722564697265625, 0.20377349853515625, 0.23529052734375, 0.26680755615234375, 0.2983245849609375, 0.32984161376953125, 0.361358642578125, 0.39287567138671875, 0.4243927001953125, 0.45590972900390625, 0.4874267578125, 0.5189437866210938, 0.5504608154296875, 0.5819778442382812, 0.613494873046875, 0.6450119018554688, 0.6765289306640625, 0.7080459594726562, 0.73956298828125, 0.7710800170898438, 0.8025970458984375, 0.8341140747070312, 0.865631103515625, 0.8971481323242188, 0.9286651611328125, 0.9601821899414062, 0.99169921875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 7.0, 5.0, 29.0, 179.0, 391.0, 312.0, 80.0, 13.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.794010162353516, -11.140338897705078, -9.48666763305664, -7.832995414733887, -6.179324150085449, -4.525652885437012, -2.871980667114258, -1.2183094024658203, 0.4353618621826172, 2.089033365249634, 3.7427048683166504, 5.396376609802246, 7.050047874450684, 8.703719139099121, 10.357391357421875, 12.011062622070312, 13.66473388671875, 15.318405151367188, 16.972076416015625, 18.625747680664062, 20.2794189453125, 21.933090209960938, 23.586763381958008, 25.240434646606445, 26.894105911254883, 28.54777717590332, 30.201448440551758, 31.855121612548828, 33.508792877197266, 35.1624641418457, 36.81613540649414, 38.46980667114258, 40.12348175048828, 41.77715301513672, 43.430824279785156, 45.084495544433594, 46.73816680908203, 48.39183807373047, 50.045509338378906, 51.699180603027344, 53.35285186767578, 55.00652313232422, 56.660194396972656, 58.313865661621094, 59.96753692626953, 61.62120819091797, 63.274879455566406, 64.92855072021484, 66.58222961425781, 68.23590087890625, 69.88957214355469, 71.54324340820312, 73.19691467285156, 74.8505859375, 76.50425720214844, 78.15792846679688, 79.81159973144531, 81.46527099609375, 83.11894226074219, 84.77261352539062, 86.42628479003906, 88.0799560546875, 89.73362731933594, 91.38729858398438, 93.04096984863281]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 7.0, 6.0, 10.0, 9.0, 7.0, 11.0, 14.0, 15.0, 14.0, 23.0, 32.0, 29.0, 29.0, 41.0, 34.0, 36.0, 46.0, 44.0, 43.0, 47.0, 55.0, 41.0, 44.0, 49.0, 46.0, 34.0, 31.0, 28.0, 24.0, 32.0, 16.0, 16.0, 11.0, 14.0, 12.0, 13.0, 7.0, 6.0, 2.0, 9.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.557900428771973, -10.201011657714844, -9.844121932983398, -9.487232208251953, -9.130343437194824, -8.773454666137695, -8.41656494140625, -8.059675216674805, -7.702786445617676, -7.345897197723389, -6.989007949829102, -6.6321187019348145, -6.275229454040527, -5.91834020614624, -5.561450958251953, -5.204561710357666, -4.847672462463379, -4.490783214569092, -4.133893966674805, -3.7770047187805176, -3.4201154708862305, -3.0632262229919434, -2.7063369750976562, -2.349447727203369, -1.992558479309082, -1.635669231414795, -1.2787799835205078, -0.9218907356262207, -0.5650014877319336, -0.20811223983764648, 0.14877700805664062, 0.5056662559509277, 0.8625564575195312, 1.2194457054138184, 1.5763349533081055, 1.9332242012023926, 2.2901134490966797, 2.647002696990967, 3.003891944885254, 3.360781192779541, 3.717670440673828, 4.074559688568115, 4.431448936462402, 4.7883381843566895, 5.145227432250977, 5.502116680145264, 5.859005928039551, 6.215895175933838, 6.572784423828125, 6.929673671722412, 7.286562919616699, 7.643452167510986, 8.000341415405273, 8.357231140136719, 8.714119911193848, 9.071008682250977, 9.427898406982422, 9.784788131713867, 10.141676902770996, 10.498565673828125, 10.85545539855957, 11.212345123291016, 11.569233894348145, 11.926122665405273, 12.283012390136719]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 12.0, 16.0, 14.0, 30.0, 48.0, 52.0, 82.0, 100.0, 146.0, 219.0, 337.0, 463.0, 705.0, 1121.0, 1754.0, 2797.0, 4503.0, 7922.0, 13979.0, 25330.0, 48968.0, 101071.0, 229044.0, 614755.0, 1662932.0, 898264.0, 311009.0, 132202.0, 62669.0, 31899.0, 17050.0, 9720.0, 5663.0, 3367.0, 2037.0, 1318.0, 844.0, 584.0, 399.0, 289.0, 180.0, 116.0, 63.0, 48.0, 74.0, 33.0, 20.0, 13.0, 8.0, 10.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.212890625, -1.174591064453125, -1.13629150390625, -1.097991943359375, -1.0596923828125, -1.021392822265625, -0.98309326171875, -0.944793701171875, -0.906494140625, -0.868194580078125, -0.82989501953125, -0.791595458984375, -0.7532958984375, -0.714996337890625, -0.67669677734375, -0.638397216796875, -0.60009765625, -0.561798095703125, -0.52349853515625, -0.485198974609375, -0.4468994140625, -0.408599853515625, -0.37030029296875, -0.332000732421875, -0.293701171875, -0.255401611328125, -0.21710205078125, -0.178802490234375, -0.1405029296875, -0.102203369140625, -0.06390380859375, -0.025604248046875, 0.0126953125, 0.050994873046875, 0.08929443359375, 0.127593994140625, 0.1658935546875, 0.204193115234375, 0.24249267578125, 0.280792236328125, 0.319091796875, 0.357391357421875, 0.39569091796875, 0.433990478515625, 0.4722900390625, 0.510589599609375, 0.54888916015625, 0.587188720703125, 0.62548828125, 0.663787841796875, 0.70208740234375, 0.740386962890625, 0.7786865234375, 0.816986083984375, 0.85528564453125, 0.893585205078125, 0.931884765625, 0.970184326171875, 1.00848388671875, 1.046783447265625, 1.0850830078125, 1.123382568359375, 1.16168212890625, 1.199981689453125, 1.23828125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 8.0, 4.0, 6.0, 7.0, 7.0, 16.0, 18.0, 13.0, 21.0, 18.0, 34.0, 29.0, 38.0, 25.0, 29.0, 38.0, 39.0, 38.0, 43.0, 46.0, 33.0, 36.0, 51.0, 48.0, 40.0, 47.0, 37.0, 21.0, 32.0, 24.0, 28.0, 21.0, 15.0, 16.0, 12.0, 24.0, 8.0, 6.0, 11.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.17578125, -1.1382904052734375, -1.100799560546875, -1.0633087158203125, -1.02581787109375, -0.9883270263671875, -0.950836181640625, -0.9133453369140625, -0.8758544921875, -0.8383636474609375, -0.800872802734375, -0.7633819580078125, -0.72589111328125, -0.6884002685546875, -0.650909423828125, -0.6134185791015625, -0.575927734375, -0.5384368896484375, -0.500946044921875, -0.4634552001953125, -0.42596435546875, -0.3884735107421875, -0.350982666015625, -0.3134918212890625, -0.2760009765625, -0.2385101318359375, -0.201019287109375, -0.1635284423828125, -0.12603759765625, -0.0885467529296875, -0.051055908203125, -0.0135650634765625, 0.02392578125, 0.0614166259765625, 0.098907470703125, 0.1363983154296875, 0.17388916015625, 0.2113800048828125, 0.248870849609375, 0.2863616943359375, 0.3238525390625, 0.3613433837890625, 0.398834228515625, 0.4363250732421875, 0.47381591796875, 0.5113067626953125, 0.548797607421875, 0.5862884521484375, 0.623779296875, 0.6612701416015625, 0.698760986328125, 0.7362518310546875, 0.77374267578125, 0.8112335205078125, 0.848724365234375, 0.8862152099609375, 0.9237060546875, 0.9611968994140625, 0.998687744140625, 1.0361785888671875, 1.07366943359375, 1.1111602783203125, 1.148651123046875, 1.1861419677734375, 1.2236328125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 6.0, 7.0, 15.0, 16.0, 28.0, 25.0, 52.0, 75.0, 120.0, 199.0, 360.0, 670.0, 1297.0, 2791.0, 6998.0, 20254.0, 62163.0, 220093.0, 1051077.0, 2219230.0, 442633.0, 112498.0, 33931.0, 11419.0, 4305.0, 1921.0, 883.0, 463.0, 266.0, 151.0, 103.0, 53.0, 43.0, 35.0, 19.0, 24.0, 12.0, 13.0, 8.0, 7.0, 3.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.78515625, -2.696014404296875, -2.60687255859375, -2.517730712890625, -2.4285888671875, -2.339447021484375, -2.25030517578125, -2.161163330078125, -2.072021484375, -1.982879638671875, -1.89373779296875, -1.804595947265625, -1.7154541015625, -1.626312255859375, -1.53717041015625, -1.448028564453125, -1.35888671875, -1.269744873046875, -1.18060302734375, -1.091461181640625, -1.0023193359375, -0.913177490234375, -0.82403564453125, -0.734893798828125, -0.645751953125, -0.556610107421875, -0.46746826171875, -0.378326416015625, -0.2891845703125, -0.200042724609375, -0.11090087890625, -0.021759033203125, 0.0673828125, 0.156524658203125, 0.24566650390625, 0.334808349609375, 0.4239501953125, 0.513092041015625, 0.60223388671875, 0.691375732421875, 0.780517578125, 0.869659423828125, 0.95880126953125, 1.047943115234375, 1.1370849609375, 1.226226806640625, 1.31536865234375, 1.404510498046875, 1.49365234375, 1.582794189453125, 1.67193603515625, 1.761077880859375, 1.8502197265625, 1.939361572265625, 2.02850341796875, 2.117645263671875, 2.206787109375, 2.295928955078125, 2.38507080078125, 2.474212646484375, 2.5633544921875, 2.652496337890625, 2.74163818359375, 2.830780029296875, 2.919921875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 8.0, 13.0, 16.0, 31.0, 40.0, 39.0, 72.0, 112.0, 135.0, 228.0, 362.0, 597.0, 770.0, 596.0, 365.0, 244.0, 148.0, 87.0, 63.0, 39.0, 28.0, 22.0, 18.0, 9.0, 6.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.080078125, -2.98236083984375, -2.8846435546875, -2.78692626953125, -2.689208984375, -2.59149169921875, -2.4937744140625, -2.39605712890625, -2.29833984375, -2.20062255859375, -2.1029052734375, -2.00518798828125, -1.907470703125, -1.80975341796875, -1.7120361328125, -1.61431884765625, -1.5166015625, -1.41888427734375, -1.3211669921875, -1.22344970703125, -1.125732421875, -1.02801513671875, -0.9302978515625, -0.83258056640625, -0.73486328125, -0.63714599609375, -0.5394287109375, -0.44171142578125, -0.343994140625, -0.24627685546875, -0.1485595703125, -0.05084228515625, 0.046875, 0.14459228515625, 0.2423095703125, 0.34002685546875, 0.437744140625, 0.53546142578125, 0.6331787109375, 0.73089599609375, 0.82861328125, 0.92633056640625, 1.0240478515625, 1.12176513671875, 1.219482421875, 1.31719970703125, 1.4149169921875, 1.51263427734375, 1.6103515625, 1.70806884765625, 1.8057861328125, 1.90350341796875, 2.001220703125, 2.09893798828125, 2.1966552734375, 2.29437255859375, 2.39208984375, 2.48980712890625, 2.5875244140625, 2.68524169921875, 2.782958984375, 2.88067626953125, 2.9783935546875, 3.07611083984375, 3.173828125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 8.0, 7.0, 19.0, 20.0, 26.0, 32.0, 49.0, 44.0, 66.0, 66.0, 78.0, 74.0, 77.0, 96.0, 76.0, 51.0, 46.0, 45.0, 30.0, 23.0, 24.0, 10.0, 7.0, 5.0, 5.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.427412033081055, -10.109634399414062, -9.791857719421387, -9.474080085754395, -9.156303405761719, -8.838525772094727, -8.520748138427734, -8.202970504760742, -7.885193824768066, -7.567416667938232, -7.249639511108398, -6.931861877441406, -6.614084720611572, -6.296307563781738, -5.978529930114746, -5.660752773284912, -5.342975616455078, -5.025198459625244, -4.70742130279541, -4.389643669128418, -4.071866512298584, -3.75408935546875, -3.436311960220337, -3.118534564971924, -2.80075740814209, -2.482980251312256, -2.1652028560638428, -1.8474255800247192, -1.5296483039855957, -1.2118710279464722, -0.8940937519073486, -0.5763163566589355, -0.25853919982910156, 0.05923807621002197, 0.3770153522491455, 0.694792628288269, 1.0125699043273926, 1.3303471803665161, 1.6481244564056396, 1.9659018516540527, 2.2836790084838867, 2.6014561653137207, 2.919233560562134, 3.237010955810547, 3.554788112640381, 3.872565269470215, 4.190342903137207, 4.508120059967041, 4.825897216796875, 5.143674373626709, 5.461451530456543, 5.779229164123535, 6.097006320953369, 6.414783477783203, 6.732561111450195, 7.050338268280029, 7.368115425109863, 7.685892581939697, 8.003669738769531, 8.321447372436523, 8.639225006103516, 8.957001686096191, 9.274779319763184, 9.59255599975586, 9.910333633422852]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 4.0, 10.0, 7.0, 8.0, 10.0, 13.0, 19.0, 14.0, 34.0, 21.0, 32.0, 20.0, 36.0, 33.0, 34.0, 38.0, 43.0, 42.0, 49.0, 54.0, 44.0, 51.0, 43.0, 46.0, 42.0, 40.0, 37.0, 21.0, 27.0, 24.0, 20.0, 14.0, 13.0, 8.0, 15.0, 6.0, 8.0, 8.0, 5.0, 2.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-9.653166770935059, -9.388315200805664, -9.123462677001953, -8.858611106872559, -8.593759536743164, -8.328907012939453, -8.064055442810059, -7.799203872680664, -7.534351825714111, -7.269499778747559, -7.004648208618164, -6.739796161651611, -6.474944114685059, -6.210092544555664, -5.945240497589111, -5.680388450622559, -5.415536880493164, -5.150684833526611, -4.885833263397217, -4.620981216430664, -4.3561296463012695, -4.091277599334717, -3.826425552368164, -3.5615737438201904, -3.296721935272217, -3.031870126724243, -2.7670183181762695, -2.502166271209717, -2.237314462661743, -1.9724626541137695, -1.7076107263565063, -1.4427587985992432, -1.177907943725586, -0.9130560755729675, -0.6482042074203491, -0.3833523392677307, -0.1185004711151123, 0.14635133743286133, 0.4112032651901245, 0.6760551929473877, 0.9409070014953613, 1.205758810043335, 1.4706107378005981, 1.7354626655578613, 2.000314474105835, 2.2651662826538086, 2.5300183296203613, 2.794870138168335, 3.0597219467163086, 3.3245737552642822, 3.589425563812256, 3.8542776107788086, 4.119129180908203, 4.383981227874756, 4.648833274841309, 4.913684844970703, 5.178536891937256, 5.443388938903809, 5.708240509033203, 5.973092555999756, 6.237944602966309, 6.502796173095703, 6.767648220062256, 7.032500267028809, 7.297351837158203]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 4.0, 3.0, 5.0, 12.0, 10.0, 17.0, 21.0, 34.0, 59.0, 83.0, 127.0, 163.0, 245.0, 387.0, 477.0, 713.0, 1025.0, 1541.0, 2216.0, 3300.0, 5141.0, 7800.0, 12138.0, 19087.0, 32328.0, 57983.0, 136811.0, 326090.0, 237104.0, 89555.0, 43978.0, 25210.0, 15459.0, 9927.0, 6382.0, 4210.0, 2845.0, 2006.0, 1300.0, 845.0, 604.0, 368.0, 295.0, 229.0, 127.0, 91.0, 63.0, 55.0, 25.0, 25.0, 11.0, 7.0, 5.0, 6.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.375, -1.33172607421875, -1.2884521484375, -1.24517822265625, -1.201904296875, -1.15863037109375, -1.1153564453125, -1.07208251953125, -1.02880859375, -0.98553466796875, -0.9422607421875, -0.89898681640625, -0.855712890625, -0.81243896484375, -0.7691650390625, -0.72589111328125, -0.6826171875, -0.63934326171875, -0.5960693359375, -0.55279541015625, -0.509521484375, -0.46624755859375, -0.4229736328125, -0.37969970703125, -0.33642578125, -0.29315185546875, -0.2498779296875, -0.20660400390625, -0.163330078125, -0.12005615234375, -0.0767822265625, -0.03350830078125, 0.009765625, 0.05303955078125, 0.0963134765625, 0.13958740234375, 0.182861328125, 0.22613525390625, 0.2694091796875, 0.31268310546875, 0.35595703125, 0.39923095703125, 0.4425048828125, 0.48577880859375, 0.529052734375, 0.57232666015625, 0.6156005859375, 0.65887451171875, 0.7021484375, 0.74542236328125, 0.7886962890625, 0.83197021484375, 0.875244140625, 0.91851806640625, 0.9617919921875, 1.00506591796875, 1.04833984375, 1.09161376953125, 1.1348876953125, 1.17816162109375, 1.221435546875, 1.26470947265625, 1.3079833984375, 1.35125732421875, 1.39453125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 7.0, 5.0, 8.0, 12.0, 14.0, 13.0, 14.0, 9.0, 21.0, 17.0, 24.0, 20.0, 30.0, 26.0, 26.0, 43.0, 26.0, 34.0, 42.0, 34.0, 36.0, 31.0, 35.0, 49.0, 29.0, 35.0, 37.0, 25.0, 35.0, 36.0, 37.0, 25.0, 24.0, 22.0, 24.0, 12.0, 16.0, 12.0, 5.0, 14.0, 6.0, 8.0, 7.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.12890625, -1.095367431640625, -1.06182861328125, -1.028289794921875, -0.9947509765625, -0.961212158203125, -0.92767333984375, -0.894134521484375, -0.860595703125, -0.827056884765625, -0.79351806640625, -0.759979248046875, -0.7264404296875, -0.692901611328125, -0.65936279296875, -0.625823974609375, -0.59228515625, -0.558746337890625, -0.52520751953125, -0.491668701171875, -0.4581298828125, -0.424591064453125, -0.39105224609375, -0.357513427734375, -0.323974609375, -0.290435791015625, -0.25689697265625, -0.223358154296875, -0.1898193359375, -0.156280517578125, -0.12274169921875, -0.089202880859375, -0.0556640625, -0.022125244140625, 0.01141357421875, 0.044952392578125, 0.0784912109375, 0.112030029296875, 0.14556884765625, 0.179107666015625, 0.212646484375, 0.246185302734375, 0.27972412109375, 0.313262939453125, 0.3468017578125, 0.380340576171875, 0.41387939453125, 0.447418212890625, 0.48095703125, 0.514495849609375, 0.54803466796875, 0.581573486328125, 0.6151123046875, 0.648651123046875, 0.68218994140625, 0.715728759765625, 0.749267578125, 0.782806396484375, 0.81634521484375, 0.849884033203125, 0.8834228515625, 0.916961669921875, 0.95050048828125, 0.984039306640625, 1.017578125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 8.0, 10.0, 11.0, 28.0, 26.0, 38.0, 41.0, 97.0, 146.0, 236.0, 442.0, 1135.0, 3072.0, 7929.0, 21221.0, 62973.0, 326935.0, 494221.0, 86020.0, 27275.0, 10081.0, 3795.0, 1489.0, 612.0, 307.0, 138.0, 79.0, 66.0, 38.0, 26.0, 15.0, 13.0, 8.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.265625, -3.169921875, -3.07421875, -2.978515625, -2.8828125, -2.787109375, -2.69140625, -2.595703125, -2.5, -2.404296875, -2.30859375, -2.212890625, -2.1171875, -2.021484375, -1.92578125, -1.830078125, -1.734375, -1.638671875, -1.54296875, -1.447265625, -1.3515625, -1.255859375, -1.16015625, -1.064453125, -0.96875, -0.873046875, -0.77734375, -0.681640625, -0.5859375, -0.490234375, -0.39453125, -0.298828125, -0.203125, -0.107421875, -0.01171875, 0.083984375, 0.1796875, 0.275390625, 0.37109375, 0.466796875, 0.5625, 0.658203125, 0.75390625, 0.849609375, 0.9453125, 1.041015625, 1.13671875, 1.232421875, 1.328125, 1.423828125, 1.51953125, 1.615234375, 1.7109375, 1.806640625, 1.90234375, 1.998046875, 2.09375, 2.189453125, 2.28515625, 2.380859375, 2.4765625, 2.572265625, 2.66796875, 2.763671875, 2.859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 8.0, 4.0, 4.0, 7.0, 9.0, 11.0, 17.0, 18.0, 13.0, 26.0, 21.0, 23.0, 40.0, 32.0, 40.0, 49.0, 43.0, 49.0, 50.0, 56.0, 62.0, 52.0, 45.0, 52.0, 29.0, 41.0, 24.0, 32.0, 21.0, 23.0, 23.0, 15.0, 17.0, 13.0, 11.0, 7.0, 7.0, 4.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.58203125, -3.4610595703125, -3.340087890625, -3.2191162109375, -3.09814453125, -2.9771728515625, -2.856201171875, -2.7352294921875, -2.6142578125, -2.4932861328125, -2.372314453125, -2.2513427734375, -2.13037109375, -2.0093994140625, -1.888427734375, -1.7674560546875, -1.646484375, -1.5255126953125, -1.404541015625, -1.2835693359375, -1.16259765625, -1.0416259765625, -0.920654296875, -0.7996826171875, -0.6787109375, -0.5577392578125, -0.436767578125, -0.3157958984375, -0.19482421875, -0.0738525390625, 0.047119140625, 0.1680908203125, 0.2890625, 0.4100341796875, 0.531005859375, 0.6519775390625, 0.77294921875, 0.8939208984375, 1.014892578125, 1.1358642578125, 1.2568359375, 1.3778076171875, 1.498779296875, 1.6197509765625, 1.74072265625, 1.8616943359375, 1.982666015625, 2.1036376953125, 2.224609375, 2.3455810546875, 2.466552734375, 2.5875244140625, 2.70849609375, 2.8294677734375, 2.950439453125, 3.0714111328125, 3.1923828125, 3.3133544921875, 3.434326171875, 3.5552978515625, 3.67626953125, 3.7972412109375, 3.918212890625, 4.0391845703125, 4.16015625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 16.0, 19.0, 19.0, 32.0, 40.0, 59.0, 104.0, 136.0, 211.0, 354.0, 757.0, 1237.0, 2516.0, 5060.0, 10047.0, 20395.0, 43330.0, 92465.0, 252969.0, 377213.0, 128660.0, 58333.0, 27567.0, 13373.0, 6605.0, 3320.0, 1661.0, 838.0, 472.0, 257.0, 164.0, 83.0, 76.0, 56.0, 34.0, 14.0, 5.0, 13.0, 10.0, 7.0, 4.0, 3.0, 4.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.83544921875, -0.8077850341796875, -0.780120849609375, -0.7524566650390625, -0.72479248046875, -0.6971282958984375, -0.669464111328125, -0.6417999267578125, -0.6141357421875, -0.5864715576171875, -0.558807373046875, -0.5311431884765625, -0.50347900390625, -0.4758148193359375, -0.448150634765625, -0.4204864501953125, -0.392822265625, -0.3651580810546875, -0.337493896484375, -0.3098297119140625, -0.28216552734375, -0.2545013427734375, -0.226837158203125, -0.1991729736328125, -0.1715087890625, -0.1438446044921875, -0.116180419921875, -0.0885162353515625, -0.06085205078125, -0.0331878662109375, -0.005523681640625, 0.0221405029296875, 0.0498046875, 0.0774688720703125, 0.105133056640625, 0.1327972412109375, 0.16046142578125, 0.1881256103515625, 0.215789794921875, 0.2434539794921875, 0.2711181640625, 0.2987823486328125, 0.326446533203125, 0.3541107177734375, 0.38177490234375, 0.4094390869140625, 0.437103271484375, 0.4647674560546875, 0.492431640625, 0.5200958251953125, 0.547760009765625, 0.5754241943359375, 0.60308837890625, 0.6307525634765625, 0.658416748046875, 0.6860809326171875, 0.7137451171875, 0.7414093017578125, 0.769073486328125, 0.7967376708984375, 0.82440185546875, 0.8520660400390625, 0.879730224609375, 0.9073944091796875, 0.93505859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 7.0, 6.0, 6.0, 4.0, 9.0, 13.0, 19.0, 22.0, 25.0, 41.0, 45.0, 68.0, 102.0, 160.0, 136.0, 91.0, 56.0, 36.0, 29.0, 17.0, 21.0, 14.0, 16.0, 7.0, 8.0, 10.0, 7.0, 8.0, 1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.00019359588623046875, -0.0001871064305305481, -0.00018061697483062744, -0.0001741275191307068, -0.00016763806343078613, -0.00016114860773086548, -0.00015465915203094482, -0.00014816969633102417, -0.00014168024063110352, -0.00013519078493118286, -0.0001287013292312622, -0.00012221187353134155, -0.0001157224178314209, -0.00010923296213150024, -0.00010274350643157959, -9.625405073165894e-05, -8.976459503173828e-05, -8.327513933181763e-05, -7.678568363189697e-05, -7.029622793197632e-05, -6.380677223205566e-05, -5.731731653213501e-05, -5.0827860832214355e-05, -4.43384051322937e-05, -3.784894943237305e-05, -3.135949373245239e-05, -2.4870038032531738e-05, -1.8380582332611084e-05, -1.189112663269043e-05, -5.401670932769775e-06, 1.087784767150879e-06, 7.577240467071533e-06, 1.4066696166992188e-05, 2.0556151866912842e-05, 2.7045607566833496e-05, 3.353506326675415e-05, 4.0024518966674805e-05, 4.651397466659546e-05, 5.300343036651611e-05, 5.949288606643677e-05, 6.598234176635742e-05, 7.247179746627808e-05, 7.896125316619873e-05, 8.545070886611938e-05, 9.194016456604004e-05, 9.84296202659607e-05, 0.00010491907596588135, 0.000111408531665802, 0.00011789798736572266, 0.0001243874430656433, 0.00013087689876556396, 0.00013736635446548462, 0.00014385581016540527, 0.00015034526586532593, 0.00015683472156524658, 0.00016332417726516724, 0.0001698136329650879, 0.00017630308866500854, 0.0001827925443649292, 0.00018928200006484985, 0.0001957714557647705, 0.00020226091146469116, 0.00020875036716461182, 0.00021523982286453247, 0.00022172927856445312]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 13.0, 11.0, 30.0, 34.0, 43.0, 73.0, 120.0, 199.0, 350.0, 681.0, 1391.0, 3144.0, 8179.0, 24722.0, 84594.0, 375574.0, 413826.0, 93109.0, 27189.0, 8767.0, 3324.0, 1462.0, 737.0, 398.0, 220.0, 107.0, 82.0, 70.0, 35.0, 17.0, 12.0, 14.0, 7.0, 10.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.4296875, -1.38641357421875, -1.3431396484375, -1.29986572265625, -1.256591796875, -1.21331787109375, -1.1700439453125, -1.12677001953125, -1.08349609375, -1.04022216796875, -0.9969482421875, -0.95367431640625, -0.910400390625, -0.86712646484375, -0.8238525390625, -0.78057861328125, -0.7373046875, -0.69403076171875, -0.6507568359375, -0.60748291015625, -0.564208984375, -0.52093505859375, -0.4776611328125, -0.43438720703125, -0.39111328125, -0.34783935546875, -0.3045654296875, -0.26129150390625, -0.218017578125, -0.17474365234375, -0.1314697265625, -0.08819580078125, -0.044921875, -0.00164794921875, 0.0416259765625, 0.08489990234375, 0.128173828125, 0.17144775390625, 0.2147216796875, 0.25799560546875, 0.30126953125, 0.34454345703125, 0.3878173828125, 0.43109130859375, 0.474365234375, 0.51763916015625, 0.5609130859375, 0.60418701171875, 0.6474609375, 0.69073486328125, 0.7340087890625, 0.77728271484375, 0.820556640625, 0.86383056640625, 0.9071044921875, 0.95037841796875, 0.99365234375, 1.03692626953125, 1.0802001953125, 1.12347412109375, 1.166748046875, 1.21002197265625, 1.2532958984375, 1.29656982421875, 1.33984375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 2.0, 8.0, 4.0, 6.0, 8.0, 10.0, 8.0, 16.0, 11.0, 17.0, 22.0, 35.0, 21.0, 40.0, 59.0, 68.0, 91.0, 80.0, 94.0, 67.0, 57.0, 48.0, 33.0, 35.0, 23.0, 19.0, 17.0, 15.0, 11.0, 12.0, 11.0, 9.0, 6.0, 3.0, 5.0, 1.0, 5.0, 2.0, 1.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.861328125, -0.8333053588867188, -0.8052825927734375, -0.7772598266601562, -0.749237060546875, -0.7212142944335938, -0.6931915283203125, -0.6651687622070312, -0.63714599609375, -0.6091232299804688, -0.5811004638671875, -0.5530776977539062, -0.525054931640625, -0.49703216552734375, -0.4690093994140625, -0.44098663330078125, -0.4129638671875, -0.38494110107421875, -0.3569183349609375, -0.32889556884765625, -0.300872802734375, -0.27285003662109375, -0.2448272705078125, -0.21680450439453125, -0.18878173828125, -0.16075897216796875, -0.1327362060546875, -0.10471343994140625, -0.076690673828125, -0.04866790771484375, -0.0206451416015625, 0.00737762451171875, 0.035400390625, 0.06342315673828125, 0.0914459228515625, 0.11946868896484375, 0.147491455078125, 0.17551422119140625, 0.2035369873046875, 0.23155975341796875, 0.25958251953125, 0.28760528564453125, 0.3156280517578125, 0.34365081787109375, 0.371673583984375, 0.39969635009765625, 0.4277191162109375, 0.45574188232421875, 0.4837646484375, 0.5117874145507812, 0.5398101806640625, 0.5678329467773438, 0.595855712890625, 0.6238784790039062, 0.6519012451171875, 0.6799240112304688, 0.70794677734375, 0.7359695434570312, 0.7639923095703125, 0.7920150756835938, 0.820037841796875, 0.8480606079101562, 0.8760833740234375, 0.9041061401367188, 0.93212890625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 22.0, 50.0, 77.0, 104.0, 159.0, 188.0, 157.0, 110.0, 66.0, 29.0, 12.0, 13.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.155290603637695, -10.607590675354004, -10.059890747070312, -9.512190818786621, -8.96449089050293, -8.416790008544922, -7.8690900802612305, -7.321390151977539, -6.773690223693848, -6.225990295410156, -5.678290367126465, -5.130589962005615, -4.582890033721924, -4.035190105438232, -3.487489938735962, -2.9397897720336914, -2.39208984375, -1.844389796257019, -1.296689748764038, -0.7489897012710571, -0.20128965377807617, 0.34641027450561523, 0.8941104412078857, 1.4418106079101562, 1.9895105361938477, 2.537210464477539, 3.0849106311798096, 3.63261079788208, 4.1803107261657715, 4.728010654449463, 5.2757110595703125, 5.823410987854004, 6.371112823486328, 6.9188127517700195, 7.466512680053711, 8.014212608337402, 8.561912536621094, 9.109613418579102, 9.657313346862793, 10.205013275146484, 10.752713203430176, 11.300413131713867, 11.848113059997559, 12.39581298828125, 12.943513870239258, 13.491212844848633, 14.03891372680664, 14.586613655090332, 15.134313583374023, 15.682013511657715, 16.229713439941406, 16.777414321899414, 17.32511329650879, 17.872814178466797, 18.420513153076172, 18.96821403503418, 19.515914916992188, 20.063615798950195, 20.61131477355957, 21.159015655517578, 21.706714630126953, 22.25441551208496, 22.802114486694336, 23.349815368652344, 23.89751434326172]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 4.0, 7.0, 9.0, 4.0, 4.0, 9.0, 13.0, 12.0, 15.0, 18.0, 27.0, 23.0, 33.0, 25.0, 31.0, 38.0, 25.0, 23.0, 21.0, 45.0, 36.0, 52.0, 32.0, 36.0, 41.0, 46.0, 34.0, 28.0, 40.0, 41.0, 15.0, 19.0, 31.0, 21.0, 18.0, 20.0, 21.0, 15.0, 15.0, 8.0, 8.0, 9.0, 7.0, 6.0, 4.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0], "bins": [-8.14990234375, -7.908098220825195, -7.666294097900391, -7.424489974975586, -7.182685852050781, -6.940881729125977, -6.699077606201172, -6.457273006439209, -6.215468883514404, -5.9736647605896, -5.731860637664795, -5.49005651473999, -5.2482523918151855, -5.006447792053223, -4.764643669128418, -4.522839546203613, -4.281035423278809, -4.039231300354004, -3.797427177429199, -3.5556230545043945, -3.3138186931610107, -3.072014570236206, -2.8302104473114014, -2.5884060859680176, -2.346602439880371, -2.1047983169555664, -1.8629940748214722, -1.6211899518966675, -1.3793857097625732, -1.1375815868377686, -0.8957774639129639, -0.6539732217788696, -0.4121689796447754, -0.17036481201648712, 0.07143935561180115, 0.3132435083389282, 0.5550476908683777, 0.7968518733978271, 1.0386559963226318, 1.280460238456726, 1.5222643613815308, 1.7640684843063354, 2.0058727264404297, 2.2476768493652344, 2.489480972290039, 2.7312850952148438, 2.9730892181396484, 3.2148935794830322, 3.456697702407837, 3.6985018253326416, 3.9403059482574463, 4.18211030960083, 4.423914432525635, 4.6657185554504395, 4.907522678375244, 5.149326801300049, 5.3911309242248535, 5.632935047149658, 5.874739170074463, 6.116543292999268, 6.358347415924072, 6.600152015686035, 6.84195613861084, 7.0837602615356445, 7.325564384460449]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 4.0, 8.0, 19.0, 14.0, 28.0, 28.0, 71.0, 76.0, 105.0, 158.0, 207.0, 324.0, 468.0, 815.0, 1249.0, 2159.0, 3837.0, 6971.0, 13552.0, 29260.0, 66443.0, 170942.0, 584691.0, 2141406.0, 809548.0, 212986.0, 79823.0, 34362.0, 15840.0, 8041.0, 4178.0, 2426.0, 1507.0, 904.0, 550.0, 382.0, 273.0, 185.0, 121.0, 93.0, 68.0, 33.0, 37.0, 16.0, 19.0, 14.0, 10.0, 10.0, 8.0, 5.0, 8.0, 2.0, 0.0, 3.0, 3.0], "bins": [-1.7138671875, -1.6613006591796875, -1.608734130859375, -1.5561676025390625, -1.50360107421875, -1.4510345458984375, -1.398468017578125, -1.3459014892578125, -1.2933349609375, -1.2407684326171875, -1.188201904296875, -1.1356353759765625, -1.08306884765625, -1.0305023193359375, -0.977935791015625, -0.9253692626953125, -0.872802734375, -0.8202362060546875, -0.767669677734375, -0.7151031494140625, -0.66253662109375, -0.6099700927734375, -0.557403564453125, -0.5048370361328125, -0.4522705078125, -0.3997039794921875, -0.347137451171875, -0.2945709228515625, -0.24200439453125, -0.1894378662109375, -0.136871337890625, -0.0843048095703125, -0.03173828125, 0.0208282470703125, 0.073394775390625, 0.1259613037109375, 0.17852783203125, 0.2310943603515625, 0.283660888671875, 0.3362274169921875, 0.3887939453125, 0.4413604736328125, 0.493927001953125, 0.5464935302734375, 0.59906005859375, 0.6516265869140625, 0.704193115234375, 0.7567596435546875, 0.809326171875, 0.8618927001953125, 0.914459228515625, 0.9670257568359375, 1.01959228515625, 1.0721588134765625, 1.124725341796875, 1.1772918701171875, 1.2298583984375, 1.2824249267578125, 1.334991455078125, 1.3875579833984375, 1.44012451171875, 1.4926910400390625, 1.545257568359375, 1.5978240966796875, 1.650390625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 5.0, 4.0, 8.0, 8.0, 7.0, 10.0, 11.0, 8.0, 21.0, 28.0, 16.0, 22.0, 26.0, 26.0, 27.0, 36.0, 35.0, 25.0, 27.0, 34.0, 49.0, 41.0, 44.0, 28.0, 36.0, 42.0, 36.0, 28.0, 39.0, 36.0, 38.0, 31.0, 28.0, 18.0, 17.0, 19.0, 13.0, 10.0, 12.0, 11.0, 9.0, 9.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.96337890625, -0.9307785034179688, -0.8981781005859375, -0.8655776977539062, -0.832977294921875, -0.8003768920898438, -0.7677764892578125, -0.7351760864257812, -0.70257568359375, -0.6699752807617188, -0.6373748779296875, -0.6047744750976562, -0.572174072265625, -0.5395736694335938, -0.5069732666015625, -0.47437286376953125, -0.4417724609375, -0.40917205810546875, -0.3765716552734375, -0.34397125244140625, -0.311370849609375, -0.27877044677734375, -0.2461700439453125, -0.21356964111328125, -0.18096923828125, -0.14836883544921875, -0.1157684326171875, -0.08316802978515625, -0.050567626953125, -0.01796722412109375, 0.0146331787109375, 0.04723358154296875, 0.079833984375, 0.11243438720703125, 0.1450347900390625, 0.17763519287109375, 0.210235595703125, 0.24283599853515625, 0.2754364013671875, 0.30803680419921875, 0.34063720703125, 0.37323760986328125, 0.4058380126953125, 0.43843841552734375, 0.471038818359375, 0.5036392211914062, 0.5362396240234375, 0.5688400268554688, 0.6014404296875, 0.6340408325195312, 0.6666412353515625, 0.6992416381835938, 0.731842041015625, 0.7644424438476562, 0.7970428466796875, 0.8296432495117188, 0.86224365234375, 0.8948440551757812, 0.9274444580078125, 0.9600448608398438, 0.992645263671875, 1.0252456665039062, 1.0578460693359375, 1.0904464721679688, 1.123046875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 5.0, 7.0, 10.0, 15.0, 20.0, 20.0, 20.0, 42.0, 60.0, 94.0, 120.0, 186.0, 254.0, 399.0, 549.0, 898.0, 1451.0, 2378.0, 4047.0, 7327.0, 13734.0, 27624.0, 59893.0, 137805.0, 379442.0, 1523279.0, 1430243.0, 358225.0, 131596.0, 56807.0, 26993.0, 13147.0, 7227.0, 3998.0, 2354.0, 1380.0, 885.0, 598.0, 372.0, 227.0, 159.0, 106.0, 75.0, 61.0, 43.0, 30.0, 22.0, 22.0, 13.0, 9.0, 9.0, 7.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8154296875, -1.7548675537109375, -1.694305419921875, -1.6337432861328125, -1.57318115234375, -1.5126190185546875, -1.452056884765625, -1.3914947509765625, -1.3309326171875, -1.2703704833984375, -1.209808349609375, -1.1492462158203125, -1.08868408203125, -1.0281219482421875, -0.967559814453125, -0.9069976806640625, -0.846435546875, -0.7858734130859375, -0.725311279296875, -0.6647491455078125, -0.60418701171875, -0.5436248779296875, -0.483062744140625, -0.4225006103515625, -0.3619384765625, -0.3013763427734375, -0.240814208984375, -0.1802520751953125, -0.11968994140625, -0.0591278076171875, 0.001434326171875, 0.0619964599609375, 0.12255859375, 0.1831207275390625, 0.243682861328125, 0.3042449951171875, 0.36480712890625, 0.4253692626953125, 0.485931396484375, 0.5464935302734375, 0.6070556640625, 0.6676177978515625, 0.728179931640625, 0.7887420654296875, 0.84930419921875, 0.9098663330078125, 0.970428466796875, 1.0309906005859375, 1.091552734375, 1.1521148681640625, 1.212677001953125, 1.2732391357421875, 1.33380126953125, 1.3943634033203125, 1.454925537109375, 1.5154876708984375, 1.5760498046875, 1.6366119384765625, 1.697174072265625, 1.7577362060546875, 1.81829833984375, 1.8788604736328125, 1.939422607421875, 1.9999847412109375, 2.060546875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 8.0, 10.0, 10.0, 18.0, 22.0, 33.0, 37.0, 64.0, 89.0, 115.0, 169.0, 273.0, 469.0, 794.0, 750.0, 432.0, 252.0, 136.0, 112.0, 70.0, 63.0, 30.0, 27.0, 23.0, 12.0, 11.0, 10.0, 11.0, 6.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.412109375, -3.31976318359375, -3.2274169921875, -3.13507080078125, -3.042724609375, -2.95037841796875, -2.8580322265625, -2.76568603515625, -2.67333984375, -2.58099365234375, -2.4886474609375, -2.39630126953125, -2.303955078125, -2.21160888671875, -2.1192626953125, -2.02691650390625, -1.9345703125, -1.84222412109375, -1.7498779296875, -1.65753173828125, -1.565185546875, -1.47283935546875, -1.3804931640625, -1.28814697265625, -1.19580078125, -1.10345458984375, -1.0111083984375, -0.91876220703125, -0.826416015625, -0.73406982421875, -0.6417236328125, -0.54937744140625, -0.45703125, -0.36468505859375, -0.2723388671875, -0.17999267578125, -0.087646484375, 0.00469970703125, 0.0970458984375, 0.18939208984375, 0.28173828125, 0.37408447265625, 0.4664306640625, 0.55877685546875, 0.651123046875, 0.74346923828125, 0.8358154296875, 0.92816162109375, 1.0205078125, 1.11285400390625, 1.2052001953125, 1.29754638671875, 1.389892578125, 1.48223876953125, 1.5745849609375, 1.66693115234375, 1.75927734375, 1.85162353515625, 1.9439697265625, 2.03631591796875, 2.128662109375, 2.22100830078125, 2.3133544921875, 2.40570068359375, 2.498046875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 9.0, 8.0, 23.0, 29.0, 43.0, 62.0, 72.0, 103.0, 118.0, 133.0, 114.0, 86.0, 86.0, 42.0, 33.0, 14.0, 13.0, 8.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.085648536682129, -11.623440742492676, -11.161233901977539, -10.699026107788086, -10.236818313598633, -9.77461051940918, -9.312402725219727, -8.85019588470459, -8.387988090515137, -7.925780296325684, -7.463572978973389, -7.001365661621094, -6.539157867431641, -6.0769500732421875, -5.614742755889893, -5.152535438537598, -4.6903276443481445, -4.228119850158691, -3.7659125328063965, -3.3037049770355225, -2.8414974212646484, -2.3792898654937744, -1.9170823097229004, -1.4548747539520264, -0.9926671981811523, -0.5304596424102783, -0.0682520866394043, 0.3939554691314697, 0.8561630249023438, 1.3183705806732178, 1.7805781364440918, 2.242785692214966, 2.7049942016601562, 3.1672017574310303, 3.6294093132019043, 4.091616630554199, 4.553824424743652, 5.0160322189331055, 5.4782395362854, 5.940446853637695, 6.402654647827148, 6.864862442016602, 7.3270697593688965, 7.789277076721191, 8.251484870910645, 8.713692665100098, 9.175899505615234, 9.638107299804688, 10.10031509399414, 10.562522888183594, 11.024730682373047, 11.486937522888184, 11.949145317077637, 12.41135311126709, 12.873559951782227, 13.33576774597168, 13.797975540161133, 14.260183334350586, 14.722391128540039, 15.184597969055176, 15.646805763244629, 16.109012603759766, 16.57122039794922, 17.033428192138672, 17.495635986328125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 4.0, 8.0, 10.0, 13.0, 21.0, 18.0, 14.0, 17.0, 19.0, 18.0, 32.0, 24.0, 27.0, 38.0, 37.0, 38.0, 31.0, 41.0, 42.0, 46.0, 40.0, 44.0, 31.0, 34.0, 43.0, 48.0, 32.0, 21.0, 26.0, 32.0, 19.0, 16.0, 20.0, 17.0, 8.0, 9.0, 14.0, 8.0, 8.0, 6.0, 7.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.253666877746582, -6.0353217124938965, -5.816976070404053, -5.598630905151367, -5.380285739898682, -5.161940097808838, -4.943594932556152, -4.725249290466309, -4.506904125213623, -4.2885589599609375, -4.070213317871094, -3.851868152618408, -3.6335227489471436, -3.415177345275879, -3.1968321800231934, -2.9784867763519287, -2.760141611099243, -2.5417962074279785, -2.323451042175293, -2.1051056385040283, -1.8867602348327637, -1.6684149503707886, -1.4500696659088135, -1.2317242622375488, -1.0133789777755737, -0.7950336337089539, -0.576688289642334, -0.3583430051803589, -0.139997661113739, 0.07834768295288086, 0.29669296741485596, 0.5150383710861206, 0.7333836555480957, 0.9517289996147156, 1.1700743436813354, 1.3884196281433105, 1.6067650318145752, 1.8251103162765503, 2.0434556007385254, 2.26180100440979, 2.4801464080810547, 2.6984918117523193, 2.916836977005005, 3.1351823806762695, 3.353527784347534, 3.571873188018799, 3.7902183532714844, 4.008563995361328, 4.2269086837768555, 4.445253849029541, 4.663599491119385, 4.88194465637207, 5.100289821624756, 5.3186354637146, 5.536980628967285, 5.755326271057129, 5.9736714363098145, 6.1920166015625, 6.410362243652344, 6.628707408905029, 6.847052574157715, 7.065398216247559, 7.283743381500244, 7.50208854675293, 7.720434188842773]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 8.0, 3.0, 8.0, 6.0, 13.0, 12.0, 26.0, 34.0, 65.0, 78.0, 132.0, 212.0, 344.0, 504.0, 758.0, 1140.0, 1739.0, 3072.0, 4867.0, 8071.0, 14162.0, 26618.0, 65866.0, 219273.0, 414479.0, 177058.0, 54725.0, 23362.0, 12514.0, 7462.0, 4340.0, 2755.0, 1738.0, 1126.0, 697.0, 442.0, 303.0, 190.0, 133.0, 85.0, 41.0, 23.0, 29.0, 15.0, 14.0, 9.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7216796875, -1.6668701171875, -1.612060546875, -1.5572509765625, -1.50244140625, -1.4476318359375, -1.392822265625, -1.3380126953125, -1.283203125, -1.2283935546875, -1.173583984375, -1.1187744140625, -1.06396484375, -1.0091552734375, -0.954345703125, -0.8995361328125, -0.8447265625, -0.7899169921875, -0.735107421875, -0.6802978515625, -0.62548828125, -0.5706787109375, -0.515869140625, -0.4610595703125, -0.40625, -0.3514404296875, -0.296630859375, -0.2418212890625, -0.18701171875, -0.1322021484375, -0.077392578125, -0.0225830078125, 0.0322265625, 0.0870361328125, 0.141845703125, 0.1966552734375, 0.25146484375, 0.3062744140625, 0.361083984375, 0.4158935546875, 0.470703125, 0.5255126953125, 0.580322265625, 0.6351318359375, 0.68994140625, 0.7447509765625, 0.799560546875, 0.8543701171875, 0.9091796875, 0.9639892578125, 1.018798828125, 1.0736083984375, 1.12841796875, 1.1832275390625, 1.238037109375, 1.2928466796875, 1.34765625, 1.4024658203125, 1.457275390625, 1.5120849609375, 1.56689453125, 1.6217041015625, 1.676513671875, 1.7313232421875, 1.7861328125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 7.0, 6.0, 2.0, 5.0, 6.0, 7.0, 5.0, 17.0, 19.0, 16.0, 12.0, 18.0, 23.0, 31.0, 24.0, 25.0, 18.0, 35.0, 36.0, 44.0, 37.0, 51.0, 43.0, 48.0, 44.0, 39.0, 42.0, 32.0, 36.0, 30.0, 36.0, 33.0, 20.0, 18.0, 29.0, 10.0, 19.0, 12.0, 10.0, 11.0, 8.0, 7.0, 8.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0498046875, -1.0151214599609375, -0.980438232421875, -0.9457550048828125, -0.91107177734375, -0.8763885498046875, -0.841705322265625, -0.8070220947265625, -0.7723388671875, -0.7376556396484375, -0.702972412109375, -0.6682891845703125, -0.63360595703125, -0.5989227294921875, -0.564239501953125, -0.5295562744140625, -0.494873046875, -0.4601898193359375, -0.425506591796875, -0.3908233642578125, -0.35614013671875, -0.3214569091796875, -0.286773681640625, -0.2520904541015625, -0.2174072265625, -0.1827239990234375, -0.148040771484375, -0.1133575439453125, -0.07867431640625, -0.0439910888671875, -0.009307861328125, 0.0253753662109375, 0.06005859375, 0.0947418212890625, 0.129425048828125, 0.1641082763671875, 0.19879150390625, 0.2334747314453125, 0.268157958984375, 0.3028411865234375, 0.3375244140625, 0.3722076416015625, 0.406890869140625, 0.4415740966796875, 0.47625732421875, 0.5109405517578125, 0.545623779296875, 0.5803070068359375, 0.614990234375, 0.6496734619140625, 0.684356689453125, 0.7190399169921875, 0.75372314453125, 0.7884063720703125, 0.823089599609375, 0.8577728271484375, 0.8924560546875, 0.9271392822265625, 0.961822509765625, 0.9965057373046875, 1.03118896484375, 1.0658721923828125, 1.100555419921875, 1.1352386474609375, 1.169921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 8.0, 3.0, 12.0, 7.0, 15.0, 29.0, 34.0, 45.0, 76.0, 152.0, 286.0, 496.0, 1024.0, 2302.0, 4957.0, 11554.0, 30452.0, 124183.0, 538306.0, 255317.0, 49650.0, 16766.0, 6917.0, 3067.0, 1350.0, 681.0, 378.0, 185.0, 120.0, 55.0, 35.0, 24.0, 18.0, 7.0, 7.0, 2.0, 15.0, 6.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.734375, -2.6507568359375, -2.567138671875, -2.4835205078125, -2.39990234375, -2.3162841796875, -2.232666015625, -2.1490478515625, -2.0654296875, -1.9818115234375, -1.898193359375, -1.8145751953125, -1.73095703125, -1.6473388671875, -1.563720703125, -1.4801025390625, -1.396484375, -1.3128662109375, -1.229248046875, -1.1456298828125, -1.06201171875, -0.9783935546875, -0.894775390625, -0.8111572265625, -0.7275390625, -0.6439208984375, -0.560302734375, -0.4766845703125, -0.39306640625, -0.3094482421875, -0.225830078125, -0.1422119140625, -0.05859375, 0.0250244140625, 0.108642578125, 0.1922607421875, 0.27587890625, 0.3594970703125, 0.443115234375, 0.5267333984375, 0.6103515625, 0.6939697265625, 0.777587890625, 0.8612060546875, 0.94482421875, 1.0284423828125, 1.112060546875, 1.1956787109375, 1.279296875, 1.3629150390625, 1.446533203125, 1.5301513671875, 1.61376953125, 1.6973876953125, 1.781005859375, 1.8646240234375, 1.9482421875, 2.0318603515625, 2.115478515625, 2.1990966796875, 2.28271484375, 2.3663330078125, 2.449951171875, 2.5335693359375, 2.6171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 9.0, 7.0, 10.0, 11.0, 14.0, 17.0, 24.0, 22.0, 23.0, 27.0, 44.0, 44.0, 46.0, 49.0, 48.0, 45.0, 48.0, 50.0, 40.0, 61.0, 48.0, 54.0, 46.0, 41.0, 41.0, 31.0, 21.0, 20.0, 11.0, 20.0, 12.0, 3.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.08203125, -4.95428466796875, -4.8265380859375, -4.69879150390625, -4.571044921875, -4.44329833984375, -4.3155517578125, -4.18780517578125, -4.06005859375, -3.93231201171875, -3.8045654296875, -3.67681884765625, -3.549072265625, -3.42132568359375, -3.2935791015625, -3.16583251953125, -3.0380859375, -2.91033935546875, -2.7825927734375, -2.65484619140625, -2.527099609375, -2.39935302734375, -2.2716064453125, -2.14385986328125, -2.01611328125, -1.88836669921875, -1.7606201171875, -1.63287353515625, -1.505126953125, -1.37738037109375, -1.2496337890625, -1.12188720703125, -0.994140625, -0.86639404296875, -0.7386474609375, -0.61090087890625, -0.483154296875, -0.35540771484375, -0.2276611328125, -0.09991455078125, 0.02783203125, 0.15557861328125, 0.2833251953125, 0.41107177734375, 0.538818359375, 0.66656494140625, 0.7943115234375, 0.92205810546875, 1.0498046875, 1.17755126953125, 1.3052978515625, 1.43304443359375, 1.560791015625, 1.68853759765625, 1.8162841796875, 1.94403076171875, 2.07177734375, 2.19952392578125, 2.3272705078125, 2.45501708984375, 2.582763671875, 2.71051025390625, 2.8382568359375, 2.96600341796875, 3.09375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 8.0, 10.0, 19.0, 17.0, 25.0, 53.0, 78.0, 129.0, 167.0, 328.0, 538.0, 903.0, 1743.0, 3346.0, 6674.0, 14117.0, 32729.0, 94475.0, 322017.0, 381097.0, 118538.0, 39366.0, 16328.0, 7535.0, 3713.0, 2005.0, 1101.0, 569.0, 360.0, 211.0, 129.0, 89.0, 51.0, 32.0, 21.0, 13.0, 9.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.09765625, -1.0672454833984375, -1.036834716796875, -1.0064239501953125, -0.97601318359375, -0.9456024169921875, -0.915191650390625, -0.8847808837890625, -0.8543701171875, -0.8239593505859375, -0.793548583984375, -0.7631378173828125, -0.73272705078125, -0.7023162841796875, -0.671905517578125, -0.6414947509765625, -0.611083984375, -0.5806732177734375, -0.550262451171875, -0.5198516845703125, -0.48944091796875, -0.4590301513671875, -0.428619384765625, -0.3982086181640625, -0.3677978515625, -0.3373870849609375, -0.306976318359375, -0.2765655517578125, -0.24615478515625, -0.2157440185546875, -0.185333251953125, -0.1549224853515625, -0.12451171875, -0.0941009521484375, -0.063690185546875, -0.0332794189453125, -0.00286865234375, 0.0275421142578125, 0.057952880859375, 0.0883636474609375, 0.1187744140625, 0.1491851806640625, 0.179595947265625, 0.2100067138671875, 0.24041748046875, 0.2708282470703125, 0.301239013671875, 0.3316497802734375, 0.362060546875, 0.3924713134765625, 0.422882080078125, 0.4532928466796875, 0.48370361328125, 0.5141143798828125, 0.544525146484375, 0.5749359130859375, 0.6053466796875, 0.6357574462890625, 0.666168212890625, 0.6965789794921875, 0.72698974609375, 0.7574005126953125, 0.787811279296875, 0.8182220458984375, 0.8486328125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 4.0, 2.0, 6.0, 8.0, 10.0, 8.0, 9.0, 22.0, 29.0, 60.0, 76.0, 121.0, 146.0, 143.0, 103.0, 77.0, 44.0, 25.0, 25.0, 16.0, 9.0, 16.0, 5.0, 4.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00018024444580078125, -0.00017329305410385132, -0.0001663416624069214, -0.00015939027070999146, -0.00015243887901306152, -0.0001454874873161316, -0.00013853609561920166, -0.00013158470392227173, -0.0001246333122253418, -0.00011768192052841187, -0.00011073052883148193, -0.000103779137134552, -9.682774543762207e-05, -8.987635374069214e-05, -8.292496204376221e-05, -7.597357034683228e-05, -6.902217864990234e-05, -6.207078695297241e-05, -5.511939525604248e-05, -4.816800355911255e-05, -4.121661186218262e-05, -3.4265220165252686e-05, -2.7313828468322754e-05, -2.0362436771392822e-05, -1.341104507446289e-05, -6.459653377532959e-06, 4.917383193969727e-07, 7.443130016326904e-06, 1.4394521713256836e-05, 2.1345913410186768e-05, 2.82973051071167e-05, 3.524869680404663e-05, 4.220008850097656e-05, 4.9151480197906494e-05, 5.6102871894836426e-05, 6.305426359176636e-05, 7.000565528869629e-05, 7.695704698562622e-05, 8.390843868255615e-05, 9.085983037948608e-05, 9.781122207641602e-05, 0.00010476261377334595, 0.00011171400547027588, 0.00011866539716720581, 0.00012561678886413574, 0.00013256818056106567, 0.0001395195722579956, 0.00014647096395492554, 0.00015342235565185547, 0.0001603737473487854, 0.00016732513904571533, 0.00017427653074264526, 0.0001812279224395752, 0.00018817931413650513, 0.00019513070583343506, 0.000202082097530365, 0.00020903348922729492, 0.00021598488092422485, 0.00022293627262115479, 0.00022988766431808472, 0.00023683905601501465, 0.00024379044771194458, 0.0002507418394088745, 0.00025769323110580444, 0.0002646446228027344]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 9.0, 11.0, 18.0, 11.0, 27.0, 42.0, 70.0, 95.0, 135.0, 219.0, 340.0, 545.0, 937.0, 1668.0, 3143.0, 6101.0, 13539.0, 33325.0, 92726.0, 270881.0, 373244.0, 158131.0, 53955.0, 20801.0, 8979.0, 4159.0, 2180.0, 1275.0, 735.0, 425.0, 328.0, 166.0, 110.0, 65.0, 48.0, 31.0, 18.0, 21.0, 14.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.93408203125, -0.9059829711914062, -0.8778839111328125, -0.8497848510742188, -0.821685791015625, -0.7935867309570312, -0.7654876708984375, -0.7373886108398438, -0.70928955078125, -0.6811904907226562, -0.6530914306640625, -0.6249923706054688, -0.596893310546875, -0.5687942504882812, -0.5406951904296875, -0.5125961303710938, -0.4844970703125, -0.45639801025390625, -0.4282989501953125, -0.40019989013671875, -0.372100830078125, -0.34400177001953125, -0.3159027099609375, -0.28780364990234375, -0.25970458984375, -0.23160552978515625, -0.2035064697265625, -0.17540740966796875, -0.147308349609375, -0.11920928955078125, -0.0911102294921875, -0.06301116943359375, -0.034912109375, -0.00681304931640625, 0.0212860107421875, 0.04938507080078125, 0.077484130859375, 0.10558319091796875, 0.1336822509765625, 0.16178131103515625, 0.18988037109375, 0.21797943115234375, 0.2460784912109375, 0.27417755126953125, 0.302276611328125, 0.33037567138671875, 0.3584747314453125, 0.38657379150390625, 0.4146728515625, 0.44277191162109375, 0.4708709716796875, 0.49897003173828125, 0.527069091796875, 0.5551681518554688, 0.5832672119140625, 0.6113662719726562, 0.63946533203125, 0.6675643920898438, 0.6956634521484375, 0.7237625122070312, 0.751861572265625, 0.7799606323242188, 0.8080596923828125, 0.8361587524414062, 0.8642578125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 5.0, 7.0, 3.0, 10.0, 14.0, 11.0, 17.0, 19.0, 24.0, 20.0, 39.0, 51.0, 59.0, 67.0, 88.0, 94.0, 85.0, 83.0, 74.0, 50.0, 38.0, 31.0, 28.0, 15.0, 18.0, 14.0, 7.0, 7.0, 6.0, 7.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.95947265625, -0.9279556274414062, -0.8964385986328125, -0.8649215698242188, -0.833404541015625, -0.8018875122070312, -0.7703704833984375, -0.7388534545898438, -0.70733642578125, -0.6758193969726562, -0.6443023681640625, -0.6127853393554688, -0.581268310546875, -0.5497512817382812, -0.5182342529296875, -0.48671722412109375, -0.4552001953125, -0.42368316650390625, -0.3921661376953125, -0.36064910888671875, -0.329132080078125, -0.29761505126953125, -0.2660980224609375, -0.23458099365234375, -0.20306396484375, -0.17154693603515625, -0.1400299072265625, -0.10851287841796875, -0.076995849609375, -0.04547882080078125, -0.0139617919921875, 0.01755523681640625, 0.049072265625, 0.08058929443359375, 0.1121063232421875, 0.14362335205078125, 0.175140380859375, 0.20665740966796875, 0.2381744384765625, 0.26969146728515625, 0.30120849609375, 0.33272552490234375, 0.3642425537109375, 0.39575958251953125, 0.427276611328125, 0.45879364013671875, 0.4903106689453125, 0.5218276977539062, 0.5533447265625, 0.5848617553710938, 0.6163787841796875, 0.6478958129882812, 0.679412841796875, 0.7109298706054688, 0.7424468994140625, 0.7739639282226562, 0.80548095703125, 0.8369979858398438, 0.8685150146484375, 0.9000320434570312, 0.931549072265625, 0.9630661010742188, 0.9945831298828125, 1.0261001586914062, 1.0576171875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 11.0, 16.0, 36.0, 47.0, 71.0, 120.0, 137.0, 166.0, 136.0, 104.0, 56.0, 51.0, 17.0, 12.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1879072189331055, -5.776994705200195, -5.366082191467285, -4.955169677734375, -4.544257164001465, -4.133344650268555, -3.7224326133728027, -3.3115200996398926, -2.9006075859069824, -2.4896950721740723, -2.078782558441162, -1.667870283126831, -1.256957769393921, -0.8460452556610107, -0.4351329803466797, -0.02422046661376953, 0.3866920471191406, 0.797604501247406, 1.2085169553756714, 1.619429349899292, 2.030341863632202, 2.4412543773651123, 2.8521666526794434, 3.2630791664123535, 3.6739916801452637, 4.084904193878174, 4.495816707611084, 4.906728744506836, 5.317641258239746, 5.728553771972656, 6.139466285705566, 6.550378799438477, 6.96129035949707, 7.3722028732299805, 7.783115386962891, 8.1940279006958, 8.604940414428711, 9.015852928161621, 9.426765441894531, 9.837677001953125, 10.248590469360352, 10.659502983093262, 11.070415496826172, 11.481328010559082, 11.892240524291992, 12.303153038024902, 12.714065551757812, 13.124977111816406, 13.535889625549316, 13.946802139282227, 14.357714653015137, 14.768627166748047, 15.179539680480957, 15.590452194213867, 16.00136375427246, 16.412277221679688, 16.82318878173828, 17.234100341796875, 17.6450138092041, 18.055925369262695, 18.466838836669922, 18.877750396728516, 19.288663864135742, 19.699575424194336, 20.110488891601562]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 7.0, 7.0, 5.0, 14.0, 12.0, 12.0, 14.0, 17.0, 24.0, 21.0, 36.0, 45.0, 42.0, 49.0, 55.0, 48.0, 54.0, 45.0, 45.0, 46.0, 40.0, 45.0, 44.0, 39.0, 32.0, 30.0, 21.0, 24.0, 17.0, 15.0, 23.0, 15.0, 10.0, 8.0, 7.0, 5.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.889074325561523, -8.599440574645996, -8.309805870056152, -8.020172119140625, -7.730538368225098, -7.440904140472412, -7.151269912719727, -6.861636161804199, -6.572001934051514, -6.282367706298828, -5.992733955383301, -5.703099727630615, -5.41346549987793, -5.123831748962402, -4.834197521209717, -4.544563293457031, -4.254929542541504, -3.9652955532073975, -3.675661563873291, -3.3860273361206055, -3.096393346786499, -2.8067593574523926, -2.517125129699707, -2.2274911403656006, -1.9378571510314941, -1.6482231616973877, -1.3585890531539917, -1.0689549446105957, -0.7793209552764893, -0.4896869659423828, -0.20005285739898682, 0.08958125114440918, 0.37921619415283203, 0.6688502430915833, 0.9584842920303345, 1.2481184005737305, 1.537752389907837, 1.8273863792419434, 2.117020606994629, 2.4066545963287354, 2.696288585662842, 2.9859225749969482, 3.2755565643310547, 3.5651907920837402, 3.8548247814178467, 4.144458770751953, 4.434092998504639, 4.723727226257324, 5.013360977172852, 5.302995204925537, 5.5926289558410645, 5.88226318359375, 6.171896934509277, 6.461531162261963, 6.751165390014648, 7.040799140930176, 7.330433368682861, 7.620067596435547, 7.909701347351074, 8.199335098266602, 8.488969802856445, 8.778603553771973, 9.0682373046875, 9.357872009277344, 9.647505760192871]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 6.0, 9.0, 8.0, 14.0, 21.0, 36.0, 50.0, 66.0, 107.0, 164.0, 241.0, 402.0, 623.0, 1158.0, 2139.0, 4264.0, 9622.0, 21767.0, 55329.0, 159175.0, 585754.0, 2069736.0, 928785.0, 228793.0, 75124.0, 28373.0, 11633.0, 5141.0, 2511.0, 1265.0, 741.0, 445.0, 265.0, 169.0, 108.0, 84.0, 41.0, 36.0, 19.0, 18.0, 12.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.9833984375, -1.9207305908203125, -1.858062744140625, -1.7953948974609375, -1.73272705078125, -1.6700592041015625, -1.607391357421875, -1.5447235107421875, -1.4820556640625, -1.4193878173828125, -1.356719970703125, -1.2940521240234375, -1.23138427734375, -1.1687164306640625, -1.106048583984375, -1.0433807373046875, -0.980712890625, -0.9180450439453125, -0.855377197265625, -0.7927093505859375, -0.73004150390625, -0.6673736572265625, -0.604705810546875, -0.5420379638671875, -0.4793701171875, -0.4167022705078125, -0.354034423828125, -0.2913665771484375, -0.22869873046875, -0.1660308837890625, -0.103363037109375, -0.0406951904296875, 0.02197265625, 0.0846405029296875, 0.147308349609375, 0.2099761962890625, 0.27264404296875, 0.3353118896484375, 0.397979736328125, 0.4606475830078125, 0.5233154296875, 0.5859832763671875, 0.648651123046875, 0.7113189697265625, 0.77398681640625, 0.8366546630859375, 0.899322509765625, 0.9619903564453125, 1.024658203125, 1.0873260498046875, 1.149993896484375, 1.2126617431640625, 1.27532958984375, 1.3379974365234375, 1.400665283203125, 1.4633331298828125, 1.5260009765625, 1.5886688232421875, 1.651336669921875, 1.7140045166015625, 1.77667236328125, 1.8393402099609375, 1.902008056640625, 1.9646759033203125, 2.02734375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 9.0, 11.0, 14.0, 17.0, 14.0, 13.0, 17.0, 23.0, 22.0, 29.0, 31.0, 26.0, 31.0, 32.0, 33.0, 43.0, 26.0, 43.0, 37.0, 43.0, 43.0, 55.0, 37.0, 41.0, 37.0, 31.0, 31.0, 24.0, 21.0, 24.0, 22.0, 26.0, 20.0, 12.0, 9.0, 8.0, 4.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0771484375, -1.04339599609375, -1.0096435546875, -0.97589111328125, -0.942138671875, -0.90838623046875, -0.8746337890625, -0.84088134765625, -0.80712890625, -0.77337646484375, -0.7396240234375, -0.70587158203125, -0.672119140625, -0.63836669921875, -0.6046142578125, -0.57086181640625, -0.537109375, -0.50335693359375, -0.4696044921875, -0.43585205078125, -0.402099609375, -0.36834716796875, -0.3345947265625, -0.30084228515625, -0.26708984375, -0.23333740234375, -0.1995849609375, -0.16583251953125, -0.132080078125, -0.09832763671875, -0.0645751953125, -0.03082275390625, 0.0029296875, 0.03668212890625, 0.0704345703125, 0.10418701171875, 0.137939453125, 0.17169189453125, 0.2054443359375, 0.23919677734375, 0.27294921875, 0.30670166015625, 0.3404541015625, 0.37420654296875, 0.407958984375, 0.44171142578125, 0.4754638671875, 0.50921630859375, 0.54296875, 0.57672119140625, 0.6104736328125, 0.64422607421875, 0.677978515625, 0.71173095703125, 0.7454833984375, 0.77923583984375, 0.81298828125, 0.84674072265625, 0.8804931640625, 0.91424560546875, 0.947998046875, 0.98175048828125, 1.0155029296875, 1.04925537109375, 1.0830078125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 13.0, 17.0, 5.0, 19.0, 23.0, 34.0, 47.0, 60.0, 93.0, 143.0, 210.0, 306.0, 552.0, 892.0, 1606.0, 2990.0, 5941.0, 12294.0, 26646.0, 62224.0, 155677.0, 458474.0, 1787036.0, 1171222.0, 307526.0, 112748.0, 46653.0, 20806.0, 9456.0, 4713.0, 2509.0, 1289.0, 743.0, 448.0, 289.0, 182.0, 139.0, 81.0, 56.0, 28.0, 29.0, 13.0, 12.0, 13.0, 10.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2.005859375, -1.94476318359375, -1.8836669921875, -1.82257080078125, -1.761474609375, -1.70037841796875, -1.6392822265625, -1.57818603515625, -1.51708984375, -1.45599365234375, -1.3948974609375, -1.33380126953125, -1.272705078125, -1.21160888671875, -1.1505126953125, -1.08941650390625, -1.0283203125, -0.96722412109375, -0.9061279296875, -0.84503173828125, -0.783935546875, -0.72283935546875, -0.6617431640625, -0.60064697265625, -0.53955078125, -0.47845458984375, -0.4173583984375, -0.35626220703125, -0.295166015625, -0.23406982421875, -0.1729736328125, -0.11187744140625, -0.05078125, 0.01031494140625, 0.0714111328125, 0.13250732421875, 0.193603515625, 0.25469970703125, 0.3157958984375, 0.37689208984375, 0.43798828125, 0.49908447265625, 0.5601806640625, 0.62127685546875, 0.682373046875, 0.74346923828125, 0.8045654296875, 0.86566162109375, 0.9267578125, 0.98785400390625, 1.0489501953125, 1.11004638671875, 1.171142578125, 1.23223876953125, 1.2933349609375, 1.35443115234375, 1.41552734375, 1.47662353515625, 1.5377197265625, 1.59881591796875, 1.659912109375, 1.72100830078125, 1.7821044921875, 1.84320068359375, 1.904296875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 2.0, 9.0, 8.0, 8.0, 15.0, 25.0, 28.0, 29.0, 41.0, 59.0, 72.0, 116.0, 141.0, 208.0, 281.0, 501.0, 659.0, 603.0, 381.0, 233.0, 175.0, 123.0, 83.0, 71.0, 44.0, 40.0, 38.0, 18.0, 16.0, 11.0, 8.0, 11.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.951171875, -2.866485595703125, -2.78179931640625, -2.697113037109375, -2.6124267578125, -2.527740478515625, -2.44305419921875, -2.358367919921875, -2.273681640625, -2.188995361328125, -2.10430908203125, -2.019622802734375, -1.9349365234375, -1.850250244140625, -1.76556396484375, -1.680877685546875, -1.59619140625, -1.511505126953125, -1.42681884765625, -1.342132568359375, -1.2574462890625, -1.172760009765625, -1.08807373046875, -1.003387451171875, -0.918701171875, -0.834014892578125, -0.74932861328125, -0.664642333984375, -0.5799560546875, -0.495269775390625, -0.41058349609375, -0.325897216796875, -0.2412109375, -0.156524658203125, -0.07183837890625, 0.012847900390625, 0.0975341796875, 0.182220458984375, 0.26690673828125, 0.351593017578125, 0.436279296875, 0.520965576171875, 0.60565185546875, 0.690338134765625, 0.7750244140625, 0.859710693359375, 0.94439697265625, 1.029083251953125, 1.11376953125, 1.198455810546875, 1.28314208984375, 1.367828369140625, 1.4525146484375, 1.537200927734375, 1.62188720703125, 1.706573486328125, 1.791259765625, 1.875946044921875, 1.96063232421875, 2.045318603515625, 2.1300048828125, 2.214691162109375, 2.29937744140625, 2.384063720703125, 2.46875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 14.0, 12.0, 22.0, 41.0, 64.0, 99.0, 124.0, 137.0, 140.0, 98.0, 93.0, 63.0, 35.0, 28.0, 14.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.199920654296875, -16.66350555419922, -16.12708854675293, -15.590673446655273, -15.0542573928833, -14.517841339111328, -13.981426239013672, -13.4450101852417, -12.908594131469727, -12.372178077697754, -11.835762023925781, -11.299346923828125, -10.762930870056152, -10.22651481628418, -9.690099716186523, -9.15368366241455, -8.617267608642578, -8.080851554870605, -7.544435977935791, -7.008020401000977, -6.471604347229004, -5.935188293457031, -5.398772716522217, -4.862357139587402, -4.32594108581543, -3.789525270462036, -3.2531094551086426, -2.716693639755249, -2.1802778244018555, -1.643862009048462, -1.1074461936950684, -0.5710303783416748, -0.03461647033691406, 0.5017993450164795, 1.038215160369873, 1.5746309757232666, 2.11104679107666, 2.6474626064300537, 3.1838784217834473, 3.720294237136841, 4.256710052490234, 4.793126106262207, 5.3295416831970215, 5.865957260131836, 6.402373313903809, 6.938789367675781, 7.475204944610596, 8.01162052154541, 8.548036575317383, 9.084452629089355, 9.620868682861328, 10.157283782958984, 10.693699836730957, 11.23011589050293, 11.766530990600586, 12.302947044372559, 12.839363098144531, 13.375779151916504, 13.912195205688477, 14.448610305786133, 14.985026359558105, 15.521442413330078, 16.057857513427734, 16.594274520874023, 17.13068962097168]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 10.0, 10.0, 14.0, 17.0, 18.0, 18.0, 31.0, 24.0, 29.0, 38.0, 52.0, 27.0, 39.0, 44.0, 43.0, 39.0, 48.0, 59.0, 45.0, 42.0, 36.0, 41.0, 27.0, 35.0, 29.0, 27.0, 25.0, 23.0, 19.0, 18.0, 16.0, 17.0, 10.0, 8.0, 2.0, 4.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.609548568725586, -8.327886581420898, -8.046224594116211, -7.76456356048584, -7.482901573181152, -7.201239585876465, -6.9195780754089355, -6.637916564941406, -6.356254577636719, -6.074592590332031, -5.792931079864502, -5.511269569396973, -5.229607582092285, -4.947945594787598, -4.666284084320068, -4.384622573852539, -4.102960586547852, -3.821298837661743, -3.5396370887756348, -3.2579753398895264, -2.976313591003418, -2.6946518421173096, -2.412990093231201, -2.1313283443450928, -1.8496665954589844, -1.568004846572876, -1.2863430976867676, -1.0046813488006592, -0.7230195999145508, -0.4413578510284424, -0.15969610214233398, 0.12196564674377441, 0.4036273956298828, 0.6852891445159912, 0.9669508934020996, 1.248612642288208, 1.5302743911743164, 1.8119361400604248, 2.093597888946533, 2.3752596378326416, 2.65692138671875, 2.9385831356048584, 3.220244884490967, 3.501906633377075, 3.7835683822631836, 4.065230369567871, 4.3468918800354, 4.62855339050293, 4.910215377807617, 5.191877365112305, 5.473538875579834, 5.755200386047363, 6.036862373352051, 6.318524360656738, 6.600185871124268, 6.881847381591797, 7.163509368896484, 7.445171356201172, 7.726832866668701, 8.00849437713623, 8.290156364440918, 8.571818351745605, 8.853479385375977, 9.135141372680664, 9.416803359985352]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 9.0, 10.0, 18.0, 18.0, 31.0, 46.0, 58.0, 108.0, 149.0, 213.0, 363.0, 564.0, 899.0, 1508.0, 2317.0, 3545.0, 5747.0, 9344.0, 16252.0, 33011.0, 103336.0, 473787.0, 280320.0, 59282.0, 24088.0, 12915.0, 7778.0, 4690.0, 2957.0, 1936.0, 1189.0, 751.0, 457.0, 309.0, 178.0, 123.0, 93.0, 50.0, 34.0, 22.0, 17.0, 7.0, 11.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.8125, -2.729278564453125, -2.64605712890625, -2.562835693359375, -2.4796142578125, -2.396392822265625, -2.31317138671875, -2.229949951171875, -2.146728515625, -2.063507080078125, -1.98028564453125, -1.897064208984375, -1.8138427734375, -1.730621337890625, -1.64739990234375, -1.564178466796875, -1.48095703125, -1.397735595703125, -1.31451416015625, -1.231292724609375, -1.1480712890625, -1.064849853515625, -0.98162841796875, -0.898406982421875, -0.815185546875, -0.731964111328125, -0.64874267578125, -0.565521240234375, -0.4822998046875, -0.399078369140625, -0.31585693359375, -0.232635498046875, -0.1494140625, -0.066192626953125, 0.01702880859375, 0.100250244140625, 0.1834716796875, 0.266693115234375, 0.34991455078125, 0.433135986328125, 0.516357421875, 0.599578857421875, 0.68280029296875, 0.766021728515625, 0.8492431640625, 0.932464599609375, 1.01568603515625, 1.098907470703125, 1.18212890625, 1.265350341796875, 1.34857177734375, 1.431793212890625, 1.5150146484375, 1.598236083984375, 1.68145751953125, 1.764678955078125, 1.847900390625, 1.931121826171875, 2.01434326171875, 2.097564697265625, 2.1807861328125, 2.264007568359375, 2.34722900390625, 2.430450439453125, 2.513671875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 3.0, 6.0, 7.0, 11.0, 8.0, 7.0, 11.0, 16.0, 23.0, 26.0, 17.0, 28.0, 31.0, 38.0, 34.0, 28.0, 36.0, 43.0, 52.0, 34.0, 44.0, 41.0, 38.0, 42.0, 42.0, 49.0, 44.0, 42.0, 20.0, 21.0, 21.0, 21.0, 16.0, 28.0, 14.0, 13.0, 10.0, 6.0, 9.0, 3.0, 4.0, 2.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2236328125, -1.18499755859375, -1.1463623046875, -1.10772705078125, -1.069091796875, -1.03045654296875, -0.9918212890625, -0.95318603515625, -0.91455078125, -0.87591552734375, -0.8372802734375, -0.79864501953125, -0.760009765625, -0.72137451171875, -0.6827392578125, -0.64410400390625, -0.60546875, -0.56683349609375, -0.5281982421875, -0.48956298828125, -0.450927734375, -0.41229248046875, -0.3736572265625, -0.33502197265625, -0.29638671875, -0.25775146484375, -0.2191162109375, -0.18048095703125, -0.141845703125, -0.10321044921875, -0.0645751953125, -0.02593994140625, 0.0126953125, 0.05133056640625, 0.0899658203125, 0.12860107421875, 0.167236328125, 0.20587158203125, 0.2445068359375, 0.28314208984375, 0.32177734375, 0.36041259765625, 0.3990478515625, 0.43768310546875, 0.476318359375, 0.51495361328125, 0.5535888671875, 0.59222412109375, 0.630859375, 0.66949462890625, 0.7081298828125, 0.74676513671875, 0.785400390625, 0.82403564453125, 0.8626708984375, 0.90130615234375, 0.93994140625, 0.97857666015625, 1.0172119140625, 1.05584716796875, 1.094482421875, 1.13311767578125, 1.1717529296875, 1.21038818359375, 1.2490234375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 6.0, 11.0, 14.0, 13.0, 26.0, 27.0, 37.0, 45.0, 83.0, 96.0, 142.0, 223.0, 411.0, 698.0, 1370.0, 2882.0, 6520.0, 14407.0, 32637.0, 108010.0, 584467.0, 214546.0, 46308.0, 18889.0, 8671.0, 4023.0, 1756.0, 924.0, 486.0, 267.0, 180.0, 120.0, 71.0, 50.0, 39.0, 32.0, 18.0, 15.0, 11.0, 6.0, 2.0, 6.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.2734375, -3.17010498046875, -3.0667724609375, -2.96343994140625, -2.860107421875, -2.75677490234375, -2.6534423828125, -2.55010986328125, -2.44677734375, -2.34344482421875, -2.2401123046875, -2.13677978515625, -2.033447265625, -1.93011474609375, -1.8267822265625, -1.72344970703125, -1.6201171875, -1.51678466796875, -1.4134521484375, -1.31011962890625, -1.206787109375, -1.10345458984375, -1.0001220703125, -0.89678955078125, -0.79345703125, -0.69012451171875, -0.5867919921875, -0.48345947265625, -0.380126953125, -0.27679443359375, -0.1734619140625, -0.07012939453125, 0.033203125, 0.13653564453125, 0.2398681640625, 0.34320068359375, 0.446533203125, 0.54986572265625, 0.6531982421875, 0.75653076171875, 0.85986328125, 0.96319580078125, 1.0665283203125, 1.16986083984375, 1.273193359375, 1.37652587890625, 1.4798583984375, 1.58319091796875, 1.6865234375, 1.78985595703125, 1.8931884765625, 1.99652099609375, 2.099853515625, 2.20318603515625, 2.3065185546875, 2.40985107421875, 2.51318359375, 2.61651611328125, 2.7198486328125, 2.82318115234375, 2.926513671875, 3.02984619140625, 3.1331787109375, 3.23651123046875, 3.33984375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 2.0, 8.0, 6.0, 10.0, 11.0, 12.0, 12.0, 18.0, 25.0, 16.0, 23.0, 34.0, 41.0, 40.0, 45.0, 50.0, 42.0, 40.0, 48.0, 53.0, 41.0, 44.0, 42.0, 47.0, 47.0, 33.0, 31.0, 40.0, 29.0, 20.0, 13.0, 23.0, 12.0, 13.0, 12.0, 6.0, 2.0, 5.0, 1.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.36328125, -4.24017333984375, -4.1170654296875, -3.99395751953125, -3.870849609375, -3.74774169921875, -3.6246337890625, -3.50152587890625, -3.37841796875, -3.25531005859375, -3.1322021484375, -3.00909423828125, -2.885986328125, -2.76287841796875, -2.6397705078125, -2.51666259765625, -2.3935546875, -2.27044677734375, -2.1473388671875, -2.02423095703125, -1.901123046875, -1.77801513671875, -1.6549072265625, -1.53179931640625, -1.40869140625, -1.28558349609375, -1.1624755859375, -1.03936767578125, -0.916259765625, -0.79315185546875, -0.6700439453125, -0.54693603515625, -0.423828125, -0.30072021484375, -0.1776123046875, -0.05450439453125, 0.068603515625, 0.19171142578125, 0.3148193359375, 0.43792724609375, 0.56103515625, 0.68414306640625, 0.8072509765625, 0.93035888671875, 1.053466796875, 1.17657470703125, 1.2996826171875, 1.42279052734375, 1.5458984375, 1.66900634765625, 1.7921142578125, 1.91522216796875, 2.038330078125, 2.16143798828125, 2.2845458984375, 2.40765380859375, 2.53076171875, 2.65386962890625, 2.7769775390625, 2.90008544921875, 3.023193359375, 3.14630126953125, 3.2694091796875, 3.39251708984375, 3.515625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 7.0, 14.0, 28.0, 40.0, 69.0, 119.0, 218.0, 381.0, 783.0, 1720.0, 4107.0, 10472.0, 29979.0, 159845.0, 693798.0, 107167.0, 24434.0, 8920.0, 3539.0, 1398.0, 716.0, 351.0, 193.0, 111.0, 63.0, 32.0, 18.0, 20.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.720703125, -1.66412353515625, -1.6075439453125, -1.55096435546875, -1.494384765625, -1.43780517578125, -1.3812255859375, -1.32464599609375, -1.26806640625, -1.21148681640625, -1.1549072265625, -1.09832763671875, -1.041748046875, -0.98516845703125, -0.9285888671875, -0.87200927734375, -0.8154296875, -0.75885009765625, -0.7022705078125, -0.64569091796875, -0.589111328125, -0.53253173828125, -0.4759521484375, -0.41937255859375, -0.36279296875, -0.30621337890625, -0.2496337890625, -0.19305419921875, -0.136474609375, -0.07989501953125, -0.0233154296875, 0.03326416015625, 0.08984375, 0.14642333984375, 0.2030029296875, 0.25958251953125, 0.316162109375, 0.37274169921875, 0.4293212890625, 0.48590087890625, 0.54248046875, 0.59906005859375, 0.6556396484375, 0.71221923828125, 0.768798828125, 0.82537841796875, 0.8819580078125, 0.93853759765625, 0.9951171875, 1.05169677734375, 1.1082763671875, 1.16485595703125, 1.221435546875, 1.27801513671875, 1.3345947265625, 1.39117431640625, 1.44775390625, 1.50433349609375, 1.5609130859375, 1.61749267578125, 1.674072265625, 1.73065185546875, 1.7872314453125, 1.84381103515625, 1.900390625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 8.0, 12.0, 9.0, 9.0, 14.0, 13.0, 29.0, 58.0, 181.0, 321.0, 163.0, 55.0, 30.0, 19.0, 13.0, 11.0, 9.0, 6.0, 5.0, 3.0, 8.0, 4.0, 7.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00039839744567871094, -0.0003828220069408417, -0.0003672465682029724, -0.00035167112946510315, -0.0003360956907272339, -0.0003205202519893646, -0.00030494481325149536, -0.0002893693745136261, -0.00027379393577575684, -0.0002582184970378876, -0.0002426430583000183, -0.00022706761956214905, -0.00021149218082427979, -0.00019591674208641052, -0.00018034130334854126, -0.000164765864610672, -0.00014919042587280273, -0.00013361498713493347, -0.00011803954839706421, -0.00010246410965919495, -8.688867092132568e-05, -7.131323218345642e-05, -5.573779344558716e-05, -4.0162354707717896e-05, -2.4586915969848633e-05, -9.01147723197937e-06, 6.563961505889893e-06, 2.2139400243759155e-05, 3.771483898162842e-05, 5.329027771949768e-05, 6.886571645736694e-05, 8.44411551952362e-05, 0.00010001659393310547, 0.00011559203267097473, 0.000131167471408844, 0.00014674291014671326, 0.00016231834888458252, 0.00017789378762245178, 0.00019346922636032104, 0.0002090446650981903, 0.00022462010383605957, 0.00024019554257392883, 0.0002557709813117981, 0.00027134642004966736, 0.0002869218587875366, 0.0003024972975254059, 0.00031807273626327515, 0.0003336481750011444, 0.00034922361373901367, 0.00036479905247688293, 0.0003803744912147522, 0.00039594992995262146, 0.0004115253686904907, 0.00042710080742836, 0.00044267624616622925, 0.0004582516849040985, 0.0004738271236419678, 0.000489402562379837, 0.0005049780011177063, 0.0005205534398555756, 0.0005361288785934448, 0.0005517043173313141, 0.0005672797560691833, 0.0005828551948070526, 0.0005984306335449219]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 5.0, 4.0, 6.0, 2.0, 11.0, 17.0, 18.0, 23.0, 33.0, 39.0, 75.0, 119.0, 163.0, 268.0, 408.0, 682.0, 1185.0, 2381.0, 4804.0, 10748.0, 27445.0, 97691.0, 407925.0, 367324.0, 83078.0, 24506.0, 9894.0, 4450.0, 2279.0, 1163.0, 680.0, 376.0, 259.0, 159.0, 92.0, 72.0, 43.0, 42.0, 26.0, 12.0, 15.0, 8.0, 7.0, 6.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-1.2158203125, -1.1810302734375, -1.146240234375, -1.1114501953125, -1.07666015625, -1.0418701171875, -1.007080078125, -0.9722900390625, -0.9375, -0.9027099609375, -0.867919921875, -0.8331298828125, -0.79833984375, -0.7635498046875, -0.728759765625, -0.6939697265625, -0.6591796875, -0.6243896484375, -0.589599609375, -0.5548095703125, -0.52001953125, -0.4852294921875, -0.450439453125, -0.4156494140625, -0.380859375, -0.3460693359375, -0.311279296875, -0.2764892578125, -0.24169921875, -0.2069091796875, -0.172119140625, -0.1373291015625, -0.1025390625, -0.0677490234375, -0.032958984375, 0.0018310546875, 0.03662109375, 0.0714111328125, 0.106201171875, 0.1409912109375, 0.17578125, 0.2105712890625, 0.245361328125, 0.2801513671875, 0.31494140625, 0.3497314453125, 0.384521484375, 0.4193115234375, 0.4541015625, 0.4888916015625, 0.523681640625, 0.5584716796875, 0.59326171875, 0.6280517578125, 0.662841796875, 0.6976318359375, 0.732421875, 0.7672119140625, 0.802001953125, 0.8367919921875, 0.87158203125, 0.9063720703125, 0.941162109375, 0.9759521484375, 1.0107421875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 3.0, 3.0, 7.0, 3.0, 10.0, 15.0, 15.0, 24.0, 39.0, 48.0, 64.0, 67.0, 87.0, 94.0, 93.0, 90.0, 93.0, 58.0, 49.0, 30.0, 24.0, 23.0, 18.0, 4.0, 3.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.171875, -1.136505126953125, -1.10113525390625, -1.065765380859375, -1.0303955078125, -0.995025634765625, -0.95965576171875, -0.924285888671875, -0.888916015625, -0.853546142578125, -0.81817626953125, -0.782806396484375, -0.7474365234375, -0.712066650390625, -0.67669677734375, -0.641326904296875, -0.60595703125, -0.570587158203125, -0.53521728515625, -0.499847412109375, -0.4644775390625, -0.429107666015625, -0.39373779296875, -0.358367919921875, -0.322998046875, -0.287628173828125, -0.25225830078125, -0.216888427734375, -0.1815185546875, -0.146148681640625, -0.11077880859375, -0.075408935546875, -0.0400390625, -0.004669189453125, 0.03070068359375, 0.066070556640625, 0.1014404296875, 0.136810302734375, 0.17218017578125, 0.207550048828125, 0.242919921875, 0.278289794921875, 0.31365966796875, 0.349029541015625, 0.3843994140625, 0.419769287109375, 0.45513916015625, 0.490509033203125, 0.52587890625, 0.561248779296875, 0.59661865234375, 0.631988525390625, 0.6673583984375, 0.702728271484375, 0.73809814453125, 0.773468017578125, 0.808837890625, 0.844207763671875, 0.87957763671875, 0.914947509765625, 0.9503173828125, 0.985687255859375, 1.02105712890625, 1.056427001953125, 1.091796875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 31.0, 69.0, 151.0, 216.0, 237.0, 165.0, 72.0, 31.0, 11.0, 0.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.045879364013672, -29.211015701293945, -28.37615394592285, -27.541290283203125, -26.70642852783203, -25.871564865112305, -25.036701202392578, -24.201839447021484, -23.36697769165039, -22.532114028930664, -21.69725227355957, -20.862388610839844, -20.02752685546875, -19.192663192749023, -18.357799530029297, -17.522937774658203, -16.688074111938477, -15.853211402893066, -15.018348693847656, -14.18348503112793, -13.348623275756836, -12.51375961303711, -11.6788969039917, -10.844034194946289, -10.009171485900879, -9.174308776855469, -8.339446067810059, -7.50458288192749, -6.66972017288208, -5.83485746383667, -4.999994277954102, -4.165131568908691, -3.3302688598632812, -2.495406150817871, -1.6605432033538818, -0.8256802558898926, 0.009182453155517578, 0.8440451622009277, 1.678908348083496, 2.5137710571289062, 3.3486337661743164, 4.183496475219727, 5.018359184265137, 5.853222370147705, 6.688085079193115, 7.522947788238525, 8.357810974121094, 9.192673683166504, 10.027536392211914, 10.862399101257324, 11.697261810302734, 12.532125473022461, 13.366987228393555, 14.201850891113281, 15.036713600158691, 15.871576309204102, 16.706439971923828, 17.541303634643555, 18.37616539001465, 19.211029052734375, 20.04589080810547, 20.880754470825195, 21.715618133544922, 22.550479888916016, 23.38534164428711]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 4.0, 6.0, 9.0, 10.0, 6.0, 17.0, 15.0, 18.0, 12.0, 17.0, 19.0, 36.0, 29.0, 34.0, 41.0, 40.0, 28.0, 45.0, 33.0, 52.0, 39.0, 52.0, 56.0, 36.0, 34.0, 29.0, 36.0, 35.0, 33.0, 31.0, 16.0, 20.0, 15.0, 25.0, 13.0, 15.0, 11.0, 10.0, 6.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.591285705566406, -9.288394927978516, -8.985504150390625, -8.682613372802734, -8.37972354888916, -8.07683277130127, -7.773941993713379, -7.471051216125488, -7.168160438537598, -6.865269660949707, -6.562379360198975, -6.259488582611084, -5.956597805023193, -5.653707504272461, -5.35081672668457, -5.04792594909668, -4.745035648345947, -4.442144870758057, -4.139254570007324, -3.8363637924194336, -3.533473014831543, -3.2305824756622314, -2.92769193649292, -2.6248011589050293, -2.3219106197357178, -2.0190200805664062, -1.7161293029785156, -1.413238763809204, -1.110348105430603, -0.807457447052002, -0.5045669078826904, -0.2016761302947998, 0.10121440887451172, 0.4041050374507904, 0.7069956660270691, 1.0098862648010254, 1.3127769231796265, 1.6156675815582275, 1.918558120727539, 2.2214488983154297, 2.524339437484741, 2.8272299766540527, 3.1301207542419434, 3.433011293411255, 3.7359018325805664, 4.038792610168457, 4.341683387756348, 4.644574165344238, 4.947464466094971, 5.250355243682861, 5.553245544433594, 5.856136322021484, 6.159027099609375, 6.461917877197266, 6.764808177947998, 7.067698955535889, 7.370589256286621, 7.673480033874512, 7.976370334625244, 8.279260635375977, 8.582151412963867, 8.885042190551758, 9.187932968139648, 9.490823745727539, 9.79371452331543]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 15.0, 18.0, 15.0, 46.0, 54.0, 75.0, 108.0, 169.0, 274.0, 444.0, 663.0, 1075.0, 1894.0, 3114.0, 5777.0, 10529.0, 20631.0, 42110.0, 92068.0, 230837.0, 688398.0, 1624442.0, 941069.0, 307407.0, 116070.0, 51855.0, 25305.0, 13196.0, 7039.0, 3829.0, 2226.0, 1297.0, 778.0, 521.0, 326.0, 196.0, 139.0, 87.0, 58.0, 42.0, 28.0, 17.0, 15.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.5615234375, -1.516448974609375, -1.47137451171875, -1.426300048828125, -1.3812255859375, -1.336151123046875, -1.29107666015625, -1.246002197265625, -1.200927734375, -1.155853271484375, -1.11077880859375, -1.065704345703125, -1.0206298828125, -0.975555419921875, -0.93048095703125, -0.885406494140625, -0.84033203125, -0.795257568359375, -0.75018310546875, -0.705108642578125, -0.6600341796875, -0.614959716796875, -0.56988525390625, -0.524810791015625, -0.479736328125, -0.434661865234375, -0.38958740234375, -0.344512939453125, -0.2994384765625, -0.254364013671875, -0.20928955078125, -0.164215087890625, -0.119140625, -0.074066162109375, -0.02899169921875, 0.016082763671875, 0.0611572265625, 0.106231689453125, 0.15130615234375, 0.196380615234375, 0.241455078125, 0.286529541015625, 0.33160400390625, 0.376678466796875, 0.4217529296875, 0.466827392578125, 0.51190185546875, 0.556976318359375, 0.60205078125, 0.647125244140625, 0.69219970703125, 0.737274169921875, 0.7823486328125, 0.827423095703125, 0.87249755859375, 0.917572021484375, 0.962646484375, 1.007720947265625, 1.05279541015625, 1.097869873046875, 1.1429443359375, 1.188018798828125, 1.23309326171875, 1.278167724609375, 1.3232421875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 9.0, 2.0, 6.0, 9.0, 10.0, 5.0, 18.0, 15.0, 22.0, 29.0, 22.0, 32.0, 40.0, 31.0, 25.0, 41.0, 57.0, 50.0, 44.0, 43.0, 51.0, 49.0, 53.0, 46.0, 49.0, 49.0, 42.0, 32.0, 25.0, 14.0, 9.0, 17.0, 20.0, 7.0, 7.0, 12.0, 9.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4033203125, -1.357391357421875, -1.31146240234375, -1.265533447265625, -1.2196044921875, -1.173675537109375, -1.12774658203125, -1.081817626953125, -1.035888671875, -0.989959716796875, -0.94403076171875, -0.898101806640625, -0.8521728515625, -0.806243896484375, -0.76031494140625, -0.714385986328125, -0.66845703125, -0.622528076171875, -0.57659912109375, -0.530670166015625, -0.4847412109375, -0.438812255859375, -0.39288330078125, -0.346954345703125, -0.301025390625, -0.255096435546875, -0.20916748046875, -0.163238525390625, -0.1173095703125, -0.071380615234375, -0.02545166015625, 0.020477294921875, 0.06640625, 0.112335205078125, 0.15826416015625, 0.204193115234375, 0.2501220703125, 0.296051025390625, 0.34197998046875, 0.387908935546875, 0.433837890625, 0.479766845703125, 0.52569580078125, 0.571624755859375, 0.6175537109375, 0.663482666015625, 0.70941162109375, 0.755340576171875, 0.80126953125, 0.847198486328125, 0.89312744140625, 0.939056396484375, 0.9849853515625, 1.030914306640625, 1.07684326171875, 1.122772216796875, 1.168701171875, 1.214630126953125, 1.26055908203125, 1.306488037109375, 1.3524169921875, 1.398345947265625, 1.44427490234375, 1.490203857421875, 1.5361328125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 8.0, 14.0, 13.0, 19.0, 27.0, 23.0, 42.0, 64.0, 90.0, 155.0, 237.0, 379.0, 668.0, 1106.0, 2065.0, 3736.0, 7401.0, 15239.0, 33780.0, 79122.0, 203203.0, 704962.0, 2122656.0, 680380.0, 197816.0, 77613.0, 32885.0, 14940.0, 7227.0, 3648.0, 1968.0, 1054.0, 584.0, 386.0, 246.0, 173.0, 106.0, 76.0, 58.0, 32.0, 22.0, 17.0, 7.0, 8.0, 8.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0], "bins": [-2.21875, -2.1544189453125, -2.090087890625, -2.0257568359375, -1.96142578125, -1.8970947265625, -1.832763671875, -1.7684326171875, -1.7041015625, -1.6397705078125, -1.575439453125, -1.5111083984375, -1.44677734375, -1.3824462890625, -1.318115234375, -1.2537841796875, -1.189453125, -1.1251220703125, -1.060791015625, -0.9964599609375, -0.93212890625, -0.8677978515625, -0.803466796875, -0.7391357421875, -0.6748046875, -0.6104736328125, -0.546142578125, -0.4818115234375, -0.41748046875, -0.3531494140625, -0.288818359375, -0.2244873046875, -0.16015625, -0.0958251953125, -0.031494140625, 0.0328369140625, 0.09716796875, 0.1614990234375, 0.225830078125, 0.2901611328125, 0.3544921875, 0.4188232421875, 0.483154296875, 0.5474853515625, 0.61181640625, 0.6761474609375, 0.740478515625, 0.8048095703125, 0.869140625, 0.9334716796875, 0.997802734375, 1.0621337890625, 1.12646484375, 1.1907958984375, 1.255126953125, 1.3194580078125, 1.3837890625, 1.4481201171875, 1.512451171875, 1.5767822265625, 1.64111328125, 1.7054443359375, 1.769775390625, 1.8341064453125, 1.8984375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 9.0, 9.0, 6.0, 24.0, 13.0, 22.0, 25.0, 38.0, 42.0, 44.0, 60.0, 104.0, 108.0, 184.0, 238.0, 391.0, 583.0, 597.0, 489.0, 298.0, 204.0, 149.0, 98.0, 96.0, 50.0, 47.0, 25.0, 22.0, 23.0, 14.0, 9.0, 14.0, 5.0, 8.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.32421875, -2.239044189453125, -2.15386962890625, -2.068695068359375, -1.9835205078125, -1.898345947265625, -1.81317138671875, -1.727996826171875, -1.642822265625, -1.557647705078125, -1.47247314453125, -1.387298583984375, -1.3021240234375, -1.216949462890625, -1.13177490234375, -1.046600341796875, -0.96142578125, -0.876251220703125, -0.79107666015625, -0.705902099609375, -0.6207275390625, -0.535552978515625, -0.45037841796875, -0.365203857421875, -0.280029296875, -0.194854736328125, -0.10968017578125, -0.024505615234375, 0.0606689453125, 0.145843505859375, 0.23101806640625, 0.316192626953125, 0.4013671875, 0.486541748046875, 0.57171630859375, 0.656890869140625, 0.7420654296875, 0.827239990234375, 0.91241455078125, 0.997589111328125, 1.082763671875, 1.167938232421875, 1.25311279296875, 1.338287353515625, 1.4234619140625, 1.508636474609375, 1.59381103515625, 1.678985595703125, 1.76416015625, 1.849334716796875, 1.93450927734375, 2.019683837890625, 2.1048583984375, 2.190032958984375, 2.27520751953125, 2.360382080078125, 2.445556640625, 2.530731201171875, 2.61590576171875, 2.701080322265625, 2.7862548828125, 2.871429443359375, 2.95660400390625, 3.041778564453125, 3.126953125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 11.0, 8.0, 22.0, 46.0, 85.0, 133.0, 158.0, 184.0, 139.0, 103.0, 54.0, 33.0, 13.0, 6.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.255273818969727, -27.52445411682129, -26.79363250732422, -26.06281280517578, -25.33199119567871, -24.601171493530273, -23.870349884033203, -23.139530181884766, -22.408708572387695, -21.677888870239258, -20.947067260742188, -20.21624755859375, -19.48542594909668, -18.754606246948242, -18.023784637451172, -17.292964935302734, -16.562145233154297, -15.831324577331543, -15.100503921508789, -14.369683265686035, -13.638862609863281, -12.908041954040527, -12.177221298217773, -11.446401596069336, -10.715579986572266, -9.984759330749512, -9.253938674926758, -8.523118019104004, -7.79229736328125, -7.061476707458496, -6.3306565284729, -5.5998358726501465, -4.869014739990234, -4.1381940841674805, -3.4073734283447266, -2.6765530109405518, -1.9457323551177979, -1.214911699295044, -0.48409128189086914, 0.24672937393188477, 0.9775500297546387, 1.7083706855773926, 2.4391913414001465, 3.1700117588043213, 3.900832414627075, 4.63165283203125, 5.362473487854004, 6.093294143676758, 6.824114799499512, 7.554935455322266, 8.28575611114502, 9.016576766967773, 9.747397422790527, 10.478218078613281, 11.209037780761719, 11.939859390258789, 12.670679092407227, 13.40149974822998, 14.132320404052734, 14.863141059875488, 15.593961715698242, 16.32478141784668, 17.05560302734375, 17.786422729492188, 18.517244338989258]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 6.0, 7.0, 7.0, 10.0, 5.0, 15.0, 5.0, 22.0, 17.0, 21.0, 26.0, 38.0, 29.0, 32.0, 27.0, 33.0, 30.0, 36.0, 35.0, 34.0, 52.0, 41.0, 32.0, 44.0, 34.0, 30.0, 50.0, 38.0, 23.0, 37.0, 37.0, 19.0, 18.0, 19.0, 6.0, 14.0, 15.0, 10.0, 9.0, 8.0, 5.0, 6.0, 0.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.287981033325195, -7.0393266677856445, -6.790672302246094, -6.542017459869385, -6.293363094329834, -6.044708728790283, -5.796053886413574, -5.547399520874023, -5.298745155334473, -5.050090789794922, -4.801436424255371, -4.552781581878662, -4.304127216339111, -4.0554728507995605, -3.8068182468414307, -3.558163642883301, -3.30950927734375, -3.060854911804199, -2.8122003078460693, -2.5635457038879395, -2.3148913383483887, -2.066236972808838, -1.817582368850708, -1.5689278841018677, -1.3202733993530273, -1.071618914604187, -0.8229644298553467, -0.5743099451065063, -0.325655460357666, -0.07700097560882568, 0.17165350914001465, 0.420307993888855, 0.6689624786376953, 0.9176169633865356, 1.166271448135376, 1.4149259328842163, 1.6635804176330566, 1.912234902381897, 2.1608893871307373, 2.409543991088867, 2.658198356628418, 2.9068527221679688, 3.1555073261260986, 3.4041619300842285, 3.6528162956237793, 3.90147066116333, 4.150125503540039, 4.39877986907959, 4.647434234619141, 4.896088600158691, 5.144742965698242, 5.393397808074951, 5.642052173614502, 5.890706539154053, 6.139361381530762, 6.3880157470703125, 6.636670112609863, 6.885324478149414, 7.133978843688965, 7.382633686065674, 7.631288051605225, 7.879942417144775, 8.128597259521484, 8.377251625061035, 8.625905990600586]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 3.0, 3.0, 7.0, 15.0, 16.0, 19.0, 22.0, 47.0, 76.0, 107.0, 155.0, 225.0, 349.0, 607.0, 817.0, 1363.0, 2164.0, 3361.0, 5382.0, 8722.0, 14038.0, 23494.0, 46169.0, 145631.0, 425924.0, 232955.0, 64033.0, 28732.0, 16447.0, 10140.0, 6372.0, 4188.0, 2477.0, 1606.0, 996.0, 690.0, 436.0, 269.0, 179.0, 107.0, 75.0, 45.0, 34.0, 22.0, 14.0, 10.0, 8.0, 6.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9638671875, -1.8953704833984375, -1.826873779296875, -1.7583770751953125, -1.68988037109375, -1.6213836669921875, -1.552886962890625, -1.4843902587890625, -1.4158935546875, -1.3473968505859375, -1.278900146484375, -1.2104034423828125, -1.14190673828125, -1.0734100341796875, -1.004913330078125, -0.9364166259765625, -0.867919921875, -0.7994232177734375, -0.730926513671875, -0.6624298095703125, -0.59393310546875, -0.5254364013671875, -0.456939697265625, -0.3884429931640625, -0.3199462890625, -0.2514495849609375, -0.182952880859375, -0.1144561767578125, -0.04595947265625, 0.0225372314453125, 0.091033935546875, 0.1595306396484375, 0.22802734375, 0.2965240478515625, 0.365020751953125, 0.4335174560546875, 0.50201416015625, 0.5705108642578125, 0.639007568359375, 0.7075042724609375, 0.7760009765625, 0.8444976806640625, 0.912994384765625, 0.9814910888671875, 1.04998779296875, 1.1184844970703125, 1.186981201171875, 1.2554779052734375, 1.323974609375, 1.3924713134765625, 1.460968017578125, 1.5294647216796875, 1.59796142578125, 1.6664581298828125, 1.734954833984375, 1.8034515380859375, 1.8719482421875, 1.9404449462890625, 2.008941650390625, 2.0774383544921875, 2.14593505859375, 2.2144317626953125, 2.282928466796875, 2.3514251708984375, 2.419921875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 6.0, 7.0, 13.0, 11.0, 11.0, 16.0, 18.0, 14.0, 22.0, 23.0, 16.0, 26.0, 26.0, 30.0, 29.0, 34.0, 35.0, 45.0, 45.0, 46.0, 36.0, 30.0, 39.0, 46.0, 34.0, 38.0, 34.0, 36.0, 30.0, 23.0, 21.0, 15.0, 20.0, 15.0, 24.0, 12.0, 14.0, 5.0, 6.0, 5.0, 5.0, 9.0, 4.0, 7.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.099609375, -1.0633392333984375, -1.027069091796875, -0.9907989501953125, -0.95452880859375, -0.9182586669921875, -0.881988525390625, -0.8457183837890625, -0.8094482421875, -0.7731781005859375, -0.736907958984375, -0.7006378173828125, -0.66436767578125, -0.6280975341796875, -0.591827392578125, -0.5555572509765625, -0.519287109375, -0.4830169677734375, -0.446746826171875, -0.4104766845703125, -0.37420654296875, -0.3379364013671875, -0.301666259765625, -0.2653961181640625, -0.2291259765625, -0.1928558349609375, -0.156585693359375, -0.1203155517578125, -0.08404541015625, -0.0477752685546875, -0.011505126953125, 0.0247650146484375, 0.06103515625, 0.0973052978515625, 0.133575439453125, 0.1698455810546875, 0.20611572265625, 0.2423858642578125, 0.278656005859375, 0.3149261474609375, 0.3511962890625, 0.3874664306640625, 0.423736572265625, 0.4600067138671875, 0.49627685546875, 0.5325469970703125, 0.568817138671875, 0.6050872802734375, 0.641357421875, 0.6776275634765625, 0.713897705078125, 0.7501678466796875, 0.78643798828125, 0.8227081298828125, 0.858978271484375, 0.8952484130859375, 0.9315185546875, 0.9677886962890625, 1.004058837890625, 1.0403289794921875, 1.07659912109375, 1.1128692626953125, 1.149139404296875, 1.1854095458984375, 1.2216796875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 4.0, 7.0, 10.0, 11.0, 16.0, 12.0, 26.0, 34.0, 31.0, 56.0, 92.0, 109.0, 166.0, 281.0, 448.0, 849.0, 1537.0, 3142.0, 6837.0, 15144.0, 35940.0, 138158.0, 605665.0, 169558.0, 39280.0, 16353.0, 7442.0, 3421.0, 1649.0, 861.0, 477.0, 281.0, 194.0, 126.0, 99.0, 68.0, 52.0, 35.0, 27.0, 21.0, 12.0, 5.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.251953125, -3.1455078125, -3.0390625, -2.9326171875, -2.826171875, -2.7197265625, -2.61328125, -2.5068359375, -2.400390625, -2.2939453125, -2.1875, -2.0810546875, -1.974609375, -1.8681640625, -1.76171875, -1.6552734375, -1.548828125, -1.4423828125, -1.3359375, -1.2294921875, -1.123046875, -1.0166015625, -0.91015625, -0.8037109375, -0.697265625, -0.5908203125, -0.484375, -0.3779296875, -0.271484375, -0.1650390625, -0.05859375, 0.0478515625, 0.154296875, 0.2607421875, 0.3671875, 0.4736328125, 0.580078125, 0.6865234375, 0.79296875, 0.8994140625, 1.005859375, 1.1123046875, 1.21875, 1.3251953125, 1.431640625, 1.5380859375, 1.64453125, 1.7509765625, 1.857421875, 1.9638671875, 2.0703125, 2.1767578125, 2.283203125, 2.3896484375, 2.49609375, 2.6025390625, 2.708984375, 2.8154296875, 2.921875, 3.0283203125, 3.134765625, 3.2412109375, 3.34765625, 3.4541015625, 3.560546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 6.0, 6.0, 7.0, 7.0, 12.0, 21.0, 11.0, 23.0, 27.0, 27.0, 33.0, 32.0, 46.0, 38.0, 44.0, 49.0, 50.0, 49.0, 40.0, 39.0, 55.0, 39.0, 35.0, 38.0, 43.0, 24.0, 32.0, 33.0, 28.0, 20.0, 16.0, 7.0, 17.0, 9.0, 8.0, 6.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1484375, -4.0186767578125, -3.888916015625, -3.7591552734375, -3.62939453125, -3.4996337890625, -3.369873046875, -3.2401123046875, -3.1103515625, -2.9805908203125, -2.850830078125, -2.7210693359375, -2.59130859375, -2.4615478515625, -2.331787109375, -2.2020263671875, -2.072265625, -1.9425048828125, -1.812744140625, -1.6829833984375, -1.55322265625, -1.4234619140625, -1.293701171875, -1.1639404296875, -1.0341796875, -0.9044189453125, -0.774658203125, -0.6448974609375, -0.51513671875, -0.3853759765625, -0.255615234375, -0.1258544921875, 0.00390625, 0.1336669921875, 0.263427734375, 0.3931884765625, 0.52294921875, 0.6527099609375, 0.782470703125, 0.9122314453125, 1.0419921875, 1.1717529296875, 1.301513671875, 1.4312744140625, 1.56103515625, 1.6907958984375, 1.820556640625, 1.9503173828125, 2.080078125, 2.2098388671875, 2.339599609375, 2.4693603515625, 2.59912109375, 2.7288818359375, 2.858642578125, 2.9884033203125, 3.1181640625, 3.2479248046875, 3.377685546875, 3.5074462890625, 3.63720703125, 3.7669677734375, 3.896728515625, 4.0264892578125, 4.15625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 8.0, 17.0, 28.0, 42.0, 63.0, 91.0, 158.0, 305.0, 453.0, 762.0, 1439.0, 2663.0, 4660.0, 9075.0, 17763.0, 36018.0, 80668.0, 264858.0, 404916.0, 125448.0, 49527.0, 23735.0, 11896.0, 6363.0, 3405.0, 1761.0, 985.0, 563.0, 306.0, 203.0, 107.0, 87.0, 47.0, 44.0, 25.0, 22.0, 11.0, 4.0, 3.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.017578125, -0.988677978515625, -0.95977783203125, -0.930877685546875, -0.9019775390625, -0.873077392578125, -0.84417724609375, -0.815277099609375, -0.786376953125, -0.757476806640625, -0.72857666015625, -0.699676513671875, -0.6707763671875, -0.641876220703125, -0.61297607421875, -0.584075927734375, -0.55517578125, -0.526275634765625, -0.49737548828125, -0.468475341796875, -0.4395751953125, -0.410675048828125, -0.38177490234375, -0.352874755859375, -0.323974609375, -0.295074462890625, -0.26617431640625, -0.237274169921875, -0.2083740234375, -0.179473876953125, -0.15057373046875, -0.121673583984375, -0.0927734375, -0.063873291015625, -0.03497314453125, -0.006072998046875, 0.0228271484375, 0.051727294921875, 0.08062744140625, 0.109527587890625, 0.138427734375, 0.167327880859375, 0.19622802734375, 0.225128173828125, 0.2540283203125, 0.282928466796875, 0.31182861328125, 0.340728759765625, 0.36962890625, 0.398529052734375, 0.42742919921875, 0.456329345703125, 0.4852294921875, 0.514129638671875, 0.54302978515625, 0.571929931640625, 0.600830078125, 0.629730224609375, 0.65863037109375, 0.687530517578125, 0.7164306640625, 0.745330810546875, 0.77423095703125, 0.803131103515625, 0.83203125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 5.0, 8.0, 8.0, 10.0, 12.0, 15.0, 23.0, 26.0, 30.0, 51.0, 99.0, 129.0, 173.0, 130.0, 82.0, 43.0, 39.0, 22.0, 16.0, 20.0, 8.0, 7.0, 8.0, 6.0, 7.0, 3.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00028014183044433594, -0.00027026981115341187, -0.0002603977918624878, -0.0002505257725715637, -0.00024065375328063965, -0.00023078173398971558, -0.0002209097146987915, -0.00021103769540786743, -0.00020116567611694336, -0.0001912936568260193, -0.00018142163753509521, -0.00017154961824417114, -0.00016167759895324707, -0.000151805579662323, -0.00014193356037139893, -0.00013206154108047485, -0.00012218952178955078, -0.00011231750249862671, -0.00010244548320770264, -9.257346391677856e-05, -8.270144462585449e-05, -7.282942533493042e-05, -6.295740604400635e-05, -5.3085386753082275e-05, -4.32133674621582e-05, -3.334134817123413e-05, -2.346932888031006e-05, -1.3597309589385986e-05, -3.725290298461914e-06, 6.146728992462158e-06, 1.601874828338623e-05, 2.5890767574310303e-05, 3.5762786865234375e-05, 4.563480615615845e-05, 5.550682544708252e-05, 6.537884473800659e-05, 7.525086402893066e-05, 8.512288331985474e-05, 9.499490261077881e-05, 0.00010486692190170288, 0.00011473894119262695, 0.00012461096048355103, 0.0001344829797744751, 0.00014435499906539917, 0.00015422701835632324, 0.00016409903764724731, 0.0001739710569381714, 0.00018384307622909546, 0.00019371509552001953, 0.0002035871148109436, 0.00021345913410186768, 0.00022333115339279175, 0.00023320317268371582, 0.0002430751919746399, 0.00025294721126556396, 0.00026281923055648804, 0.0002726912498474121, 0.0002825632691383362, 0.00029243528842926025, 0.0003023073077201843, 0.0003121793270111084, 0.00032205134630203247, 0.00033192336559295654, 0.0003417953848838806, 0.0003516674041748047]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 12.0, 10.0, 18.0, 34.0, 47.0, 58.0, 70.0, 131.0, 187.0, 321.0, 546.0, 969.0, 2174.0, 4879.0, 12525.0, 33813.0, 107387.0, 409817.0, 341200.0, 86684.0, 28827.0, 10560.0, 4250.0, 1843.0, 929.0, 455.0, 276.0, 159.0, 113.0, 75.0, 43.0, 47.0, 25.0, 19.0, 12.0, 13.0, 7.0, 6.0, 5.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.236328125, -1.1998748779296875, -1.163421630859375, -1.1269683837890625, -1.09051513671875, -1.0540618896484375, -1.017608642578125, -0.9811553955078125, -0.9447021484375, -0.9082489013671875, -0.871795654296875, -0.8353424072265625, -0.79888916015625, -0.7624359130859375, -0.725982666015625, -0.6895294189453125, -0.653076171875, -0.6166229248046875, -0.580169677734375, -0.5437164306640625, -0.50726318359375, -0.4708099365234375, -0.434356689453125, -0.3979034423828125, -0.3614501953125, -0.3249969482421875, -0.288543701171875, -0.2520904541015625, -0.21563720703125, -0.1791839599609375, -0.142730712890625, -0.1062774658203125, -0.06982421875, -0.0333709716796875, 0.003082275390625, 0.0395355224609375, 0.07598876953125, 0.1124420166015625, 0.148895263671875, 0.1853485107421875, 0.2218017578125, 0.2582550048828125, 0.294708251953125, 0.3311614990234375, 0.36761474609375, 0.4040679931640625, 0.440521240234375, 0.4769744873046875, 0.513427734375, 0.5498809814453125, 0.586334228515625, 0.6227874755859375, 0.65924072265625, 0.6956939697265625, 0.732147216796875, 0.7686004638671875, 0.8050537109375, 0.8415069580078125, 0.877960205078125, 0.9144134521484375, 0.95086669921875, 0.9873199462890625, 1.023773193359375, 1.0602264404296875, 1.0966796875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 5.0, 12.0, 7.0, 9.0, 6.0, 10.0, 15.0, 15.0, 22.0, 30.0, 55.0, 70.0, 101.0, 104.0, 102.0, 92.0, 79.0, 66.0, 42.0, 31.0, 30.0, 20.0, 22.0, 14.0, 11.0, 12.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1513671875, -1.1108856201171875, -1.070404052734375, -1.0299224853515625, -0.98944091796875, -0.9489593505859375, -0.908477783203125, -0.8679962158203125, -0.8275146484375, -0.7870330810546875, -0.746551513671875, -0.7060699462890625, -0.66558837890625, -0.6251068115234375, -0.584625244140625, -0.5441436767578125, -0.503662109375, -0.4631805419921875, -0.422698974609375, -0.3822174072265625, -0.34173583984375, -0.3012542724609375, -0.260772705078125, -0.2202911376953125, -0.1798095703125, -0.1393280029296875, -0.098846435546875, -0.0583648681640625, -0.01788330078125, 0.0225982666015625, 0.063079833984375, 0.1035614013671875, 0.14404296875, 0.1845245361328125, 0.225006103515625, 0.2654876708984375, 0.30596923828125, 0.3464508056640625, 0.386932373046875, 0.4274139404296875, 0.4678955078125, 0.5083770751953125, 0.548858642578125, 0.5893402099609375, 0.62982177734375, 0.6703033447265625, 0.710784912109375, 0.7512664794921875, 0.791748046875, 0.8322296142578125, 0.872711181640625, 0.9131927490234375, 0.95367431640625, 0.9941558837890625, 1.034637451171875, 1.0751190185546875, 1.1156005859375, 1.1560821533203125, 1.196563720703125, 1.2370452880859375, 1.27752685546875, 1.3180084228515625, 1.358489990234375, 1.3989715576171875, 1.439453125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 12.0, 35.0, 85.0, 160.0, 210.0, 218.0, 150.0, 76.0, 26.0, 11.0, 8.0, 6.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.011390686035156, -38.19955825805664, -37.38772201538086, -36.575889587402344, -35.76405715942383, -34.95222091674805, -34.14038848876953, -33.328556060791016, -32.516719818115234, -31.704885482788086, -30.89305305480957, -30.081218719482422, -29.269384384155273, -28.457551956176758, -27.64571762084961, -26.833885192871094, -26.022052764892578, -25.21021842956543, -24.398386001586914, -23.586551666259766, -22.774717330932617, -21.9628849029541, -21.151050567626953, -20.339218139648438, -19.527381896972656, -18.715547561645508, -17.903715133666992, -17.091880798339844, -16.280046463012695, -15.46821403503418, -14.656379699707031, -13.8445463180542, -13.032712936401367, -12.220879554748535, -11.409045219421387, -10.597211837768555, -9.785378456115723, -8.97354507446289, -8.161710739135742, -7.34987735748291, -6.53804349899292, -5.72620964050293, -4.914376258850098, -4.102542400360107, -3.2907087802886963, -2.478875160217285, -1.667041301727295, -0.8552079200744629, -0.043374061584472656, 0.7684596180915833, 1.5802932977676392, 2.39212703704834, 3.203960657119751, 4.015794277191162, 4.827628135681152, 5.639461517333984, 6.451295375823975, 7.263129234313965, 8.074962615966797, 8.886796951293945, 9.698630332946777, 10.51046371459961, 11.322298049926758, 12.134130477905273, 12.945964813232422]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 5.0, 10.0, 11.0, 10.0, 5.0, 15.0, 13.0, 13.0, 17.0, 24.0, 20.0, 20.0, 32.0, 28.0, 30.0, 33.0, 34.0, 31.0, 39.0, 49.0, 31.0, 46.0, 46.0, 42.0, 38.0, 35.0, 43.0, 32.0, 33.0, 35.0, 15.0, 14.0, 23.0, 20.0, 20.0, 12.0, 14.0, 15.0, 7.0, 9.0, 8.0, 7.0, 6.0, 5.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.96891975402832, -8.688530921936035, -8.40814208984375, -8.127754211425781, -7.847365379333496, -7.566976547241211, -7.286588191986084, -7.006199836730957, -6.725811004638672, -6.445422172546387, -6.16503381729126, -5.884645462036133, -5.604256629943848, -5.3238677978515625, -5.0434794425964355, -4.763091087341309, -4.482702255249023, -4.202313423156738, -3.9219250679016113, -3.6415364742279053, -3.361147880554199, -3.080759286880493, -2.800370693206787, -2.519982099533081, -2.239593505859375, -1.959204912185669, -1.678816318511963, -1.3984277248382568, -1.1180391311645508, -0.8376505374908447, -0.5572619438171387, -0.2768733501434326, 0.0035152435302734375, 0.2839038372039795, 0.5642924308776855, 0.8446810245513916, 1.1250696182250977, 1.4054582118988037, 1.6858468055725098, 1.9662353992462158, 2.246623992919922, 2.527012586593628, 2.807401180267334, 3.08778977394104, 3.368178367614746, 3.648566961288452, 3.928955554962158, 4.209343910217285, 4.48973274230957, 4.7701215744018555, 5.050509929656982, 5.330898284912109, 5.6112871170043945, 5.89167594909668, 6.172064304351807, 6.452452659606934, 6.732841491699219, 7.013230323791504, 7.293618679046631, 7.574007034301758, 7.854395866394043, 8.134784698486328, 8.415172576904297, 8.695561408996582, 8.975950241088867]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 8.0, 17.0, 13.0, 24.0, 41.0, 48.0, 82.0, 121.0, 178.0, 292.0, 413.0, 742.0, 1193.0, 2044.0, 3613.0, 6184.0, 11284.0, 20774.0, 39018.0, 76262.0, 162839.0, 393572.0, 956903.0, 1297863.0, 698476.0, 279634.0, 119799.0, 57802.0, 29587.0, 15649.0, 8469.0, 4742.0, 2740.0, 1555.0, 874.0, 545.0, 311.0, 200.0, 142.0, 75.0, 54.0, 40.0, 23.0, 13.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.283203125, -1.24346923828125, -1.2037353515625, -1.16400146484375, -1.124267578125, -1.08453369140625, -1.0447998046875, -1.00506591796875, -0.96533203125, -0.92559814453125, -0.8858642578125, -0.84613037109375, -0.806396484375, -0.76666259765625, -0.7269287109375, -0.68719482421875, -0.6474609375, -0.60772705078125, -0.5679931640625, -0.52825927734375, -0.488525390625, -0.44879150390625, -0.4090576171875, -0.36932373046875, -0.32958984375, -0.28985595703125, -0.2501220703125, -0.21038818359375, -0.170654296875, -0.13092041015625, -0.0911865234375, -0.05145263671875, -0.01171875, 0.02801513671875, 0.0677490234375, 0.10748291015625, 0.147216796875, 0.18695068359375, 0.2266845703125, 0.26641845703125, 0.30615234375, 0.34588623046875, 0.3856201171875, 0.42535400390625, 0.465087890625, 0.50482177734375, 0.5445556640625, 0.58428955078125, 0.6240234375, 0.66375732421875, 0.7034912109375, 0.74322509765625, 0.782958984375, 0.82269287109375, 0.8624267578125, 0.90216064453125, 0.94189453125, 0.98162841796875, 1.0213623046875, 1.06109619140625, 1.100830078125, 1.14056396484375, 1.1802978515625, 1.22003173828125, 1.259765625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 8.0, 7.0, 14.0, 10.0, 13.0, 6.0, 28.0, 18.0, 17.0, 31.0, 29.0, 40.0, 27.0, 30.0, 36.0, 42.0, 40.0, 38.0, 43.0, 34.0, 52.0, 42.0, 39.0, 38.0, 31.0, 41.0, 28.0, 38.0, 30.0, 25.0, 21.0, 21.0, 14.0, 14.0, 8.0, 7.0, 10.0, 5.0, 5.0, 5.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.353515625, -1.3130645751953125, -1.272613525390625, -1.2321624755859375, -1.19171142578125, -1.1512603759765625, -1.110809326171875, -1.0703582763671875, -1.0299072265625, -0.9894561767578125, -0.949005126953125, -0.9085540771484375, -0.86810302734375, -0.8276519775390625, -0.787200927734375, -0.7467498779296875, -0.706298828125, -0.6658477783203125, -0.625396728515625, -0.5849456787109375, -0.54449462890625, -0.5040435791015625, -0.463592529296875, -0.4231414794921875, -0.3826904296875, -0.3422393798828125, -0.301788330078125, -0.2613372802734375, -0.22088623046875, -0.1804351806640625, -0.139984130859375, -0.0995330810546875, -0.05908203125, -0.0186309814453125, 0.021820068359375, 0.0622711181640625, 0.10272216796875, 0.1431732177734375, 0.183624267578125, 0.2240753173828125, 0.2645263671875, 0.3049774169921875, 0.345428466796875, 0.3858795166015625, 0.42633056640625, 0.4667816162109375, 0.507232666015625, 0.5476837158203125, 0.588134765625, 0.6285858154296875, 0.669036865234375, 0.7094879150390625, 0.74993896484375, 0.7903900146484375, 0.830841064453125, 0.8712921142578125, 0.9117431640625, 0.9521942138671875, 0.992645263671875, 1.0330963134765625, 1.07354736328125, 1.1139984130859375, 1.154449462890625, 1.1949005126953125, 1.2353515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 7.0, 7.0, 5.0, 13.0, 14.0, 26.0, 34.0, 57.0, 107.0, 179.0, 258.0, 513.0, 996.0, 2031.0, 4730.0, 13332.0, 47231.0, 207132.0, 1482285.0, 2073938.0, 274529.0, 60180.0, 16555.0, 5351.0, 2299.0, 1086.0, 575.0, 307.0, 174.0, 116.0, 76.0, 50.0, 25.0, 21.0, 18.0, 9.0, 8.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.34765625, -3.23638916015625, -3.1251220703125, -3.01385498046875, -2.902587890625, -2.79132080078125, -2.6800537109375, -2.56878662109375, -2.45751953125, -2.34625244140625, -2.2349853515625, -2.12371826171875, -2.012451171875, -1.90118408203125, -1.7899169921875, -1.67864990234375, -1.5673828125, -1.45611572265625, -1.3448486328125, -1.23358154296875, -1.122314453125, -1.01104736328125, -0.8997802734375, -0.78851318359375, -0.67724609375, -0.56597900390625, -0.4547119140625, -0.34344482421875, -0.232177734375, -0.12091064453125, -0.0096435546875, 0.10162353515625, 0.212890625, 0.32415771484375, 0.4354248046875, 0.54669189453125, 0.657958984375, 0.76922607421875, 0.8804931640625, 0.99176025390625, 1.10302734375, 1.21429443359375, 1.3255615234375, 1.43682861328125, 1.548095703125, 1.65936279296875, 1.7706298828125, 1.88189697265625, 1.9931640625, 2.10443115234375, 2.2156982421875, 2.32696533203125, 2.438232421875, 2.54949951171875, 2.6607666015625, 2.77203369140625, 2.88330078125, 2.99456787109375, 3.1058349609375, 3.21710205078125, 3.328369140625, 3.43963623046875, 3.5509033203125, 3.66217041015625, 3.7734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 1.0, 5.0, 3.0, 7.0, 9.0, 7.0, 10.0, 18.0, 17.0, 29.0, 34.0, 63.0, 77.0, 111.0, 174.0, 231.0, 346.0, 547.0, 695.0, 578.0, 373.0, 229.0, 151.0, 99.0, 85.0, 49.0, 35.0, 26.0, 21.0, 18.0, 10.0, 5.0, 5.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.24609375, -3.1319580078125, -3.017822265625, -2.9036865234375, -2.78955078125, -2.6754150390625, -2.561279296875, -2.4471435546875, -2.3330078125, -2.2188720703125, -2.104736328125, -1.9906005859375, -1.87646484375, -1.7623291015625, -1.648193359375, -1.5340576171875, -1.419921875, -1.3057861328125, -1.191650390625, -1.0775146484375, -0.96337890625, -0.8492431640625, -0.735107421875, -0.6209716796875, -0.5068359375, -0.3927001953125, -0.278564453125, -0.1644287109375, -0.05029296875, 0.0638427734375, 0.177978515625, 0.2921142578125, 0.40625, 0.5203857421875, 0.634521484375, 0.7486572265625, 0.86279296875, 0.9769287109375, 1.091064453125, 1.2052001953125, 1.3193359375, 1.4334716796875, 1.547607421875, 1.6617431640625, 1.77587890625, 1.8900146484375, 2.004150390625, 2.1182861328125, 2.232421875, 2.3465576171875, 2.460693359375, 2.5748291015625, 2.68896484375, 2.8031005859375, 2.917236328125, 3.0313720703125, 3.1455078125, 3.2596435546875, 3.373779296875, 3.4879150390625, 3.60205078125, 3.7161865234375, 3.830322265625, 3.9444580078125, 4.05859375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 7.0, 21.0, 53.0, 98.0, 142.0, 211.0, 162.0, 146.0, 88.0, 32.0, 20.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.23779296875, -30.350013732910156, -29.462234497070312, -28.57445526123047, -27.686677932739258, -26.798898696899414, -25.91111946105957, -25.023340225219727, -24.135560989379883, -23.24778175354004, -22.360002517700195, -21.472225189208984, -20.58444595336914, -19.696666717529297, -18.808887481689453, -17.92110824584961, -17.033329010009766, -16.145549774169922, -15.257771492004395, -14.36999225616455, -13.482213020324707, -12.59443473815918, -11.706655502319336, -10.818876266479492, -9.931098937988281, -9.043319702148438, -8.15554141998291, -7.267762184143066, -6.379982948303223, -5.492204189300537, -4.604425430297852, -3.716646194458008, -2.828866958618164, -1.9410879611968994, -1.0533090829849243, -0.16553020477294922, 0.7222487926483154, 1.61002779006958, 2.4978065490722656, 3.3855857849121094, 4.273364543914795, 5.1611433029174805, 6.048922538757324, 6.93670129776001, 7.824480056762695, 8.712259292602539, 9.600038528442383, 10.487817764282227, 11.375596046447754, 12.263375282287598, 13.151153564453125, 14.038932800292969, 14.926712036132812, 15.814491271972656, 16.7022705078125, 17.590049743652344, 18.477827072143555, 19.3656063079834, 20.253385543823242, 21.141162872314453, 22.028942108154297, 22.91672134399414, 23.804500579833984, 24.692279815673828, 25.580059051513672]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 4.0, 6.0, 11.0, 13.0, 12.0, 16.0, 12.0, 15.0, 21.0, 32.0, 14.0, 27.0, 21.0, 37.0, 37.0, 34.0, 46.0, 42.0, 45.0, 50.0, 22.0, 29.0, 38.0, 42.0, 41.0, 37.0, 23.0, 33.0, 37.0, 28.0, 24.0, 19.0, 18.0, 18.0, 10.0, 12.0, 5.0, 12.0, 9.0, 4.0, 8.0, 6.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.429837226867676, -9.129307746887207, -8.828777313232422, -8.528247833251953, -8.227717399597168, -7.927187919616699, -7.626657962799072, -7.326128005981445, -7.025598049163818, -6.725068092346191, -6.4245381355285645, -6.1240081787109375, -5.823478698730469, -5.522948265075684, -5.222418785095215, -4.921888828277588, -4.621358871459961, -4.320828914642334, -4.020298957824707, -3.719769239425659, -3.4192392826080322, -3.1187093257904053, -2.8181796073913574, -2.5176496505737305, -2.2171196937561035, -1.9165897369384766, -1.6160598993301392, -1.3155300617218018, -1.0150001049041748, -0.7144701480865479, -0.41394031047821045, -0.11341047286987305, 0.1871204376220703, 0.4876503348350525, 0.7881802320480347, 1.088710069656372, 1.389240026473999, 1.689769983291626, 1.9902998208999634, 2.290829658508301, 2.5913596153259277, 2.8918895721435547, 3.1924195289611816, 3.4929492473602295, 3.7934792041778564, 4.0940093994140625, 4.394538879394531, 4.695068836212158, 4.995598793029785, 5.296128749847412, 5.596658706665039, 5.897188663482666, 6.197718620300293, 6.498248100280762, 6.798778057098389, 7.099308013916016, 7.399837970733643, 7.7003679275512695, 8.000897407531738, 8.301427841186523, 8.601957321166992, 8.902487754821777, 9.203017234802246, 9.503547668457031, 9.8040771484375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 10.0, 4.0, 11.0, 11.0, 30.0, 41.0, 65.0, 77.0, 131.0, 177.0, 274.0, 406.0, 550.0, 861.0, 1235.0, 1797.0, 2674.0, 3855.0, 5579.0, 8388.0, 12552.0, 19748.0, 31592.0, 58773.0, 128451.0, 262106.0, 250673.0, 117502.0, 54738.0, 30043.0, 18551.0, 12094.0, 8158.0, 5576.0, 3778.0, 2585.0, 1755.0, 1183.0, 802.0, 541.0, 369.0, 267.0, 188.0, 118.0, 73.0, 62.0, 29.0, 22.0, 15.0, 14.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 3.0], "bins": [-1.6611328125, -1.6107177734375, -1.560302734375, -1.5098876953125, -1.45947265625, -1.4090576171875, -1.358642578125, -1.3082275390625, -1.2578125, -1.2073974609375, -1.156982421875, -1.1065673828125, -1.05615234375, -1.0057373046875, -0.955322265625, -0.9049072265625, -0.8544921875, -0.8040771484375, -0.753662109375, -0.7032470703125, -0.65283203125, -0.6024169921875, -0.552001953125, -0.5015869140625, -0.451171875, -0.4007568359375, -0.350341796875, -0.2999267578125, -0.24951171875, -0.1990966796875, -0.148681640625, -0.0982666015625, -0.0478515625, 0.0025634765625, 0.052978515625, 0.1033935546875, 0.15380859375, 0.2042236328125, 0.254638671875, 0.3050537109375, 0.35546875, 0.4058837890625, 0.456298828125, 0.5067138671875, 0.55712890625, 0.6075439453125, 0.657958984375, 0.7083740234375, 0.7587890625, 0.8092041015625, 0.859619140625, 0.9100341796875, 0.96044921875, 1.0108642578125, 1.061279296875, 1.1116943359375, 1.162109375, 1.2125244140625, 1.262939453125, 1.3133544921875, 1.36376953125, 1.4141845703125, 1.464599609375, 1.5150146484375, 1.5654296875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 9.0, 6.0, 7.0, 5.0, 16.0, 11.0, 16.0, 13.0, 10.0, 22.0, 23.0, 32.0, 28.0, 37.0, 26.0, 38.0, 37.0, 39.0, 33.0, 46.0, 43.0, 51.0, 44.0, 51.0, 39.0, 43.0, 41.0, 32.0, 33.0, 24.0, 19.0, 12.0, 16.0, 16.0, 11.0, 16.0, 8.0, 7.0, 6.0, 8.0, 6.0, 6.0, 8.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2138671875, -1.172882080078125, -1.13189697265625, -1.090911865234375, -1.0499267578125, -1.008941650390625, -0.96795654296875, -0.926971435546875, -0.885986328125, -0.845001220703125, -0.80401611328125, -0.763031005859375, -0.7220458984375, -0.681060791015625, -0.64007568359375, -0.599090576171875, -0.55810546875, -0.517120361328125, -0.47613525390625, -0.435150146484375, -0.3941650390625, -0.353179931640625, -0.31219482421875, -0.271209716796875, -0.230224609375, -0.189239501953125, -0.14825439453125, -0.107269287109375, -0.0662841796875, -0.025299072265625, 0.01568603515625, 0.056671142578125, 0.09765625, 0.138641357421875, 0.17962646484375, 0.220611572265625, 0.2615966796875, 0.302581787109375, 0.34356689453125, 0.384552001953125, 0.425537109375, 0.466522216796875, 0.50750732421875, 0.548492431640625, 0.5894775390625, 0.630462646484375, 0.67144775390625, 0.712432861328125, 0.75341796875, 0.794403076171875, 0.83538818359375, 0.876373291015625, 0.9173583984375, 0.958343505859375, 0.99932861328125, 1.040313720703125, 1.081298828125, 1.122283935546875, 1.16326904296875, 1.204254150390625, 1.2452392578125, 1.286224365234375, 1.32720947265625, 1.368194580078125, 1.4091796875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 7.0, 11.0, 11.0, 20.0, 13.0, 20.0, 25.0, 35.0, 55.0, 85.0, 163.0, 189.0, 359.0, 713.0, 1324.0, 2933.0, 7003.0, 17594.0, 52482.0, 242496.0, 555380.0, 114108.0, 32577.0, 11813.0, 4766.0, 2018.0, 948.0, 510.0, 322.0, 159.0, 120.0, 94.0, 58.0, 37.0, 20.0, 22.0, 16.0, 10.0, 9.0, 10.0, 6.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.9375, -3.8074951171875, -3.677490234375, -3.5474853515625, -3.41748046875, -3.2874755859375, -3.157470703125, -3.0274658203125, -2.8974609375, -2.7674560546875, -2.637451171875, -2.5074462890625, -2.37744140625, -2.2474365234375, -2.117431640625, -1.9874267578125, -1.857421875, -1.7274169921875, -1.597412109375, -1.4674072265625, -1.33740234375, -1.2073974609375, -1.077392578125, -0.9473876953125, -0.8173828125, -0.6873779296875, -0.557373046875, -0.4273681640625, -0.29736328125, -0.1673583984375, -0.037353515625, 0.0926513671875, 0.22265625, 0.3526611328125, 0.482666015625, 0.6126708984375, 0.74267578125, 0.8726806640625, 1.002685546875, 1.1326904296875, 1.2626953125, 1.3927001953125, 1.522705078125, 1.6527099609375, 1.78271484375, 1.9127197265625, 2.042724609375, 2.1727294921875, 2.302734375, 2.4327392578125, 2.562744140625, 2.6927490234375, 2.82275390625, 2.9527587890625, 3.082763671875, 3.2127685546875, 3.3427734375, 3.4727783203125, 3.602783203125, 3.7327880859375, 3.86279296875, 3.9927978515625, 4.122802734375, 4.2528076171875, 4.3828125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 2.0, 4.0, 10.0, 13.0, 9.0, 12.0, 17.0, 14.0, 27.0, 25.0, 24.0, 34.0, 32.0, 35.0, 27.0, 27.0, 42.0, 41.0, 37.0, 40.0, 55.0, 30.0, 36.0, 37.0, 33.0, 38.0, 34.0, 30.0, 26.0, 24.0, 31.0, 22.0, 15.0, 21.0, 20.0, 9.0, 10.0, 9.0, 9.0, 6.0, 6.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.962890625, -3.842681884765625, -3.72247314453125, -3.602264404296875, -3.4820556640625, -3.361846923828125, -3.24163818359375, -3.121429443359375, -3.001220703125, -2.881011962890625, -2.76080322265625, -2.640594482421875, -2.5203857421875, -2.400177001953125, -2.27996826171875, -2.159759521484375, -2.03955078125, -1.919342041015625, -1.79913330078125, -1.678924560546875, -1.5587158203125, -1.438507080078125, -1.31829833984375, -1.198089599609375, -1.077880859375, -0.957672119140625, -0.83746337890625, -0.717254638671875, -0.5970458984375, -0.476837158203125, -0.35662841796875, -0.236419677734375, -0.1162109375, 0.003997802734375, 0.12420654296875, 0.244415283203125, 0.3646240234375, 0.484832763671875, 0.60504150390625, 0.725250244140625, 0.845458984375, 0.965667724609375, 1.08587646484375, 1.206085205078125, 1.3262939453125, 1.446502685546875, 1.56671142578125, 1.686920166015625, 1.80712890625, 1.927337646484375, 2.04754638671875, 2.167755126953125, 2.2879638671875, 2.408172607421875, 2.52838134765625, 2.648590087890625, 2.768798828125, 2.889007568359375, 3.00921630859375, 3.129425048828125, 3.2496337890625, 3.369842529296875, 3.49005126953125, 3.610260009765625, 3.73046875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 14.0, 9.0, 28.0, 37.0, 68.0, 126.0, 216.0, 336.0, 626.0, 1110.0, 2058.0, 3890.0, 8099.0, 18255.0, 47916.0, 171397.0, 524406.0, 183090.0, 50495.0, 19005.0, 8547.0, 4078.0, 2138.0, 1134.0, 617.0, 343.0, 217.0, 116.0, 75.0, 49.0, 36.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.353515625, -1.306060791015625, -1.25860595703125, -1.211151123046875, -1.1636962890625, -1.116241455078125, -1.06878662109375, -1.021331787109375, -0.973876953125, -0.926422119140625, -0.87896728515625, -0.831512451171875, -0.7840576171875, -0.736602783203125, -0.68914794921875, -0.641693115234375, -0.59423828125, -0.546783447265625, -0.49932861328125, -0.451873779296875, -0.4044189453125, -0.356964111328125, -0.30950927734375, -0.262054443359375, -0.214599609375, -0.167144775390625, -0.11968994140625, -0.072235107421875, -0.0247802734375, 0.022674560546875, 0.07012939453125, 0.117584228515625, 0.1650390625, 0.212493896484375, 0.25994873046875, 0.307403564453125, 0.3548583984375, 0.402313232421875, 0.44976806640625, 0.497222900390625, 0.544677734375, 0.592132568359375, 0.63958740234375, 0.687042236328125, 0.7344970703125, 0.781951904296875, 0.82940673828125, 0.876861572265625, 0.92431640625, 0.971771240234375, 1.01922607421875, 1.066680908203125, 1.1141357421875, 1.161590576171875, 1.20904541015625, 1.256500244140625, 1.303955078125, 1.351409912109375, 1.39886474609375, 1.446319580078125, 1.4937744140625, 1.541229248046875, 1.58868408203125, 1.636138916015625, 1.68359375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 9.0, 4.0, 1.0, 3.0, 3.0, 4.0, 1.0, 8.0, 9.0, 9.0, 12.0, 22.0, 11.0, 28.0, 52.0, 66.0, 124.0, 166.0, 159.0, 82.0, 70.0, 49.0, 23.0, 10.0, 12.0, 10.0, 6.0, 8.0, 6.0, 10.0, 7.0, 2.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00037860870361328125, -0.0003649666905403137, -0.0003513246774673462, -0.00033768266439437866, -0.00032404065132141113, -0.0003103986382484436, -0.0002967566251754761, -0.00028311461210250854, -0.000269472599029541, -0.0002558305859565735, -0.00024218857288360596, -0.00022854655981063843, -0.0002149045467376709, -0.00020126253366470337, -0.00018762052059173584, -0.0001739785075187683, -0.00016033649444580078, -0.00014669448137283325, -0.00013305246829986572, -0.0001194104552268982, -0.00010576844215393066, -9.212642908096313e-05, -7.84844160079956e-05, -6.484240293502808e-05, -5.120038986206055e-05, -3.755837678909302e-05, -2.3916363716125488e-05, -1.0274350643157959e-05, 3.3676624298095703e-06, 1.70096755027771e-05, 3.065168857574463e-05, 4.429370164871216e-05, 5.793571472167969e-05, 7.157772779464722e-05, 8.521974086761475e-05, 9.886175394058228e-05, 0.0001125037670135498, 0.00012614578008651733, 0.00013978779315948486, 0.0001534298062324524, 0.00016707181930541992, 0.00018071383237838745, 0.00019435584545135498, 0.0002079978585243225, 0.00022163987159729004, 0.00023528188467025757, 0.0002489238977432251, 0.0002625659108161926, 0.00027620792388916016, 0.0002898499369621277, 0.0003034919500350952, 0.00031713396310806274, 0.0003307759761810303, 0.0003444179892539978, 0.00035806000232696533, 0.00037170201539993286, 0.0003853440284729004, 0.0003989860415458679, 0.00041262805461883545, 0.000426270067691803, 0.0004399120807647705, 0.00045355409383773804, 0.00046719610691070557, 0.0004808381199836731, 0.0004944801330566406]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 12.0, 9.0, 25.0, 39.0, 63.0, 120.0, 172.0, 334.0, 695.0, 1572.0, 4085.0, 13117.0, 54719.0, 318456.0, 524522.0, 99153.0, 21379.0, 5997.0, 2174.0, 944.0, 451.0, 209.0, 124.0, 69.0, 27.0, 36.0, 13.0, 11.0, 9.0, 5.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9365234375, -1.8798675537109375, -1.823211669921875, -1.7665557861328125, -1.70989990234375, -1.6532440185546875, -1.596588134765625, -1.5399322509765625, -1.4832763671875, -1.4266204833984375, -1.369964599609375, -1.3133087158203125, -1.25665283203125, -1.1999969482421875, -1.143341064453125, -1.0866851806640625, -1.030029296875, -0.9733734130859375, -0.916717529296875, -0.8600616455078125, -0.80340576171875, -0.7467498779296875, -0.690093994140625, -0.6334381103515625, -0.5767822265625, -0.5201263427734375, -0.463470458984375, -0.4068145751953125, -0.35015869140625, -0.2935028076171875, -0.236846923828125, -0.1801910400390625, -0.12353515625, -0.0668792724609375, -0.010223388671875, 0.0464324951171875, 0.10308837890625, 0.1597442626953125, 0.216400146484375, 0.2730560302734375, 0.3297119140625, 0.3863677978515625, 0.443023681640625, 0.4996795654296875, 0.55633544921875, 0.6129913330078125, 0.669647216796875, 0.7263031005859375, 0.782958984375, 0.8396148681640625, 0.896270751953125, 0.9529266357421875, 1.00958251953125, 1.0662384033203125, 1.122894287109375, 1.1795501708984375, 1.2362060546875, 1.2928619384765625, 1.349517822265625, 1.4061737060546875, 1.46282958984375, 1.5194854736328125, 1.576141357421875, 1.6327972412109375, 1.689453125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 6.0, 4.0, 4.0, 10.0, 14.0, 27.0, 32.0, 30.0, 41.0, 52.0, 78.0, 104.0, 127.0, 116.0, 84.0, 83.0, 49.0, 38.0, 18.0, 24.0, 13.0, 15.0, 8.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.65234375, -1.6004180908203125, -1.548492431640625, -1.4965667724609375, -1.44464111328125, -1.3927154541015625, -1.340789794921875, -1.2888641357421875, -1.2369384765625, -1.1850128173828125, -1.133087158203125, -1.0811614990234375, -1.02923583984375, -0.9773101806640625, -0.925384521484375, -0.8734588623046875, -0.821533203125, -0.7696075439453125, -0.717681884765625, -0.6657562255859375, -0.61383056640625, -0.5619049072265625, -0.509979248046875, -0.4580535888671875, -0.4061279296875, -0.3542022705078125, -0.302276611328125, -0.2503509521484375, -0.19842529296875, -0.1464996337890625, -0.094573974609375, -0.0426483154296875, 0.00927734375, 0.0612030029296875, 0.113128662109375, 0.1650543212890625, 0.21697998046875, 0.2689056396484375, 0.320831298828125, 0.3727569580078125, 0.4246826171875, 0.4766082763671875, 0.528533935546875, 0.5804595947265625, 0.63238525390625, 0.6843109130859375, 0.736236572265625, 0.7881622314453125, 0.840087890625, 0.8920135498046875, 0.943939208984375, 0.9958648681640625, 1.04779052734375, 1.0997161865234375, 1.151641845703125, 1.2035675048828125, 1.2554931640625, 1.3074188232421875, 1.359344482421875, 1.4112701416015625, 1.46319580078125, 1.5151214599609375, 1.567047119140625, 1.6189727783203125, 1.6708984375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 10.0, 18.0, 29.0, 104.0, 141.0, 201.0, 201.0, 144.0, 72.0, 43.0, 15.0, 8.0, 5.0, 5.0, 1.0, 8.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.317363739013672, -17.517105102539062, -16.716846466064453, -15.916587829589844, -15.116329193115234, -14.316070556640625, -13.515811920166016, -12.715553283691406, -11.915294647216797, -11.115036010742188, -10.314777374267578, -9.514518737792969, -8.71426010131836, -7.914001941680908, -7.113743305206299, -6.3134846687316895, -5.513226509094238, -4.712967872619629, -3.9127092361450195, -3.1124508380889893, -2.31219220161438, -1.5119338035583496, -0.7116751670837402, 0.08858346939086914, 0.8888421058654785, 1.689100742340088, 2.4893593788146973, 3.2896177768707275, 4.089876174926758, 4.890134811401367, 5.690393447875977, 6.490652084350586, 7.290910720825195, 8.091169357299805, 8.891427993774414, 9.691686630249023, 10.491945266723633, 11.292203903198242, 12.092462539672852, 12.892721176147461, 13.69297981262207, 14.49323844909668, 15.293497085571289, 16.0937557220459, 16.894014358520508, 17.694272994995117, 18.494531631469727, 19.294790267944336, 20.095046997070312, 20.895305633544922, 21.69556427001953, 22.49582290649414, 23.29608154296875, 24.09634017944336, 24.89659881591797, 25.696857452392578, 26.497116088867188, 27.297374725341797, 28.097633361816406, 28.897891998291016, 29.698150634765625, 30.498409271240234, 31.298667907714844, 32.09892654418945, 32.89918518066406]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 7.0, 3.0, 3.0, 7.0, 5.0, 4.0, 9.0, 12.0, 9.0, 16.0, 15.0, 22.0, 14.0, 23.0, 25.0, 27.0, 18.0, 24.0, 26.0, 31.0, 33.0, 28.0, 33.0, 45.0, 37.0, 33.0, 37.0, 43.0, 29.0, 41.0, 26.0, 23.0, 37.0, 33.0, 26.0, 26.0, 17.0, 26.0, 21.0, 18.0, 16.0, 13.0, 18.0, 8.0, 14.0, 7.0, 7.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-8.147621154785156, -7.870217800140381, -7.592813968658447, -7.315410614013672, -7.038006782531738, -6.760603427886963, -6.4832000732421875, -6.205796241760254, -5.9283928871154785, -5.650989532470703, -5.3735857009887695, -5.096182346343994, -4.818778991699219, -4.541375160217285, -4.26397180557251, -3.9865682125091553, -3.709164619445801, -3.4317610263824463, -3.154357433319092, -2.8769540786743164, -2.599550485610962, -2.3221468925476074, -2.044743537902832, -1.7673399448394775, -1.489936351776123, -1.2125327587127686, -0.9351292848587036, -0.6577257513999939, -0.3803222179412842, -0.10291862487792969, 0.17448484897613525, 0.4518883228302002, 0.7292919158935547, 1.0066955089569092, 1.2840989828109741, 1.561502456665039, 1.8389060497283936, 2.116309642791748, 2.3937129974365234, 2.671116590499878, 2.9485201835632324, 3.225923776626587, 3.5033273696899414, 3.780730724334717, 4.058134078979492, 4.335537910461426, 4.612941265106201, 4.890344619750977, 5.16774845123291, 5.4451518058776855, 5.722555637359619, 5.9999589920043945, 6.277362823486328, 6.5547661781311035, 6.832169532775879, 7.1095733642578125, 7.386976718902588, 7.664380073547363, 7.941783905029297, 8.21918773651123, 8.496590614318848, 8.773994445800781, 9.051398277282715, 9.328801155090332, 9.606204986572266]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 9.0, 4.0, 8.0, 8.0, 18.0, 24.0, 36.0, 53.0, 67.0, 129.0, 198.0, 298.0, 446.0, 755.0, 1263.0, 2102.0, 3567.0, 6627.0, 12390.0, 24057.0, 47729.0, 103703.0, 240636.0, 597449.0, 1226056.0, 1087279.0, 483419.0, 191015.0, 82298.0, 39210.0, 19831.0, 10343.0, 5623.0, 3017.0, 1791.0, 1011.0, 625.0, 393.0, 284.0, 171.0, 101.0, 73.0, 49.0, 36.0, 20.0, 18.0, 16.0, 12.0, 9.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2119140625, -1.1726531982421875, -1.133392333984375, -1.0941314697265625, -1.05487060546875, -1.0156097412109375, -0.976348876953125, -0.9370880126953125, -0.8978271484375, -0.8585662841796875, -0.819305419921875, -0.7800445556640625, -0.74078369140625, -0.7015228271484375, -0.662261962890625, -0.6230010986328125, -0.583740234375, -0.5444793701171875, -0.505218505859375, -0.4659576416015625, -0.42669677734375, -0.3874359130859375, -0.348175048828125, -0.3089141845703125, -0.2696533203125, -0.2303924560546875, -0.191131591796875, -0.1518707275390625, -0.11260986328125, -0.0733489990234375, -0.034088134765625, 0.0051727294921875, 0.04443359375, 0.0836944580078125, 0.122955322265625, 0.1622161865234375, 0.20147705078125, 0.2407379150390625, 0.279998779296875, 0.3192596435546875, 0.3585205078125, 0.3977813720703125, 0.437042236328125, 0.4763031005859375, 0.51556396484375, 0.5548248291015625, 0.594085693359375, 0.6333465576171875, 0.672607421875, 0.7118682861328125, 0.751129150390625, 0.7903900146484375, 0.82965087890625, 0.8689117431640625, 0.908172607421875, 0.9474334716796875, 0.9866943359375, 1.0259552001953125, 1.065216064453125, 1.1044769287109375, 1.14373779296875, 1.1829986572265625, 1.222259521484375, 1.2615203857421875, 1.30078125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 6.0, 5.0, 15.0, 6.0, 14.0, 14.0, 16.0, 18.0, 16.0, 30.0, 27.0, 33.0, 23.0, 29.0, 44.0, 33.0, 36.0, 46.0, 43.0, 30.0, 49.0, 58.0, 37.0, 50.0, 36.0, 37.0, 40.0, 24.0, 30.0, 28.0, 19.0, 18.0, 16.0, 14.0, 7.0, 10.0, 9.0, 6.0, 9.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.228515625, -1.1877899169921875, -1.147064208984375, -1.1063385009765625, -1.06561279296875, -1.0248870849609375, -0.984161376953125, -0.9434356689453125, -0.9027099609375, -0.8619842529296875, -0.821258544921875, -0.7805328369140625, -0.73980712890625, -0.6990814208984375, -0.658355712890625, -0.6176300048828125, -0.576904296875, -0.5361785888671875, -0.495452880859375, -0.4547271728515625, -0.41400146484375, -0.3732757568359375, -0.332550048828125, -0.2918243408203125, -0.2510986328125, -0.2103729248046875, -0.169647216796875, -0.1289215087890625, -0.08819580078125, -0.0474700927734375, -0.006744384765625, 0.0339813232421875, 0.07470703125, 0.1154327392578125, 0.156158447265625, 0.1968841552734375, 0.23760986328125, 0.2783355712890625, 0.319061279296875, 0.3597869873046875, 0.4005126953125, 0.4412384033203125, 0.481964111328125, 0.5226898193359375, 0.56341552734375, 0.6041412353515625, 0.644866943359375, 0.6855926513671875, 0.726318359375, 0.7670440673828125, 0.807769775390625, 0.8484954833984375, 0.88922119140625, 0.9299468994140625, 0.970672607421875, 1.0113983154296875, 1.0521240234375, 1.0928497314453125, 1.133575439453125, 1.1743011474609375, 1.21502685546875, 1.2557525634765625, 1.296478271484375, 1.3372039794921875, 1.3779296875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 9.0, 8.0, 8.0, 11.0, 15.0, 32.0, 41.0, 51.0, 84.0, 146.0, 181.0, 324.0, 493.0, 831.0, 1389.0, 2571.0, 5223.0, 11748.0, 31405.0, 102533.0, 414115.0, 2330591.0, 1014427.0, 190671.0, 53705.0, 18227.0, 7318.0, 3508.0, 1830.0, 1031.0, 643.0, 374.0, 255.0, 153.0, 116.0, 59.0, 44.0, 33.0, 14.0, 12.0, 10.0, 9.0, 12.0, 6.0, 7.0, 5.0, 4.0, 1.0, 0.0, 2.0, 3.0], "bins": [-3.30859375, -3.213348388671875, -3.11810302734375, -3.022857666015625, -2.9276123046875, -2.832366943359375, -2.73712158203125, -2.641876220703125, -2.546630859375, -2.451385498046875, -2.35614013671875, -2.260894775390625, -2.1656494140625, -2.070404052734375, -1.97515869140625, -1.879913330078125, -1.78466796875, -1.689422607421875, -1.59417724609375, -1.498931884765625, -1.4036865234375, -1.308441162109375, -1.21319580078125, -1.117950439453125, -1.022705078125, -0.927459716796875, -0.83221435546875, -0.736968994140625, -0.6417236328125, -0.546478271484375, -0.45123291015625, -0.355987548828125, -0.2607421875, -0.165496826171875, -0.07025146484375, 0.024993896484375, 0.1202392578125, 0.215484619140625, 0.31072998046875, 0.405975341796875, 0.501220703125, 0.596466064453125, 0.69171142578125, 0.786956787109375, 0.8822021484375, 0.977447509765625, 1.07269287109375, 1.167938232421875, 1.26318359375, 1.358428955078125, 1.45367431640625, 1.548919677734375, 1.6441650390625, 1.739410400390625, 1.83465576171875, 1.929901123046875, 2.025146484375, 2.120391845703125, 2.21563720703125, 2.310882568359375, 2.4061279296875, 2.501373291015625, 2.59661865234375, 2.691864013671875, 2.787109375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 13.0, 10.0, 21.0, 24.0, 28.0, 42.0, 56.0, 85.0, 98.0, 120.0, 179.0, 265.0, 445.0, 620.0, 611.0, 463.0, 303.0, 178.0, 135.0, 92.0, 62.0, 62.0, 36.0, 22.0, 29.0, 16.0, 12.0, 4.0, 12.0, 3.0, 7.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4609375, -3.359283447265625, -3.25762939453125, -3.155975341796875, -3.0543212890625, -2.952667236328125, -2.85101318359375, -2.749359130859375, -2.647705078125, -2.546051025390625, -2.44439697265625, -2.342742919921875, -2.2410888671875, -2.139434814453125, -2.03778076171875, -1.936126708984375, -1.83447265625, -1.732818603515625, -1.63116455078125, -1.529510498046875, -1.4278564453125, -1.326202392578125, -1.22454833984375, -1.122894287109375, -1.021240234375, -0.919586181640625, -0.81793212890625, -0.716278076171875, -0.6146240234375, -0.512969970703125, -0.41131591796875, -0.309661865234375, -0.2080078125, -0.106353759765625, -0.00469970703125, 0.096954345703125, 0.1986083984375, 0.300262451171875, 0.40191650390625, 0.503570556640625, 0.605224609375, 0.706878662109375, 0.80853271484375, 0.910186767578125, 1.0118408203125, 1.113494873046875, 1.21514892578125, 1.316802978515625, 1.41845703125, 1.520111083984375, 1.62176513671875, 1.723419189453125, 1.8250732421875, 1.926727294921875, 2.02838134765625, 2.130035400390625, 2.231689453125, 2.333343505859375, 2.43499755859375, 2.536651611328125, 2.6383056640625, 2.739959716796875, 2.84161376953125, 2.943267822265625, 3.044921875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 16.0, 32.0, 106.0, 161.0, 200.0, 196.0, 143.0, 86.0, 30.0, 10.0, 5.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.19289016723633, -34.1256217956543, -33.058353424072266, -31.991086959838867, -30.923818588256836, -29.856550216674805, -28.789283752441406, -27.722015380859375, -26.654747009277344, -25.587478637695312, -24.52021026611328, -23.452943801879883, -22.38567543029785, -21.31840705871582, -20.251140594482422, -19.18387222290039, -18.11660385131836, -17.049335479736328, -15.982068061828613, -14.914800643920898, -13.847532272338867, -12.780263900756836, -11.712996482849121, -10.645729064941406, -9.578460693359375, -8.511192321777344, -7.443924903869629, -6.376657009124756, -5.309389114379883, -4.24212121963501, -3.1748533248901367, -2.1075854301452637, -1.040313720703125, 0.026954174041748047, 1.094222068786621, 2.161489963531494, 3.228757858276367, 4.29602575302124, 5.363293647766113, 6.430561542510986, 7.497829437255859, 8.56509780883789, 9.632365226745605, 10.69963264465332, 11.766901016235352, 12.834169387817383, 13.901436805725098, 14.968704223632812, 16.035972595214844, 17.103240966796875, 18.170509338378906, 19.237775802612305, 20.305044174194336, 21.372312545776367, 22.439579010009766, 23.506847381591797, 24.574115753173828, 25.64138412475586, 26.70865249633789, 27.77591896057129, 28.84318733215332, 29.91045570373535, 30.97772216796875, 32.04499053955078, 33.11225891113281]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 8.0, 12.0, 13.0, 13.0, 11.0, 11.0, 21.0, 17.0, 26.0, 25.0, 32.0, 35.0, 40.0, 65.0, 47.0, 54.0, 54.0, 47.0, 43.0, 52.0, 43.0, 53.0, 33.0, 39.0, 34.0, 27.0, 32.0, 27.0, 21.0, 14.0, 15.0, 14.0, 7.0, 5.0, 4.0, 7.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.87087345123291, -10.498376846313477, -10.125879287719727, -9.753382682800293, -9.38088607788086, -9.00838851928711, -8.635891914367676, -8.263395309448242, -7.89089822769165, -7.518401145935059, -7.145904541015625, -6.773407459259033, -6.400910377502441, -6.028413772583008, -5.655916690826416, -5.283419609069824, -4.910923004150391, -4.538425922393799, -4.165929317474365, -3.7934322357177734, -3.4209353923797607, -3.048438549041748, -2.6759414672851562, -2.3034446239471436, -1.9309477806091309, -1.5584509372711182, -1.185953974723816, -0.8134570121765137, -0.440960168838501, -0.06846332550048828, 0.3040337562561035, 0.6765305995941162, 1.049027442932129, 1.4215242862701416, 1.7940212488174438, 2.166518211364746, 2.539015054702759, 2.9115118980407715, 3.2840089797973633, 3.656505823135376, 4.029002666473389, 4.4014997482299805, 4.773996353149414, 5.146493434906006, 5.518990516662598, 5.891487121582031, 6.263984203338623, 6.636481285095215, 7.008977890014648, 7.38147497177124, 7.753971576690674, 8.126468658447266, 8.4989652633667, 8.871461868286133, 9.243959426879883, 9.616456031799316, 9.98895263671875, 10.361449241638184, 10.733946800231934, 11.106443405151367, 11.4789400100708, 11.851436614990234, 12.223934173583984, 12.596430778503418, 12.968928337097168]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 6.0, 3.0, 5.0, 9.0, 9.0, 20.0, 25.0, 47.0, 39.0, 84.0, 105.0, 174.0, 238.0, 360.0, 462.0, 681.0, 1104.0, 1573.0, 2612.0, 4223.0, 7201.0, 13339.0, 26423.0, 54307.0, 108470.0, 188520.0, 234765.0, 186429.0, 106691.0, 53125.0, 25673.0, 13297.0, 6984.0, 4003.0, 2555.0, 1618.0, 1080.0, 738.0, 493.0, 339.0, 211.0, 184.0, 101.0, 81.0, 48.0, 37.0, 24.0, 20.0, 14.0, 11.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2099609375, -1.1659393310546875, -1.121917724609375, -1.0778961181640625, -1.03387451171875, -0.9898529052734375, -0.945831298828125, -0.9018096923828125, -0.8577880859375, -0.8137664794921875, -0.769744873046875, -0.7257232666015625, -0.68170166015625, -0.6376800537109375, -0.593658447265625, -0.5496368408203125, -0.505615234375, -0.4615936279296875, -0.417572021484375, -0.3735504150390625, -0.32952880859375, -0.2855072021484375, -0.241485595703125, -0.1974639892578125, -0.1534423828125, -0.1094207763671875, -0.065399169921875, -0.0213775634765625, 0.02264404296875, 0.0666656494140625, 0.110687255859375, 0.1547088623046875, 0.19873046875, 0.2427520751953125, 0.286773681640625, 0.3307952880859375, 0.37481689453125, 0.4188385009765625, 0.462860107421875, 0.5068817138671875, 0.5509033203125, 0.5949249267578125, 0.638946533203125, 0.6829681396484375, 0.72698974609375, 0.7710113525390625, 0.815032958984375, 0.8590545654296875, 0.903076171875, 0.9470977783203125, 0.991119384765625, 1.0351409912109375, 1.07916259765625, 1.1231842041015625, 1.167205810546875, 1.2112274169921875, 1.2552490234375, 1.2992706298828125, 1.343292236328125, 1.3873138427734375, 1.43133544921875, 1.4753570556640625, 1.519378662109375, 1.5634002685546875, 1.607421875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 9.0, 3.0, 11.0, 11.0, 10.0, 10.0, 11.0, 18.0, 14.0, 16.0, 29.0, 23.0, 26.0, 19.0, 35.0, 44.0, 51.0, 32.0, 42.0, 42.0, 40.0, 37.0, 44.0, 40.0, 40.0, 50.0, 38.0, 27.0, 29.0, 27.0, 20.0, 22.0, 21.0, 28.0, 19.0, 13.0, 9.0, 7.0, 9.0, 7.0, 7.0, 3.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1650390625, -1.12353515625, -1.08203125, -1.04052734375, -0.9990234375, -0.95751953125, -0.916015625, -0.87451171875, -0.8330078125, -0.79150390625, -0.75, -0.70849609375, -0.6669921875, -0.62548828125, -0.583984375, -0.54248046875, -0.5009765625, -0.45947265625, -0.41796875, -0.37646484375, -0.3349609375, -0.29345703125, -0.251953125, -0.21044921875, -0.1689453125, -0.12744140625, -0.0859375, -0.04443359375, -0.0029296875, 0.03857421875, 0.080078125, 0.12158203125, 0.1630859375, 0.20458984375, 0.24609375, 0.28759765625, 0.3291015625, 0.37060546875, 0.412109375, 0.45361328125, 0.4951171875, 0.53662109375, 0.578125, 0.61962890625, 0.6611328125, 0.70263671875, 0.744140625, 0.78564453125, 0.8271484375, 0.86865234375, 0.91015625, 0.95166015625, 0.9931640625, 1.03466796875, 1.076171875, 1.11767578125, 1.1591796875, 1.20068359375, 1.2421875, 1.28369140625, 1.3251953125, 1.36669921875, 1.408203125, 1.44970703125, 1.4912109375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 5.0, 5.0, 9.0, 8.0, 9.0, 14.0, 32.0, 40.0, 90.0, 156.0, 276.0, 681.0, 1579.0, 4588.0, 17124.0, 95285.0, 484260.0, 365238.0, 61329.0, 11878.0, 3531.0, 1310.0, 538.0, 247.0, 123.0, 65.0, 42.0, 35.0, 17.0, 15.0, 7.0, 4.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.376953125, -3.255828857421875, -3.13470458984375, -3.013580322265625, -2.8924560546875, -2.771331787109375, -2.65020751953125, -2.529083251953125, -2.407958984375, -2.286834716796875, -2.16571044921875, -2.044586181640625, -1.9234619140625, -1.802337646484375, -1.68121337890625, -1.560089111328125, -1.43896484375, -1.317840576171875, -1.19671630859375, -1.075592041015625, -0.9544677734375, -0.833343505859375, -0.71221923828125, -0.591094970703125, -0.469970703125, -0.348846435546875, -0.22772216796875, -0.106597900390625, 0.0145263671875, 0.135650634765625, 0.25677490234375, 0.377899169921875, 0.4990234375, 0.620147705078125, 0.74127197265625, 0.862396240234375, 0.9835205078125, 1.104644775390625, 1.22576904296875, 1.346893310546875, 1.468017578125, 1.589141845703125, 1.71026611328125, 1.831390380859375, 1.9525146484375, 2.073638916015625, 2.19476318359375, 2.315887451171875, 2.43701171875, 2.558135986328125, 2.67926025390625, 2.800384521484375, 2.9215087890625, 3.042633056640625, 3.16375732421875, 3.284881591796875, 3.406005859375, 3.527130126953125, 3.64825439453125, 3.769378662109375, 3.8905029296875, 4.011627197265625, 4.13275146484375, 4.253875732421875, 4.375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 9.0, 4.0, 7.0, 15.0, 10.0, 14.0, 7.0, 13.0, 18.0, 22.0, 23.0, 34.0, 30.0, 32.0, 34.0, 29.0, 33.0, 46.0, 38.0, 49.0, 45.0, 48.0, 36.0, 43.0, 35.0, 29.0, 33.0, 29.0, 23.0, 29.0, 24.0, 22.0, 20.0, 22.0, 19.0, 14.0, 11.0, 11.0, 9.0, 6.0, 6.0, 5.0, 5.0, 1.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.046875, -3.927520751953125, -3.80816650390625, -3.688812255859375, -3.5694580078125, -3.450103759765625, -3.33074951171875, -3.211395263671875, -3.092041015625, -2.972686767578125, -2.85333251953125, -2.733978271484375, -2.6146240234375, -2.495269775390625, -2.37591552734375, -2.256561279296875, -2.13720703125, -2.017852783203125, -1.89849853515625, -1.779144287109375, -1.6597900390625, -1.540435791015625, -1.42108154296875, -1.301727294921875, -1.182373046875, -1.063018798828125, -0.94366455078125, -0.824310302734375, -0.7049560546875, -0.585601806640625, -0.46624755859375, -0.346893310546875, -0.2275390625, -0.108184814453125, 0.01116943359375, 0.130523681640625, 0.2498779296875, 0.369232177734375, 0.48858642578125, 0.607940673828125, 0.727294921875, 0.846649169921875, 0.96600341796875, 1.085357666015625, 1.2047119140625, 1.324066162109375, 1.44342041015625, 1.562774658203125, 1.68212890625, 1.801483154296875, 1.92083740234375, 2.040191650390625, 2.1595458984375, 2.278900146484375, 2.39825439453125, 2.517608642578125, 2.636962890625, 2.756317138671875, 2.87567138671875, 2.995025634765625, 3.1143798828125, 3.233734130859375, 3.35308837890625, 3.472442626953125, 3.591796875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 8.0, 15.0, 15.0, 14.0, 20.0, 45.0, 55.0, 94.0, 113.0, 215.0, 367.0, 603.0, 940.0, 1641.0, 2828.0, 5404.0, 9763.0, 18524.0, 36992.0, 74188.0, 146697.0, 238706.0, 231991.0, 137786.0, 68999.0, 34199.0, 17580.0, 9128.0, 4979.0, 2773.0, 1558.0, 925.0, 550.0, 274.0, 195.0, 134.0, 73.0, 39.0, 32.0, 27.0, 19.0, 14.0, 9.0, 10.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.7646484375, -0.7407150268554688, -0.7167816162109375, -0.6928482055664062, -0.668914794921875, -0.6449813842773438, -0.6210479736328125, -0.5971145629882812, -0.57318115234375, -0.5492477416992188, -0.5253143310546875, -0.5013809204101562, -0.477447509765625, -0.45351409912109375, -0.4295806884765625, -0.40564727783203125, -0.3817138671875, -0.35778045654296875, -0.3338470458984375, -0.30991363525390625, -0.285980224609375, -0.26204681396484375, -0.2381134033203125, -0.21417999267578125, -0.19024658203125, -0.16631317138671875, -0.1423797607421875, -0.11844635009765625, -0.094512939453125, -0.07057952880859375, -0.0466461181640625, -0.02271270751953125, 0.001220703125, 0.02515411376953125, 0.0490875244140625, 0.07302093505859375, 0.096954345703125, 0.12088775634765625, 0.1448211669921875, 0.16875457763671875, 0.19268798828125, 0.21662139892578125, 0.2405548095703125, 0.26448822021484375, 0.288421630859375, 0.31235504150390625, 0.3362884521484375, 0.36022186279296875, 0.3841552734375, 0.40808868408203125, 0.4320220947265625, 0.45595550537109375, 0.479888916015625, 0.5038223266601562, 0.5277557373046875, 0.5516891479492188, 0.57562255859375, 0.5995559692382812, 0.6234893798828125, 0.6474227905273438, 0.671356201171875, 0.6952896118164062, 0.7192230224609375, 0.7431564331054688, 0.76708984375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 6.0, 4.0, 10.0, 9.0, 19.0, 22.0, 24.0, 13.0, 21.0, 33.0, 38.0, 60.0, 61.0, 70.0, 88.0, 72.0, 77.0, 75.0, 52.0, 54.0, 30.0, 32.0, 24.0, 24.0, 12.0, 18.0, 5.0, 11.0, 9.0, 5.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001952648162841797, -0.00018782168626785278, -0.00018037855625152588, -0.00017293542623519897, -0.00016549229621887207, -0.00015804916620254517, -0.00015060603618621826, -0.00014316290616989136, -0.00013571977615356445, -0.00012827664613723755, -0.00012083351612091064, -0.00011339038610458374, -0.00010594725608825684, -9.850412607192993e-05, -9.106099605560303e-05, -8.361786603927612e-05, -7.617473602294922e-05, -6.873160600662231e-05, -6.128847599029541e-05, -5.3845345973968506e-05, -4.64022159576416e-05, -3.89590859413147e-05, -3.151595592498779e-05, -2.407282590866089e-05, -1.6629695892333984e-05, -9.18656587600708e-06, -1.7434358596801758e-06, 5.6996941566467285e-06, 1.3142824172973633e-05, 2.0585954189300537e-05, 2.802908420562744e-05, 3.5472214221954346e-05, 4.291534423828125e-05, 5.0358474254608154e-05, 5.780160427093506e-05, 6.524473428726196e-05, 7.268786430358887e-05, 8.013099431991577e-05, 8.757412433624268e-05, 9.501725435256958e-05, 0.00010246038436889648, 0.00010990351438522339, 0.00011734664440155029, 0.0001247897744178772, 0.0001322329044342041, 0.000139676034450531, 0.0001471191644668579, 0.00015456229448318481, 0.00016200542449951172, 0.00016944855451583862, 0.00017689168453216553, 0.00018433481454849243, 0.00019177794456481934, 0.00019922107458114624, 0.00020666420459747314, 0.00021410733461380005, 0.00022155046463012695, 0.00022899359464645386, 0.00023643672466278076, 0.00024387985467910767, 0.00025132298469543457, 0.0002587661147117615, 0.0002662092447280884, 0.0002736523747444153, 0.0002810955047607422]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 7.0, 8.0, 17.0, 10.0, 14.0, 19.0, 42.0, 39.0, 61.0, 83.0, 126.0, 196.0, 322.0, 476.0, 796.0, 1288.0, 2221.0, 3867.0, 7057.0, 13404.0, 25544.0, 49903.0, 99087.0, 181503.0, 243078.0, 193721.0, 109138.0, 55611.0, 28514.0, 14471.0, 7707.0, 4110.0, 2457.0, 1328.0, 842.0, 490.0, 329.0, 244.0, 132.0, 84.0, 55.0, 29.0, 36.0, 27.0, 13.0, 15.0, 11.0, 6.0, 7.0, 0.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.75146484375, -0.7283935546875, -0.705322265625, -0.6822509765625, -0.6591796875, -0.6361083984375, -0.613037109375, -0.5899658203125, -0.56689453125, -0.5438232421875, -0.520751953125, -0.4976806640625, -0.474609375, -0.4515380859375, -0.428466796875, -0.4053955078125, -0.38232421875, -0.3592529296875, -0.336181640625, -0.3131103515625, -0.2900390625, -0.2669677734375, -0.243896484375, -0.2208251953125, -0.19775390625, -0.1746826171875, -0.151611328125, -0.1285400390625, -0.10546875, -0.0823974609375, -0.059326171875, -0.0362548828125, -0.01318359375, 0.0098876953125, 0.032958984375, 0.0560302734375, 0.0791015625, 0.1021728515625, 0.125244140625, 0.1483154296875, 0.17138671875, 0.1944580078125, 0.217529296875, 0.2406005859375, 0.263671875, 0.2867431640625, 0.309814453125, 0.3328857421875, 0.35595703125, 0.3790283203125, 0.402099609375, 0.4251708984375, 0.4482421875, 0.4713134765625, 0.494384765625, 0.5174560546875, 0.54052734375, 0.5635986328125, 0.586669921875, 0.6097412109375, 0.6328125, 0.6558837890625, 0.678955078125, 0.7020263671875, 0.72509765625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 7.0, 8.0, 7.0, 10.0, 8.0, 7.0, 13.0, 21.0, 19.0, 14.0, 27.0, 28.0, 32.0, 37.0, 47.0, 48.0, 47.0, 39.0, 60.0, 45.0, 45.0, 50.0, 55.0, 46.0, 50.0, 38.0, 28.0, 23.0, 15.0, 20.0, 12.0, 16.0, 19.0, 8.0, 11.0, 8.0, 10.0, 8.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7373046875, -0.7116241455078125, -0.685943603515625, -0.6602630615234375, -0.63458251953125, -0.6089019775390625, -0.583221435546875, -0.5575408935546875, -0.5318603515625, -0.5061798095703125, -0.480499267578125, -0.4548187255859375, -0.42913818359375, -0.4034576416015625, -0.377777099609375, -0.3520965576171875, -0.326416015625, -0.3007354736328125, -0.275054931640625, -0.2493743896484375, -0.22369384765625, -0.1980133056640625, -0.172332763671875, -0.1466522216796875, -0.1209716796875, -0.0952911376953125, -0.069610595703125, -0.0439300537109375, -0.01824951171875, 0.0074310302734375, 0.033111572265625, 0.0587921142578125, 0.08447265625, 0.1101531982421875, 0.135833740234375, 0.1615142822265625, 0.18719482421875, 0.2128753662109375, 0.238555908203125, 0.2642364501953125, 0.2899169921875, 0.3155975341796875, 0.341278076171875, 0.3669586181640625, 0.39263916015625, 0.4183197021484375, 0.444000244140625, 0.4696807861328125, 0.495361328125, 0.5210418701171875, 0.546722412109375, 0.5724029541015625, 0.59808349609375, 0.6237640380859375, 0.649444580078125, 0.6751251220703125, 0.7008056640625, 0.7264862060546875, 0.752166748046875, 0.7778472900390625, 0.80352783203125, 0.8292083740234375, 0.854888916015625, 0.8805694580078125, 0.90625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 11.0, 20.0, 41.0, 80.0, 126.0, 133.0, 193.0, 143.0, 101.0, 64.0, 25.0, 27.0, 12.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-21.16817855834961, -20.616348266601562, -20.064517974853516, -19.51268768310547, -18.960857391357422, -18.409029006958008, -17.85719871520996, -17.305368423461914, -16.753538131713867, -16.20170783996582, -15.649877548217773, -15.098048210144043, -14.546217918395996, -13.99438762664795, -13.442558288574219, -12.890727996826172, -12.338897705078125, -11.787067413330078, -11.235237121582031, -10.6834077835083, -10.131577491760254, -9.579747200012207, -9.027917861938477, -8.47608757019043, -7.924257278442383, -7.372426986694336, -6.820597171783447, -6.268767356872559, -5.716937065124512, -5.165106773376465, -4.613276958465576, -4.0614471435546875, -3.5096168518066406, -2.957786798477173, -2.405956745147705, -1.8541266918182373, -1.3022966384887695, -0.7504665851593018, -0.19863653182983398, 0.3531935214996338, 0.9050235748291016, 1.4568536281585693, 2.008683681488037, 2.560513734817505, 3.1123437881469727, 3.6641738414764404, 4.216003894805908, 4.767833709716797, 5.319664001464844, 5.871494293212891, 6.423324108123779, 6.975153923034668, 7.526984214782715, 8.078814506530762, 8.630643844604492, 9.182474136352539, 9.734304428100586, 10.286134719848633, 10.83796501159668, 11.38979434967041, 11.941624641418457, 12.493454933166504, 13.045284271240234, 13.597114562988281, 14.148944854736328]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 10.0, 6.0, 6.0, 8.0, 9.0, 12.0, 17.0, 12.0, 21.0, 24.0, 25.0, 36.0, 28.0, 35.0, 40.0, 22.0, 43.0, 39.0, 38.0, 38.0, 30.0, 36.0, 42.0, 35.0, 43.0, 38.0, 33.0, 31.0, 30.0, 33.0, 21.0, 22.0, 32.0, 10.0, 16.0, 18.0, 12.0, 7.0, 13.0, 7.0, 7.0, 1.0, 6.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-10.391742706298828, -10.084712028503418, -9.777681350708008, -9.470651626586914, -9.163620948791504, -8.856590270996094, -8.549559593200684, -8.242528915405273, -7.9354987144470215, -7.628468036651611, -7.321437835693359, -7.014407157897949, -6.707376480102539, -6.400346279144287, -6.093315601348877, -5.786285400390625, -5.479254722595215, -5.172224044799805, -4.865193843841553, -4.558163166046143, -4.251132965087891, -3.9441022872924805, -3.6370716094970703, -3.3300411701202393, -3.023010730743408, -2.715980291366577, -2.408949851989746, -2.101919174194336, -1.7948887348175049, -1.4878582954406738, -1.1808277368545532, -0.8737971782684326, -0.5667667388916016, -0.25973623991012573, 0.0472942590713501, 0.3543247580528259, 0.6613552570343018, 0.9683856964111328, 1.2754162549972534, 1.582446813583374, 1.889477252960205, 2.196507692337036, 2.503538131713867, 2.8105688095092773, 3.1175992488861084, 3.4246296882629395, 3.7316603660583496, 4.038690567016602, 4.345721244812012, 4.652751922607422, 4.959782123565674, 5.266812801361084, 5.573843002319336, 5.880873680114746, 6.187904357910156, 6.494935035705566, 6.801965236663818, 7.1089959144592285, 7.4160261154174805, 7.723056793212891, 8.0300874710083, 8.337118148803711, 8.644147872924805, 8.951178550720215, 9.258209228515625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 1.0, 5.0, 6.0, 6.0, 12.0, 23.0, 24.0, 51.0, 59.0, 102.0, 145.0, 228.0, 366.0, 596.0, 1139.0, 2131.0, 4168.0, 8982.0, 20333.0, 51905.0, 154817.0, 537743.0, 1494435.0, 1292555.0, 423268.0, 125667.0, 42989.0, 17162.0, 7579.0, 3570.0, 1789.0, 958.0, 554.0, 305.0, 216.0, 123.0, 91.0, 46.0, 45.0, 27.0, 20.0, 11.0, 9.0, 7.0, 6.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5068359375, -1.4546966552734375, -1.402557373046875, -1.3504180908203125, -1.29827880859375, -1.2461395263671875, -1.194000244140625, -1.1418609619140625, -1.0897216796875, -1.0375823974609375, -0.985443115234375, -0.9333038330078125, -0.88116455078125, -0.8290252685546875, -0.776885986328125, -0.7247467041015625, -0.672607421875, -0.6204681396484375, -0.568328857421875, -0.5161895751953125, -0.46405029296875, -0.4119110107421875, -0.359771728515625, -0.3076324462890625, -0.2554931640625, -0.2033538818359375, -0.151214599609375, -0.0990753173828125, -0.04693603515625, 0.0052032470703125, 0.057342529296875, 0.1094818115234375, 0.16162109375, 0.2137603759765625, 0.265899658203125, 0.3180389404296875, 0.37017822265625, 0.4223175048828125, 0.474456787109375, 0.5265960693359375, 0.5787353515625, 0.6308746337890625, 0.683013916015625, 0.7351531982421875, 0.78729248046875, 0.8394317626953125, 0.891571044921875, 0.9437103271484375, 0.995849609375, 1.0479888916015625, 1.100128173828125, 1.1522674560546875, 1.20440673828125, 1.2565460205078125, 1.308685302734375, 1.3608245849609375, 1.4129638671875, 1.4651031494140625, 1.517242431640625, 1.5693817138671875, 1.62152099609375, 1.6736602783203125, 1.725799560546875, 1.7779388427734375, 1.830078125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 2.0, 4.0, 7.0, 5.0, 4.0, 8.0, 9.0, 6.0, 7.0, 14.0, 14.0, 19.0, 25.0, 29.0, 17.0, 21.0, 29.0, 23.0, 32.0, 34.0, 26.0, 42.0, 43.0, 31.0, 40.0, 37.0, 41.0, 33.0, 53.0, 35.0, 31.0, 33.0, 24.0, 19.0, 26.0, 17.0, 17.0, 26.0, 15.0, 17.0, 21.0, 6.0, 8.0, 6.0, 11.0, 7.0, 7.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-1.28515625, -1.2471923828125, -1.209228515625, -1.1712646484375, -1.13330078125, -1.0953369140625, -1.057373046875, -1.0194091796875, -0.9814453125, -0.9434814453125, -0.905517578125, -0.8675537109375, -0.82958984375, -0.7916259765625, -0.753662109375, -0.7156982421875, -0.677734375, -0.6397705078125, -0.601806640625, -0.5638427734375, -0.52587890625, -0.4879150390625, -0.449951171875, -0.4119873046875, -0.3740234375, -0.3360595703125, -0.298095703125, -0.2601318359375, -0.22216796875, -0.1842041015625, -0.146240234375, -0.1082763671875, -0.0703125, -0.0323486328125, 0.005615234375, 0.0435791015625, 0.08154296875, 0.1195068359375, 0.157470703125, 0.1954345703125, 0.2333984375, 0.2713623046875, 0.309326171875, 0.3472900390625, 0.38525390625, 0.4232177734375, 0.461181640625, 0.4991455078125, 0.537109375, 0.5750732421875, 0.613037109375, 0.6510009765625, 0.68896484375, 0.7269287109375, 0.764892578125, 0.8028564453125, 0.8408203125, 0.8787841796875, 0.916748046875, 0.9547119140625, 0.99267578125, 1.0306396484375, 1.068603515625, 1.1065673828125, 1.14453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 5.0, 10.0, 12.0, 20.0, 43.0, 46.0, 80.0, 117.0, 164.0, 224.0, 360.0, 691.0, 1096.0, 2014.0, 4085.0, 8470.0, 20142.0, 52206.0, 157608.0, 672470.0, 2344050.0, 681461.0, 157983.0, 52834.0, 20260.0, 8789.0, 4066.0, 2126.0, 1102.0, 639.0, 390.0, 247.0, 143.0, 92.0, 79.0, 44.0, 22.0, 16.0, 22.0, 14.0, 6.0, 2.0, 10.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2734375, -2.196380615234375, -2.11932373046875, -2.042266845703125, -1.9652099609375, -1.888153076171875, -1.81109619140625, -1.734039306640625, -1.656982421875, -1.579925537109375, -1.50286865234375, -1.425811767578125, -1.3487548828125, -1.271697998046875, -1.19464111328125, -1.117584228515625, -1.04052734375, -0.963470458984375, -0.88641357421875, -0.809356689453125, -0.7322998046875, -0.655242919921875, -0.57818603515625, -0.501129150390625, -0.424072265625, -0.347015380859375, -0.26995849609375, -0.192901611328125, -0.1158447265625, -0.038787841796875, 0.03826904296875, 0.115325927734375, 0.1923828125, 0.269439697265625, 0.34649658203125, 0.423553466796875, 0.5006103515625, 0.577667236328125, 0.65472412109375, 0.731781005859375, 0.808837890625, 0.885894775390625, 0.96295166015625, 1.040008544921875, 1.1170654296875, 1.194122314453125, 1.27117919921875, 1.348236083984375, 1.42529296875, 1.502349853515625, 1.57940673828125, 1.656463623046875, 1.7335205078125, 1.810577392578125, 1.88763427734375, 1.964691162109375, 2.041748046875, 2.118804931640625, 2.19586181640625, 2.272918701171875, 2.3499755859375, 2.427032470703125, 2.50408935546875, 2.581146240234375, 2.658203125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 5.0, 14.0, 9.0, 16.0, 24.0, 39.0, 46.0, 60.0, 102.0, 128.0, 181.0, 296.0, 451.0, 639.0, 619.0, 459.0, 307.0, 179.0, 142.0, 85.0, 61.0, 63.0, 27.0, 40.0, 14.0, 19.0, 9.0, 4.0, 8.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.814453125, -2.72064208984375, -2.6268310546875, -2.53302001953125, -2.439208984375, -2.34539794921875, -2.2515869140625, -2.15777587890625, -2.06396484375, -1.97015380859375, -1.8763427734375, -1.78253173828125, -1.688720703125, -1.59490966796875, -1.5010986328125, -1.40728759765625, -1.3134765625, -1.21966552734375, -1.1258544921875, -1.03204345703125, -0.938232421875, -0.84442138671875, -0.7506103515625, -0.65679931640625, -0.56298828125, -0.46917724609375, -0.3753662109375, -0.28155517578125, -0.187744140625, -0.09393310546875, -0.0001220703125, 0.09368896484375, 0.1875, 0.28131103515625, 0.3751220703125, 0.46893310546875, 0.562744140625, 0.65655517578125, 0.7503662109375, 0.84417724609375, 0.93798828125, 1.03179931640625, 1.1256103515625, 1.21942138671875, 1.313232421875, 1.40704345703125, 1.5008544921875, 1.59466552734375, 1.6884765625, 1.78228759765625, 1.8760986328125, 1.96990966796875, 2.063720703125, 2.15753173828125, 2.2513427734375, 2.34515380859375, 2.43896484375, 2.53277587890625, 2.6265869140625, 2.72039794921875, 2.814208984375, 2.90802001953125, 3.0018310546875, 3.09564208984375, 3.189453125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 10.0, 25.0, 64.0, 125.0, 226.0, 222.0, 159.0, 86.0, 53.0, 21.0, 10.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.38844871520996, -19.470577239990234, -18.552705764770508, -17.63483428955078, -16.716962814331055, -15.799091339111328, -14.881218910217285, -13.963347434997559, -13.045475959777832, -12.127604484558105, -11.209733009338379, -10.291860580444336, -9.37398910522461, -8.456117630004883, -7.538246154785156, -6.62037467956543, -5.702503204345703, -4.784631729125977, -3.866760015487671, -2.9488883018493652, -2.0310168266296387, -1.113145351409912, -0.19527339935302734, 0.7225980758666992, 1.6404695510864258, 2.5583410263061523, 3.476212739944458, 4.394084453582764, 5.31195592880249, 6.229827404022217, 7.147699356079102, 8.065570831298828, 8.983440399169922, 9.901311874389648, 10.819183349609375, 11.737054824829102, 12.654926300048828, 13.572797775268555, 14.490670204162598, 15.408541679382324, 16.326412200927734, 17.24428367614746, 18.162155151367188, 19.080026626586914, 19.99789810180664, 20.915769577026367, 21.833641052246094, 22.751514434814453, 23.66938591003418, 24.587257385253906, 25.505128860473633, 26.42300033569336, 27.340871810913086, 28.258743286132812, 29.176616668701172, 30.094486236572266, 31.012359619140625, 31.93023109436035, 32.84810256958008, 33.76597595214844, 34.68384552001953, 35.60171890258789, 36.519588470458984, 37.437461853027344, 38.35533142089844]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 7.0, 9.0, 10.0, 16.0, 8.0, 17.0, 17.0, 14.0, 27.0, 26.0, 34.0, 32.0, 41.0, 45.0, 33.0, 46.0, 46.0, 40.0, 37.0, 48.0, 44.0, 35.0, 42.0, 30.0, 32.0, 35.0, 30.0, 26.0, 23.0, 17.0, 16.0, 24.0, 22.0, 8.0, 11.0, 8.0, 15.0, 3.0, 5.0, 8.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.799314975738525, -7.536129951477051, -7.272944450378418, -7.009758949279785, -6.7465739250183105, -6.483388900756836, -6.220203399658203, -5.95701789855957, -5.693832874298096, -5.430647850036621, -5.167462348937988, -4.9042768478393555, -4.641091823577881, -4.377906799316406, -4.114721298217773, -3.8515360355377197, -3.588350772857666, -3.3251655101776123, -3.0619802474975586, -2.798794984817505, -2.535609722137451, -2.2724244594573975, -2.0092391967773438, -1.74605393409729, -1.4828686714172363, -1.2196834087371826, -0.9564981460571289, -0.6933128833770752, -0.4301276206970215, -0.16694235801696777, 0.09624290466308594, 0.35942816734313965, 0.6226139068603516, 0.8857991695404053, 1.148984432220459, 1.4121696949005127, 1.6753549575805664, 1.9385402202606201, 2.201725482940674, 2.4649107456207275, 2.7280960083007812, 2.991281270980835, 3.2544665336608887, 3.5176517963409424, 3.780837059020996, 4.044022560119629, 4.3072075843811035, 4.570392608642578, 4.833578109741211, 5.096763610839844, 5.359948635101318, 5.623133659362793, 5.886319160461426, 6.149504661560059, 6.412689685821533, 6.675874710083008, 6.939060211181641, 7.202245712280273, 7.465430736541748, 7.728615760803223, 7.9918012619018555, 8.254986763000488, 8.518171310424805, 8.781356811523438, 9.04454231262207]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 3.0, 7.0, 5.0, 8.0, 17.0, 27.0, 29.0, 63.0, 80.0, 137.0, 256.0, 403.0, 744.0, 1343.0, 2284.0, 4364.0, 8894.0, 19147.0, 51253.0, 169211.0, 401408.0, 258654.0, 79174.0, 26934.0, 11632.0, 5668.0, 3064.0, 1586.0, 866.0, 502.0, 276.0, 183.0, 125.0, 79.0, 53.0, 26.0, 18.0, 16.0, 10.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.767578125, -2.68023681640625, -2.5928955078125, -2.50555419921875, -2.418212890625, -2.33087158203125, -2.2435302734375, -2.15618896484375, -2.06884765625, -1.98150634765625, -1.8941650390625, -1.80682373046875, -1.719482421875, -1.63214111328125, -1.5447998046875, -1.45745849609375, -1.3701171875, -1.28277587890625, -1.1954345703125, -1.10809326171875, -1.020751953125, -0.93341064453125, -0.8460693359375, -0.75872802734375, -0.67138671875, -0.58404541015625, -0.4967041015625, -0.40936279296875, -0.322021484375, -0.23468017578125, -0.1473388671875, -0.05999755859375, 0.02734375, 0.11468505859375, 0.2020263671875, 0.28936767578125, 0.376708984375, 0.46405029296875, 0.5513916015625, 0.63873291015625, 0.72607421875, 0.81341552734375, 0.9007568359375, 0.98809814453125, 1.075439453125, 1.16278076171875, 1.2501220703125, 1.33746337890625, 1.4248046875, 1.51214599609375, 1.5994873046875, 1.68682861328125, 1.774169921875, 1.86151123046875, 1.9488525390625, 2.03619384765625, 2.12353515625, 2.21087646484375, 2.2982177734375, 2.38555908203125, 2.472900390625, 2.56024169921875, 2.6475830078125, 2.73492431640625, 2.822265625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 1.0, 5.0, 4.0, 3.0, 8.0, 8.0, 8.0, 10.0, 24.0, 14.0, 27.0, 26.0, 26.0, 32.0, 19.0, 30.0, 47.0, 35.0, 46.0, 35.0, 35.0, 44.0, 34.0, 47.0, 44.0, 40.0, 30.0, 34.0, 39.0, 24.0, 35.0, 28.0, 19.0, 22.0, 19.0, 18.0, 11.0, 16.0, 11.0, 17.0, 4.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.4072265625, -1.3636932373046875, -1.320159912109375, -1.2766265869140625, -1.23309326171875, -1.1895599365234375, -1.146026611328125, -1.1024932861328125, -1.0589599609375, -1.0154266357421875, -0.971893310546875, -0.9283599853515625, -0.88482666015625, -0.8412933349609375, -0.797760009765625, -0.7542266845703125, -0.710693359375, -0.6671600341796875, -0.623626708984375, -0.5800933837890625, -0.53656005859375, -0.4930267333984375, -0.449493408203125, -0.4059600830078125, -0.3624267578125, -0.3188934326171875, -0.275360107421875, -0.2318267822265625, -0.18829345703125, -0.1447601318359375, -0.101226806640625, -0.0576934814453125, -0.01416015625, 0.0293731689453125, 0.072906494140625, 0.1164398193359375, 0.15997314453125, 0.2035064697265625, 0.247039794921875, 0.2905731201171875, 0.3341064453125, 0.3776397705078125, 0.421173095703125, 0.4647064208984375, 0.50823974609375, 0.5517730712890625, 0.595306396484375, 0.6388397216796875, 0.682373046875, 0.7259063720703125, 0.769439697265625, 0.8129730224609375, 0.85650634765625, 0.9000396728515625, 0.943572998046875, 0.9871063232421875, 1.0306396484375, 1.0741729736328125, 1.117706298828125, 1.1612396240234375, 1.20477294921875, 1.2483062744140625, 1.291839599609375, 1.3353729248046875, 1.37890625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 10.0, 11.0, 29.0, 37.0, 57.0, 82.0, 135.0, 237.0, 402.0, 743.0, 1439.0, 2905.0, 5906.0, 12540.0, 28871.0, 80993.0, 278195.0, 411523.0, 144167.0, 45468.0, 18059.0, 8195.0, 4083.0, 2071.0, 1063.0, 562.0, 290.0, 189.0, 111.0, 66.0, 44.0, 21.0, 19.0, 9.0, 8.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.111328125, -3.02044677734375, -2.9295654296875, -2.83868408203125, -2.747802734375, -2.65692138671875, -2.5660400390625, -2.47515869140625, -2.38427734375, -2.29339599609375, -2.2025146484375, -2.11163330078125, -2.020751953125, -1.92987060546875, -1.8389892578125, -1.74810791015625, -1.6572265625, -1.56634521484375, -1.4754638671875, -1.38458251953125, -1.293701171875, -1.20281982421875, -1.1119384765625, -1.02105712890625, -0.93017578125, -0.83929443359375, -0.7484130859375, -0.65753173828125, -0.566650390625, -0.47576904296875, -0.3848876953125, -0.29400634765625, -0.203125, -0.11224365234375, -0.0213623046875, 0.06951904296875, 0.160400390625, 0.25128173828125, 0.3421630859375, 0.43304443359375, 0.52392578125, 0.61480712890625, 0.7056884765625, 0.79656982421875, 0.887451171875, 0.97833251953125, 1.0692138671875, 1.16009521484375, 1.2509765625, 1.34185791015625, 1.4327392578125, 1.52362060546875, 1.614501953125, 1.70538330078125, 1.7962646484375, 1.88714599609375, 1.97802734375, 2.06890869140625, 2.1597900390625, 2.25067138671875, 2.341552734375, 2.43243408203125, 2.5233154296875, 2.61419677734375, 2.705078125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 4.0, 3.0, 6.0, 7.0, 8.0, 15.0, 18.0, 17.0, 27.0, 25.0, 21.0, 36.0, 31.0, 41.0, 38.0, 47.0, 44.0, 46.0, 36.0, 42.0, 41.0, 48.0, 36.0, 30.0, 34.0, 38.0, 32.0, 25.0, 28.0, 23.0, 25.0, 22.0, 17.0, 15.0, 11.0, 15.0, 9.0, 5.0, 7.0, 8.0, 5.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.96875, -4.82470703125, -4.6806640625, -4.53662109375, -4.392578125, -4.24853515625, -4.1044921875, -3.96044921875, -3.81640625, -3.67236328125, -3.5283203125, -3.38427734375, -3.240234375, -3.09619140625, -2.9521484375, -2.80810546875, -2.6640625, -2.52001953125, -2.3759765625, -2.23193359375, -2.087890625, -1.94384765625, -1.7998046875, -1.65576171875, -1.51171875, -1.36767578125, -1.2236328125, -1.07958984375, -0.935546875, -0.79150390625, -0.6474609375, -0.50341796875, -0.359375, -0.21533203125, -0.0712890625, 0.07275390625, 0.216796875, 0.36083984375, 0.5048828125, 0.64892578125, 0.79296875, 0.93701171875, 1.0810546875, 1.22509765625, 1.369140625, 1.51318359375, 1.6572265625, 1.80126953125, 1.9453125, 2.08935546875, 2.2333984375, 2.37744140625, 2.521484375, 2.66552734375, 2.8095703125, 2.95361328125, 3.09765625, 3.24169921875, 3.3857421875, 3.52978515625, 3.673828125, 3.81787109375, 3.9619140625, 4.10595703125, 4.25]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 3.0, 5.0, 7.0, 7.0, 10.0, 19.0, 21.0, 39.0, 62.0, 98.0, 133.0, 192.0, 286.0, 470.0, 799.0, 1276.0, 2114.0, 3504.0, 5871.0, 9988.0, 18218.0, 33959.0, 69674.0, 150456.0, 276842.0, 238789.0, 117112.0, 54927.0, 27626.0, 14916.0, 8419.0, 4922.0, 2903.0, 1798.0, 1092.0, 694.0, 457.0, 300.0, 158.0, 122.0, 89.0, 63.0, 35.0, 23.0, 22.0, 12.0, 7.0, 3.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.779296875, -0.75482177734375, -0.7303466796875, -0.70587158203125, -0.681396484375, -0.65692138671875, -0.6324462890625, -0.60797119140625, -0.58349609375, -0.55902099609375, -0.5345458984375, -0.51007080078125, -0.485595703125, -0.46112060546875, -0.4366455078125, -0.41217041015625, -0.3876953125, -0.36322021484375, -0.3387451171875, -0.31427001953125, -0.289794921875, -0.26531982421875, -0.2408447265625, -0.21636962890625, -0.19189453125, -0.16741943359375, -0.1429443359375, -0.11846923828125, -0.093994140625, -0.06951904296875, -0.0450439453125, -0.02056884765625, 0.00390625, 0.02838134765625, 0.0528564453125, 0.07733154296875, 0.101806640625, 0.12628173828125, 0.1507568359375, 0.17523193359375, 0.19970703125, 0.22418212890625, 0.2486572265625, 0.27313232421875, 0.297607421875, 0.32208251953125, 0.3465576171875, 0.37103271484375, 0.3955078125, 0.41998291015625, 0.4444580078125, 0.46893310546875, 0.493408203125, 0.51788330078125, 0.5423583984375, 0.56683349609375, 0.59130859375, 0.61578369140625, 0.6402587890625, 0.66473388671875, 0.689208984375, 0.71368408203125, 0.7381591796875, 0.76263427734375, 0.787109375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 10.0, 6.0, 15.0, 13.0, 22.0, 20.0, 39.0, 66.0, 85.0, 73.0, 104.0, 128.0, 115.0, 82.0, 54.0, 30.0, 30.0, 21.0, 13.0, 14.0, 11.0, 7.0, 3.0, 3.0, 3.0, 7.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.0003910064697265625, -0.00037979334592819214, -0.0003685802221298218, -0.0003573670983314514, -0.00034615397453308105, -0.0003349408507347107, -0.00032372772693634033, -0.00031251460313796997, -0.0003013014793395996, -0.00029008835554122925, -0.0002788752317428589, -0.0002676621079444885, -0.00025644898414611816, -0.0002452358603477478, -0.00023402273654937744, -0.00022280961275100708, -0.00021159648895263672, -0.00020038336515426636, -0.000189170241355896, -0.00017795711755752563, -0.00016674399375915527, -0.0001555308699607849, -0.00014431774616241455, -0.0001331046223640442, -0.00012189149856567383, -0.00011067837476730347, -9.94652509689331e-05, -8.825212717056274e-05, -7.703900337219238e-05, -6.582587957382202e-05, -5.461275577545166e-05, -4.33996319770813e-05, -3.218650817871094e-05, -2.0973384380340576e-05, -9.760260581970215e-06, 1.4528632164001465e-06, 1.2665987014770508e-05, 2.387911081314087e-05, 3.509223461151123e-05, 4.630535840988159e-05, 5.751848220825195e-05, 6.873160600662231e-05, 7.994472980499268e-05, 9.115785360336304e-05, 0.0001023709774017334, 0.00011358410120010376, 0.00012479722499847412, 0.00013601034879684448, 0.00014722347259521484, 0.0001584365963935852, 0.00016964972019195557, 0.00018086284399032593, 0.0001920759677886963, 0.00020328909158706665, 0.000214502215385437, 0.00022571533918380737, 0.00023692846298217773, 0.0002481415867805481, 0.00025935471057891846, 0.0002705678343772888, 0.0002817809581756592, 0.00029299408197402954, 0.0003042072057723999, 0.00031542032957077026, 0.0003266334533691406]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 10.0, 15.0, 16.0, 21.0, 21.0, 28.0, 44.0, 61.0, 96.0, 139.0, 252.0, 408.0, 634.0, 1036.0, 1718.0, 2962.0, 5273.0, 9299.0, 16776.0, 31748.0, 62472.0, 122919.0, 214121.0, 242544.0, 160239.0, 83401.0, 42416.0, 22187.0, 11914.0, 6572.0, 3705.0, 2160.0, 1262.0, 769.0, 454.0, 291.0, 197.0, 109.0, 84.0, 55.0, 45.0, 21.0, 23.0, 17.0, 9.0, 2.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.72900390625, -0.7070541381835938, -0.6851043701171875, -0.6631546020507812, -0.641204833984375, -0.6192550659179688, -0.5973052978515625, -0.5753555297851562, -0.55340576171875, -0.5314559936523438, -0.5095062255859375, -0.48755645751953125, -0.465606689453125, -0.44365692138671875, -0.4217071533203125, -0.39975738525390625, -0.3778076171875, -0.35585784912109375, -0.3339080810546875, -0.31195831298828125, -0.290008544921875, -0.26805877685546875, -0.2461090087890625, -0.22415924072265625, -0.20220947265625, -0.18025970458984375, -0.1583099365234375, -0.13636016845703125, -0.114410400390625, -0.09246063232421875, -0.0705108642578125, -0.04856109619140625, -0.026611328125, -0.00466156005859375, 0.0172882080078125, 0.03923797607421875, 0.061187744140625, 0.08313751220703125, 0.1050872802734375, 0.12703704833984375, 0.14898681640625, 0.17093658447265625, 0.1928863525390625, 0.21483612060546875, 0.236785888671875, 0.25873565673828125, 0.2806854248046875, 0.30263519287109375, 0.3245849609375, 0.34653472900390625, 0.3684844970703125, 0.39043426513671875, 0.412384033203125, 0.43433380126953125, 0.4562835693359375, 0.47823333740234375, 0.50018310546875, 0.5221328735351562, 0.5440826416015625, 0.5660324096679688, 0.587982177734375, 0.6099319458007812, 0.6318817138671875, 0.6538314819335938, 0.67578125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 4.0, 0.0, 6.0, 5.0, 5.0, 3.0, 7.0, 17.0, 15.0, 25.0, 23.0, 24.0, 35.0, 49.0, 45.0, 64.0, 68.0, 66.0, 82.0, 67.0, 53.0, 49.0, 55.0, 49.0, 39.0, 23.0, 20.0, 19.0, 16.0, 7.0, 8.0, 8.0, 3.0, 7.0, 4.0, 4.0, 6.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-1.0849609375, -1.0515899658203125, -1.018218994140625, -0.9848480224609375, -0.95147705078125, -0.9181060791015625, -0.884735107421875, -0.8513641357421875, -0.8179931640625, -0.7846221923828125, -0.751251220703125, -0.7178802490234375, -0.68450927734375, -0.6511383056640625, -0.617767333984375, -0.5843963623046875, -0.551025390625, -0.5176544189453125, -0.484283447265625, -0.4509124755859375, -0.41754150390625, -0.3841705322265625, -0.350799560546875, -0.3174285888671875, -0.2840576171875, -0.2506866455078125, -0.217315673828125, -0.1839447021484375, -0.15057373046875, -0.1172027587890625, -0.083831787109375, -0.0504608154296875, -0.01708984375, 0.0162811279296875, 0.049652099609375, 0.0830230712890625, 0.11639404296875, 0.1497650146484375, 0.183135986328125, 0.2165069580078125, 0.2498779296875, 0.2832489013671875, 0.316619873046875, 0.3499908447265625, 0.38336181640625, 0.4167327880859375, 0.450103759765625, 0.4834747314453125, 0.516845703125, 0.5502166748046875, 0.583587646484375, 0.6169586181640625, 0.65032958984375, 0.6837005615234375, 0.717071533203125, 0.7504425048828125, 0.7838134765625, 0.8171844482421875, 0.850555419921875, 0.8839263916015625, 0.91729736328125, 0.9506683349609375, 0.984039306640625, 1.0174102783203125, 1.05078125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 9.0, 18.0, 35.0, 56.0, 91.0, 142.0, 150.0, 145.0, 129.0, 82.0, 55.0, 37.0, 21.0, 5.0, 10.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.399526596069336, -17.85553741455078, -17.311548233032227, -16.767559051513672, -16.22357177734375, -15.679581642150879, -15.13559341430664, -14.591604232788086, -14.047615051269531, -13.503625869750977, -12.959636688232422, -12.415648460388184, -11.871659278869629, -11.327670097351074, -10.783681869506836, -10.239692687988281, -9.695703506469727, -9.151714324951172, -8.607725143432617, -8.063736915588379, -7.519747734069824, -6.9757585525512695, -6.431769847869873, -5.887781143188477, -5.343791961669922, -4.799802780151367, -4.255814075469971, -3.711825132369995, -3.1678361892700195, -2.623847246170044, -2.0798583030700684, -1.5358693599700928, -0.9918804168701172, -0.4478914737701416, 0.09609746932983398, 0.6400864124298096, 1.1840753555297852, 1.7280642986297607, 2.2720532417297363, 2.816042184829712, 3.3600311279296875, 3.904020071029663, 4.448009014129639, 4.991997718811035, 5.53598690032959, 6.0799760818481445, 6.623964786529541, 7.1679534912109375, 7.711942672729492, 8.255931854248047, 8.799921035766602, 9.34390926361084, 9.887898445129395, 10.43188762664795, 10.975875854492188, 11.519865036010742, 12.063854217529297, 12.607843399047852, 13.151832580566406, 13.695820808410645, 14.2398099899292, 14.783799171447754, 15.327787399291992, 15.871776580810547, 16.4157657623291]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 8.0, 11.0, 8.0, 4.0, 14.0, 16.0, 20.0, 24.0, 17.0, 14.0, 29.0, 25.0, 21.0, 36.0, 27.0, 39.0, 36.0, 48.0, 46.0, 61.0, 37.0, 46.0, 45.0, 45.0, 28.0, 40.0, 37.0, 27.0, 43.0, 23.0, 19.0, 14.0, 17.0, 11.0, 13.0, 10.0, 4.0, 9.0, 6.0, 6.0, 7.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-11.119760513305664, -10.782817840576172, -10.445874214172363, -10.108931541442871, -9.771987915039062, -9.43504524230957, -9.098102569580078, -8.76115894317627, -8.424215316772461, -8.087272644042969, -7.75032901763916, -7.413386344909668, -7.076442718505859, -6.739500045776367, -6.402556896209717, -6.065613746643066, -5.728671073913574, -5.391727924346924, -5.054784774780273, -4.717842102050781, -4.380898475646973, -4.0439558029174805, -3.70701265335083, -3.3700695037841797, -3.0331263542175293, -2.696183204650879, -2.3592400550842285, -2.0222971439361572, -1.6853539943695068, -1.3484108448028564, -1.0114679336547852, -0.6745247840881348, -0.3375816345214844, -0.0006385445594787598, 0.33630454540252686, 0.6732475757598877, 1.010190725326538, 1.3471338748931885, 1.6840767860412598, 2.02101993560791, 2.3579630851745605, 2.694906234741211, 3.0318493843078613, 3.3687922954559326, 3.705735445022583, 4.0426788330078125, 4.379621505737305, 4.716564655303955, 5.0535078048706055, 5.390450954437256, 5.727394104003906, 6.064336776733398, 6.401280403137207, 6.738223075866699, 7.07516622543335, 7.412109375, 7.74905252456665, 8.0859956741333, 8.422938346862793, 8.759881973266602, 9.096824645996094, 9.433768272399902, 9.770710945129395, 10.107654571533203, 10.444597244262695]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 8.0, 11.0, 17.0, 25.0, 47.0, 41.0, 85.0, 121.0, 177.0, 315.0, 474.0, 789.0, 1377.0, 2344.0, 4600.0, 9323.0, 21198.0, 54897.0, 171954.0, 573074.0, 1424450.0, 1257195.0, 452721.0, 137391.0, 45822.0, 18277.0, 8357.0, 4038.0, 2139.0, 1238.0, 721.0, 391.0, 207.0, 150.0, 95.0, 62.0, 50.0, 35.0, 19.0, 17.0, 7.0, 6.0, 8.0, 0.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5791015625, -1.5225067138671875, -1.465911865234375, -1.4093170166015625, -1.35272216796875, -1.2961273193359375, -1.239532470703125, -1.1829376220703125, -1.1263427734375, -1.0697479248046875, -1.013153076171875, -0.9565582275390625, -0.89996337890625, -0.8433685302734375, -0.786773681640625, -0.7301788330078125, -0.673583984375, -0.6169891357421875, -0.560394287109375, -0.5037994384765625, -0.44720458984375, -0.3906097412109375, -0.334014892578125, -0.2774200439453125, -0.2208251953125, -0.1642303466796875, -0.107635498046875, -0.0510406494140625, 0.00555419921875, 0.0621490478515625, 0.118743896484375, 0.1753387451171875, 0.23193359375, 0.2885284423828125, 0.345123291015625, 0.4017181396484375, 0.45831298828125, 0.5149078369140625, 0.571502685546875, 0.6280975341796875, 0.6846923828125, 0.7412872314453125, 0.797882080078125, 0.8544769287109375, 0.91107177734375, 0.9676666259765625, 1.024261474609375, 1.0808563232421875, 1.137451171875, 1.1940460205078125, 1.250640869140625, 1.3072357177734375, 1.36383056640625, 1.4204254150390625, 1.477020263671875, 1.5336151123046875, 1.5902099609375, 1.6468048095703125, 1.703399658203125, 1.7599945068359375, 1.81658935546875, 1.8731842041015625, 1.929779052734375, 1.9863739013671875, 2.04296875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 2.0, 3.0, 1.0, 6.0, 7.0, 13.0, 8.0, 10.0, 17.0, 12.0, 20.0, 11.0, 27.0, 32.0, 32.0, 38.0, 38.0, 35.0, 42.0, 36.0, 53.0, 43.0, 44.0, 45.0, 45.0, 45.0, 43.0, 33.0, 33.0, 25.0, 32.0, 23.0, 21.0, 21.0, 17.0, 18.0, 11.0, 14.0, 7.0, 11.0, 7.0, 5.0, 7.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.587890625, -1.5384979248046875, -1.489105224609375, -1.4397125244140625, -1.39031982421875, -1.3409271240234375, -1.291534423828125, -1.2421417236328125, -1.1927490234375, -1.1433563232421875, -1.093963623046875, -1.0445709228515625, -0.99517822265625, -0.9457855224609375, -0.896392822265625, -0.8470001220703125, -0.797607421875, -0.7482147216796875, -0.698822021484375, -0.6494293212890625, -0.60003662109375, -0.5506439208984375, -0.501251220703125, -0.4518585205078125, -0.4024658203125, -0.3530731201171875, -0.303680419921875, -0.2542877197265625, -0.20489501953125, -0.1555023193359375, -0.106109619140625, -0.0567169189453125, -0.00732421875, 0.0420684814453125, 0.091461181640625, 0.1408538818359375, 0.19024658203125, 0.2396392822265625, 0.289031982421875, 0.3384246826171875, 0.3878173828125, 0.4372100830078125, 0.486602783203125, 0.5359954833984375, 0.58538818359375, 0.6347808837890625, 0.684173583984375, 0.7335662841796875, 0.782958984375, 0.8323516845703125, 0.881744384765625, 0.9311370849609375, 0.98052978515625, 1.0299224853515625, 1.079315185546875, 1.1287078857421875, 1.1781005859375, 1.2274932861328125, 1.276885986328125, 1.3262786865234375, 1.37567138671875, 1.4250640869140625, 1.474456787109375, 1.5238494873046875, 1.5732421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 13.0, 8.0, 22.0, 29.0, 59.0, 75.0, 127.0, 191.0, 340.0, 583.0, 1128.0, 2032.0, 4384.0, 9778.0, 25198.0, 74309.0, 270453.0, 1477128.0, 1844356.0, 343678.0, 89280.0, 29453.0, 11453.0, 4983.0, 2332.0, 1200.0, 666.0, 399.0, 220.0, 127.0, 100.0, 69.0, 30.0, 24.0, 11.0, 7.0, 10.0, 10.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.40625, -2.320556640625, -2.23486328125, -2.149169921875, -2.0634765625, -1.977783203125, -1.89208984375, -1.806396484375, -1.720703125, -1.635009765625, -1.54931640625, -1.463623046875, -1.3779296875, -1.292236328125, -1.20654296875, -1.120849609375, -1.03515625, -0.949462890625, -0.86376953125, -0.778076171875, -0.6923828125, -0.606689453125, -0.52099609375, -0.435302734375, -0.349609375, -0.263916015625, -0.17822265625, -0.092529296875, -0.0068359375, 0.078857421875, 0.16455078125, 0.250244140625, 0.3359375, 0.421630859375, 0.50732421875, 0.593017578125, 0.6787109375, 0.764404296875, 0.85009765625, 0.935791015625, 1.021484375, 1.107177734375, 1.19287109375, 1.278564453125, 1.3642578125, 1.449951171875, 1.53564453125, 1.621337890625, 1.70703125, 1.792724609375, 1.87841796875, 1.964111328125, 2.0498046875, 2.135498046875, 2.22119140625, 2.306884765625, 2.392578125, 2.478271484375, 2.56396484375, 2.649658203125, 2.7353515625, 2.821044921875, 2.90673828125, 2.992431640625, 3.078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 4.0, 8.0, 11.0, 17.0, 15.0, 14.0, 26.0, 29.0, 36.0, 60.0, 61.0, 84.0, 108.0, 151.0, 260.0, 356.0, 435.0, 468.0, 474.0, 407.0, 294.0, 178.0, 134.0, 99.0, 87.0, 50.0, 37.0, 41.0, 23.0, 17.0, 19.0, 11.0, 16.0, 8.0, 10.0, 9.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.810546875, -2.727325439453125, -2.64410400390625, -2.560882568359375, -2.4776611328125, -2.394439697265625, -2.31121826171875, -2.227996826171875, -2.144775390625, -2.061553955078125, -1.97833251953125, -1.895111083984375, -1.8118896484375, -1.728668212890625, -1.64544677734375, -1.562225341796875, -1.47900390625, -1.395782470703125, -1.31256103515625, -1.229339599609375, -1.1461181640625, -1.062896728515625, -0.97967529296875, -0.896453857421875, -0.813232421875, -0.730010986328125, -0.64678955078125, -0.563568115234375, -0.4803466796875, -0.397125244140625, -0.31390380859375, -0.230682373046875, -0.1474609375, -0.064239501953125, 0.01898193359375, 0.102203369140625, 0.1854248046875, 0.268646240234375, 0.35186767578125, 0.435089111328125, 0.518310546875, 0.601531982421875, 0.68475341796875, 0.767974853515625, 0.8511962890625, 0.934417724609375, 1.01763916015625, 1.100860595703125, 1.18408203125, 1.267303466796875, 1.35052490234375, 1.433746337890625, 1.5169677734375, 1.600189208984375, 1.68341064453125, 1.766632080078125, 1.849853515625, 1.933074951171875, 2.01629638671875, 2.099517822265625, 2.1827392578125, 2.265960693359375, 2.34918212890625, 2.432403564453125, 2.515625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 8.0, 7.0, 16.0, 32.0, 60.0, 95.0, 114.0, 171.0, 156.0, 118.0, 101.0, 54.0, 28.0, 15.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.553009033203125, -21.8864803314209, -21.219953536987305, -20.553424835205078, -19.886898040771484, -19.220369338989258, -18.55384063720703, -17.887313842773438, -17.22078514099121, -16.554256439208984, -15.88772964477539, -15.221200942993164, -14.554673194885254, -13.888145446777344, -13.221616744995117, -12.555088996887207, -11.888561248779297, -11.222033500671387, -10.555505752563477, -9.88897705078125, -9.22244930267334, -8.55592155456543, -7.889393329620361, -7.222865104675293, -6.556337356567383, -5.889809608459473, -5.223281383514404, -4.556753158569336, -3.890225410461426, -3.2236974239349365, -2.5571694374084473, -1.890641212463379, -1.2241134643554688, -0.5575854778289795, 0.10894250869750977, 0.775470495223999, 1.4419984817504883, 2.1085264682769775, 2.775054454803467, 3.441582679748535, 4.108110427856445, 4.7746381759643555, 5.441166400909424, 6.107694625854492, 6.774222373962402, 7.4407501220703125, 8.107278823852539, 8.77380657196045, 9.44033432006836, 10.10686206817627, 10.77338981628418, 11.439918518066406, 12.106446266174316, 12.772974014282227, 13.439502716064453, 14.106030464172363, 14.772558212280273, 15.439085960388184, 16.105613708496094, 16.77214241027832, 17.438671112060547, 18.10519790649414, 18.771726608276367, 19.438255310058594, 20.104782104492188]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 4.0, 8.0, 9.0, 10.0, 8.0, 13.0, 8.0, 18.0, 21.0, 27.0, 25.0, 23.0, 32.0, 28.0, 31.0, 30.0, 39.0, 38.0, 39.0, 45.0, 39.0, 41.0, 30.0, 40.0, 45.0, 31.0, 33.0, 29.0, 34.0, 34.0, 30.0, 19.0, 22.0, 20.0, 12.0, 18.0, 14.0, 7.0, 9.0, 8.0, 14.0, 6.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-9.31020736694336, -9.050949096679688, -8.791691780090332, -8.53243350982666, -8.273176193237305, -8.013917922973633, -7.754660129547119, -7.4954023361206055, -7.236144065856934, -6.97688627243042, -6.717628479003906, -6.458370208740234, -6.199112415313721, -5.939854621887207, -5.680596828460693, -5.42133903503418, -5.162081241607666, -4.902823448181152, -4.643565654754639, -4.384307861328125, -4.125049591064453, -3.8657917976379395, -3.606534004211426, -3.347276210784912, -3.0880181789398193, -2.8287603855133057, -2.569502353668213, -2.310244560241699, -2.0509867668151855, -1.7917287349700928, -1.532470941543579, -1.2732130289077759, -1.0139551162719727, -0.7546972036361694, -0.495439350605011, -0.23618149757385254, 0.023076415061950684, 0.2823343276977539, 0.5415921211242676, 0.8008500337600708, 1.060107946395874, 1.3193658590316772, 1.5786237716674805, 1.8378815650939941, 2.097139358520508, 2.3563973903656006, 2.6156551837921143, 2.874913215637207, 3.1341710090637207, 3.3934288024902344, 3.652686834335327, 3.911944627761841, 4.171202659606934, 4.430460453033447, 4.689718246459961, 4.948976039886475, 5.208233833312988, 5.467491626739502, 5.726749420166016, 5.9860076904296875, 6.245265483856201, 6.504523277282715, 6.7637810707092285, 7.023038864135742, 7.282297134399414]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 13.0, 16.0, 22.0, 22.0, 26.0, 61.0, 80.0, 103.0, 177.0, 252.0, 319.0, 469.0, 703.0, 1048.0, 1536.0, 2364.0, 3710.0, 6002.0, 9766.0, 17614.0, 39926.0, 108680.0, 272786.0, 322688.0, 152153.0, 54124.0, 22647.0, 11690.0, 6939.0, 4329.0, 2756.0, 1840.0, 1194.0, 754.0, 527.0, 355.0, 243.0, 170.0, 121.0, 87.0, 55.0, 47.0, 44.0, 24.0, 20.0, 13.0, 17.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0], "bins": [-2.578125, -2.495391845703125, -2.41265869140625, -2.329925537109375, -2.2471923828125, -2.164459228515625, -2.08172607421875, -1.998992919921875, -1.916259765625, -1.833526611328125, -1.75079345703125, -1.668060302734375, -1.5853271484375, -1.502593994140625, -1.41986083984375, -1.337127685546875, -1.25439453125, -1.171661376953125, -1.08892822265625, -1.006195068359375, -0.9234619140625, -0.840728759765625, -0.75799560546875, -0.675262451171875, -0.592529296875, -0.509796142578125, -0.42706298828125, -0.344329833984375, -0.2615966796875, -0.178863525390625, -0.09613037109375, -0.013397216796875, 0.0693359375, 0.152069091796875, 0.23480224609375, 0.317535400390625, 0.4002685546875, 0.483001708984375, 0.56573486328125, 0.648468017578125, 0.731201171875, 0.813934326171875, 0.89666748046875, 0.979400634765625, 1.0621337890625, 1.144866943359375, 1.22760009765625, 1.310333251953125, 1.39306640625, 1.475799560546875, 1.55853271484375, 1.641265869140625, 1.7239990234375, 1.806732177734375, 1.88946533203125, 1.972198486328125, 2.054931640625, 2.137664794921875, 2.22039794921875, 2.303131103515625, 2.3858642578125, 2.468597412109375, 2.55133056640625, 2.634063720703125, 2.716796875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 6.0, 8.0, 19.0, 13.0, 13.0, 15.0, 8.0, 23.0, 19.0, 30.0, 39.0, 31.0, 45.0, 27.0, 35.0, 37.0, 39.0, 39.0, 43.0, 40.0, 46.0, 39.0, 42.0, 37.0, 30.0, 31.0, 34.0, 25.0, 29.0, 23.0, 21.0, 13.0, 16.0, 15.0, 9.0, 9.0, 8.0, 5.0, 4.0, 6.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.546875, -1.49822998046875, -1.4495849609375, -1.40093994140625, -1.352294921875, -1.30364990234375, -1.2550048828125, -1.20635986328125, -1.15771484375, -1.10906982421875, -1.0604248046875, -1.01177978515625, -0.963134765625, -0.91448974609375, -0.8658447265625, -0.81719970703125, -0.7685546875, -0.71990966796875, -0.6712646484375, -0.62261962890625, -0.573974609375, -0.52532958984375, -0.4766845703125, -0.42803955078125, -0.37939453125, -0.33074951171875, -0.2821044921875, -0.23345947265625, -0.184814453125, -0.13616943359375, -0.0875244140625, -0.03887939453125, 0.009765625, 0.05841064453125, 0.1070556640625, 0.15570068359375, 0.204345703125, 0.25299072265625, 0.3016357421875, 0.35028076171875, 0.39892578125, 0.44757080078125, 0.4962158203125, 0.54486083984375, 0.593505859375, 0.64215087890625, 0.6907958984375, 0.73944091796875, 0.7880859375, 0.83673095703125, 0.8853759765625, 0.93402099609375, 0.982666015625, 1.03131103515625, 1.0799560546875, 1.12860107421875, 1.17724609375, 1.22589111328125, 1.2745361328125, 1.32318115234375, 1.371826171875, 1.42047119140625, 1.4691162109375, 1.51776123046875, 1.56640625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 9.0, 18.0, 19.0, 30.0, 52.0, 71.0, 102.0, 201.0, 332.0, 599.0, 1133.0, 2311.0, 5112.0, 11720.0, 33050.0, 146476.0, 517707.0, 249918.0, 51150.0, 15986.0, 6435.0, 2924.0, 1461.0, 758.0, 363.0, 247.0, 115.0, 90.0, 43.0, 32.0, 24.0, 23.0, 6.0, 10.0, 7.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.916015625, -3.779388427734375, -3.64276123046875, -3.506134033203125, -3.3695068359375, -3.232879638671875, -3.09625244140625, -2.959625244140625, -2.822998046875, -2.686370849609375, -2.54974365234375, -2.413116455078125, -2.2764892578125, -2.139862060546875, -2.00323486328125, -1.866607666015625, -1.72998046875, -1.593353271484375, -1.45672607421875, -1.320098876953125, -1.1834716796875, -1.046844482421875, -0.91021728515625, -0.773590087890625, -0.636962890625, -0.500335693359375, -0.36370849609375, -0.227081298828125, -0.0904541015625, 0.046173095703125, 0.18280029296875, 0.319427490234375, 0.4560546875, 0.592681884765625, 0.72930908203125, 0.865936279296875, 1.0025634765625, 1.139190673828125, 1.27581787109375, 1.412445068359375, 1.549072265625, 1.685699462890625, 1.82232666015625, 1.958953857421875, 2.0955810546875, 2.232208251953125, 2.36883544921875, 2.505462646484375, 2.64208984375, 2.778717041015625, 2.91534423828125, 3.051971435546875, 3.1885986328125, 3.325225830078125, 3.46185302734375, 3.598480224609375, 3.735107421875, 3.871734619140625, 4.00836181640625, 4.144989013671875, 4.2816162109375, 4.418243408203125, 4.55487060546875, 4.691497802734375, 4.828125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 13.0, 9.0, 10.0, 17.0, 14.0, 18.0, 17.0, 32.0, 28.0, 23.0, 33.0, 28.0, 43.0, 37.0, 44.0, 43.0, 54.0, 40.0, 48.0, 42.0, 47.0, 44.0, 25.0, 27.0, 35.0, 44.0, 26.0, 16.0, 22.0, 15.0, 17.0, 16.0, 15.0, 14.0, 9.0, 9.0, 7.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.328125, -5.17791748046875, -5.0277099609375, -4.87750244140625, -4.727294921875, -4.57708740234375, -4.4268798828125, -4.27667236328125, -4.12646484375, -3.97625732421875, -3.8260498046875, -3.67584228515625, -3.525634765625, -3.37542724609375, -3.2252197265625, -3.07501220703125, -2.9248046875, -2.77459716796875, -2.6243896484375, -2.47418212890625, -2.323974609375, -2.17376708984375, -2.0235595703125, -1.87335205078125, -1.72314453125, -1.57293701171875, -1.4227294921875, -1.27252197265625, -1.122314453125, -0.97210693359375, -0.8218994140625, -0.67169189453125, -0.521484375, -0.37127685546875, -0.2210693359375, -0.07086181640625, 0.079345703125, 0.22955322265625, 0.3797607421875, 0.52996826171875, 0.68017578125, 0.83038330078125, 0.9805908203125, 1.13079833984375, 1.281005859375, 1.43121337890625, 1.5814208984375, 1.73162841796875, 1.8818359375, 2.03204345703125, 2.1822509765625, 2.33245849609375, 2.482666015625, 2.63287353515625, 2.7830810546875, 2.93328857421875, 3.08349609375, 3.23370361328125, 3.3839111328125, 3.53411865234375, 3.684326171875, 3.83453369140625, 3.9847412109375, 4.13494873046875, 4.28515625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 15.0, 16.0, 14.0, 23.0, 46.0, 41.0, 115.0, 148.0, 220.0, 361.0, 654.0, 1093.0, 2092.0, 3742.0, 7794.0, 16562.0, 41913.0, 131893.0, 363416.0, 314317.0, 101783.0, 33993.0, 14027.0, 6751.0, 3307.0, 1777.0, 979.0, 571.0, 336.0, 220.0, 125.0, 59.0, 49.0, 34.0, 30.0, 14.0, 8.0, 6.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2021484375, -1.1656036376953125, -1.129058837890625, -1.0925140380859375, -1.05596923828125, -1.0194244384765625, -0.982879638671875, -0.9463348388671875, -0.9097900390625, -0.8732452392578125, -0.836700439453125, -0.8001556396484375, -0.76361083984375, -0.7270660400390625, -0.690521240234375, -0.6539764404296875, -0.617431640625, -0.5808868408203125, -0.544342041015625, -0.5077972412109375, -0.47125244140625, -0.4347076416015625, -0.398162841796875, -0.3616180419921875, -0.3250732421875, -0.2885284423828125, -0.251983642578125, -0.2154388427734375, -0.17889404296875, -0.1423492431640625, -0.105804443359375, -0.0692596435546875, -0.03271484375, 0.0038299560546875, 0.040374755859375, 0.0769195556640625, 0.11346435546875, 0.1500091552734375, 0.186553955078125, 0.2230987548828125, 0.2596435546875, 0.2961883544921875, 0.332733154296875, 0.3692779541015625, 0.40582275390625, 0.4423675537109375, 0.478912353515625, 0.5154571533203125, 0.552001953125, 0.5885467529296875, 0.625091552734375, 0.6616363525390625, 0.69818115234375, 0.7347259521484375, 0.771270751953125, 0.8078155517578125, 0.8443603515625, 0.8809051513671875, 0.917449951171875, 0.9539947509765625, 0.99053955078125, 1.0270843505859375, 1.063629150390625, 1.1001739501953125, 1.13671875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 7.0, 12.0, 7.0, 19.0, 17.0, 29.0, 58.0, 81.0, 123.0, 148.0, 161.0, 101.0, 81.0, 52.0, 33.0, 17.0, 21.0, 7.0, 10.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041604042053222656, -0.0004000253975391388, -0.000384010374546051, -0.00036799535155296326, -0.0003519803285598755, -0.0003359653055667877, -0.00031995028257369995, -0.0003039352595806122, -0.0002879202365875244, -0.00027190521359443665, -0.0002558901906013489, -0.0002398751676082611, -0.00022386014461517334, -0.00020784512162208557, -0.0001918300986289978, -0.00017581507563591003, -0.00015980005264282227, -0.0001437850296497345, -0.00012777000665664673, -0.00011175498366355896, -9.573996067047119e-05, -7.972493767738342e-05, -6.370991468429565e-05, -4.7694891691207886e-05, -3.167986869812012e-05, -1.566484570503235e-05, 3.501772880554199e-07, 1.636520028114319e-05, 3.238022327423096e-05, 4.8395246267318726e-05, 6.44102692604065e-05, 8.042529225349426e-05, 9.644031524658203e-05, 0.0001124553382396698, 0.00012847036123275757, 0.00014448538422584534, 0.0001605004072189331, 0.00017651543021202087, 0.00019253045320510864, 0.0002085454761981964, 0.00022456049919128418, 0.00024057552218437195, 0.0002565905451774597, 0.0002726055681705475, 0.00028862059116363525, 0.000304635614156723, 0.0003206506371498108, 0.00033666566014289856, 0.00035268068313598633, 0.0003686957061290741, 0.00038471072912216187, 0.00040072575211524963, 0.0004167407751083374, 0.00043275579810142517, 0.00044877082109451294, 0.0004647858440876007, 0.0004808008670806885, 0.0004968158900737762, 0.000512830913066864, 0.0005288459360599518, 0.0005448609590530396, 0.0005608759820461273, 0.0005768910050392151, 0.0005929060280323029, 0.0006089210510253906]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 7.0, 2.0, 2.0, 7.0, 5.0, 6.0, 15.0, 21.0, 37.0, 60.0, 88.0, 150.0, 258.0, 520.0, 940.0, 1960.0, 4656.0, 12081.0, 36615.0, 126424.0, 352589.0, 339660.0, 118205.0, 34355.0, 11436.0, 4482.0, 1903.0, 947.0, 510.0, 237.0, 162.0, 81.0, 39.0, 31.0, 26.0, 14.0, 10.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2412109375, -1.2035675048828125, -1.165924072265625, -1.1282806396484375, -1.09063720703125, -1.0529937744140625, -1.015350341796875, -0.9777069091796875, -0.9400634765625, -0.9024200439453125, -0.864776611328125, -0.8271331787109375, -0.78948974609375, -0.7518463134765625, -0.714202880859375, -0.6765594482421875, -0.638916015625, -0.6012725830078125, -0.563629150390625, -0.5259857177734375, -0.48834228515625, -0.4506988525390625, -0.413055419921875, -0.3754119873046875, -0.3377685546875, -0.3001251220703125, -0.262481689453125, -0.2248382568359375, -0.18719482421875, -0.1495513916015625, -0.111907958984375, -0.0742645263671875, -0.03662109375, 0.0010223388671875, 0.038665771484375, 0.0763092041015625, 0.11395263671875, 0.1515960693359375, 0.189239501953125, 0.2268829345703125, 0.2645263671875, 0.3021697998046875, 0.339813232421875, 0.3774566650390625, 0.41510009765625, 0.4527435302734375, 0.490386962890625, 0.5280303955078125, 0.565673828125, 0.6033172607421875, 0.640960693359375, 0.6786041259765625, 0.71624755859375, 0.7538909912109375, 0.791534423828125, 0.8291778564453125, 0.8668212890625, 0.9044647216796875, 0.942108154296875, 0.9797515869140625, 1.01739501953125, 1.0550384521484375, 1.092681884765625, 1.1303253173828125, 1.16796875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 4.0, 6.0, 4.0, 11.0, 9.0, 7.0, 12.0, 16.0, 15.0, 23.0, 31.0, 56.0, 46.0, 61.0, 76.0, 90.0, 79.0, 86.0, 69.0, 64.0, 58.0, 36.0, 33.0, 23.0, 20.0, 19.0, 10.0, 12.0, 4.0, 5.0, 5.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.1376953125, -1.1026763916015625, -1.067657470703125, -1.0326385498046875, -0.99761962890625, -0.9626007080078125, -0.927581787109375, -0.8925628662109375, -0.8575439453125, -0.8225250244140625, -0.787506103515625, -0.7524871826171875, -0.71746826171875, -0.6824493408203125, -0.647430419921875, -0.6124114990234375, -0.577392578125, -0.5423736572265625, -0.507354736328125, -0.4723358154296875, -0.43731689453125, -0.4022979736328125, -0.367279052734375, -0.3322601318359375, -0.2972412109375, -0.2622222900390625, -0.227203369140625, -0.1921844482421875, -0.15716552734375, -0.1221466064453125, -0.087127685546875, -0.0521087646484375, -0.01708984375, 0.0179290771484375, 0.052947998046875, 0.0879669189453125, 0.12298583984375, 0.1580047607421875, 0.193023681640625, 0.2280426025390625, 0.2630615234375, 0.2980804443359375, 0.333099365234375, 0.3681182861328125, 0.40313720703125, 0.4381561279296875, 0.473175048828125, 0.5081939697265625, 0.543212890625, 0.5782318115234375, 0.613250732421875, 0.6482696533203125, 0.68328857421875, 0.7183074951171875, 0.753326416015625, 0.7883453369140625, 0.8233642578125, 0.8583831787109375, 0.893402099609375, 0.9284210205078125, 0.96343994140625, 0.9984588623046875, 1.033477783203125, 1.0684967041015625, 1.103515625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 6.0, 7.0, 5.0, 9.0, 24.0, 61.0, 112.0, 169.0, 203.0, 165.0, 118.0, 60.0, 31.0, 14.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.51287841796875, -28.680252075195312, -27.847627639770508, -27.01500129699707, -26.182376861572266, -25.349750518798828, -24.51712417602539, -23.684499740600586, -22.85187339782715, -22.01924705505371, -21.186622619628906, -20.35399627685547, -19.521371841430664, -18.688745498657227, -17.856121063232422, -17.023494720458984, -16.190868377685547, -15.358242988586426, -14.525617599487305, -13.692991256713867, -12.860365867614746, -12.027740478515625, -11.195115089416504, -10.362489700317383, -9.529865264892578, -8.697239875793457, -7.864614009857178, -7.031988620758057, -6.199362754821777, -5.366737365722656, -4.534111976623535, -3.701486110687256, -2.8688602447509766, -2.0362346172332764, -1.2036091089248657, -0.3709836006164551, 0.4616420269012451, 1.2942676544189453, 2.1268930435180664, 2.9595189094543457, 3.792144298553467, 4.624769687652588, 5.457395553588867, 6.290020942687988, 7.122646331787109, 7.955272197723389, 8.787897109985352, 9.620523452758789, 10.45314884185791, 11.285774230957031, 12.118399620056152, 12.951025009155273, 13.783651351928711, 14.616276741027832, 15.448902130126953, 16.28152847290039, 17.114152908325195, 17.946779251098633, 18.779403686523438, 19.612030029296875, 20.44465446472168, 21.277280807495117, 22.109905242919922, 22.94253158569336, 23.775157928466797]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 4.0, 3.0, 5.0, 4.0, 7.0, 3.0, 6.0, 7.0, 8.0, 7.0, 8.0, 10.0, 15.0, 17.0, 8.0, 16.0, 19.0, 20.0, 24.0, 33.0, 23.0, 27.0, 25.0, 39.0, 30.0, 35.0, 38.0, 29.0, 35.0, 30.0, 34.0, 36.0, 28.0, 38.0, 28.0, 21.0, 26.0, 33.0, 30.0, 28.0, 19.0, 15.0, 21.0, 16.0, 15.0, 17.0, 10.0, 9.0, 8.0, 7.0, 4.0, 7.0, 5.0, 9.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0], "bins": [-8.335926055908203, -8.0781888961792, -7.820452690124512, -7.562715530395508, -7.304978847503662, -7.047242164611816, -6.7895050048828125, -6.531768321990967, -6.274031639099121, -6.016294956207275, -5.75855827331543, -5.500821113586426, -5.24308443069458, -4.985347747802734, -4.7276105880737305, -4.469873905181885, -4.212137222290039, -3.9544005393981934, -3.6966636180877686, -3.4389266967773438, -3.181190013885498, -2.9234533309936523, -2.6657164096832275, -2.4079794883728027, -2.150242805480957, -1.8925060033798218, -1.6347692012786865, -1.3770323991775513, -1.119295597076416, -0.8615587949752808, -0.6038219928741455, -0.34608519077301025, -0.088348388671875, 0.16938841342926025, 0.4271252155303955, 0.6848620176315308, 0.942598819732666, 1.2003356218338013, 1.4580724239349365, 1.7158092260360718, 1.973546028137207, 2.2312827110290527, 2.4890196323394775, 2.7467565536499023, 3.004493236541748, 3.2622299194335938, 3.5199668407440186, 3.7777037620544434, 4.035440444946289, 4.293177127838135, 4.5509138107299805, 4.808650970458984, 5.06638765335083, 5.324124336242676, 5.58186149597168, 5.839598178863525, 6.097334861755371, 6.355071544647217, 6.6128082275390625, 6.870545387268066, 7.128282070159912, 7.386018753051758, 7.643755912780762, 7.901492595672607, 8.159229278564453]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 3.0, 5.0, 11.0, 13.0, 26.0, 27.0, 33.0, 56.0, 98.0, 206.0, 418.0, 934.0, 2234.0, 5838.0, 18223.0, 77889.0, 440300.0, 1786381.0, 1482337.0, 302661.0, 54471.0, 14066.0, 4726.0, 1801.0, 774.0, 355.0, 162.0, 73.0, 59.0, 36.0, 23.0, 16.0, 7.0, 4.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.259765625, -3.171417236328125, -3.08306884765625, -2.994720458984375, -2.9063720703125, -2.818023681640625, -2.72967529296875, -2.641326904296875, -2.552978515625, -2.464630126953125, -2.37628173828125, -2.287933349609375, -2.1995849609375, -2.111236572265625, -2.02288818359375, -1.934539794921875, -1.84619140625, -1.757843017578125, -1.66949462890625, -1.581146240234375, -1.4927978515625, -1.404449462890625, -1.31610107421875, -1.227752685546875, -1.139404296875, -1.051055908203125, -0.96270751953125, -0.874359130859375, -0.7860107421875, -0.697662353515625, -0.60931396484375, -0.520965576171875, -0.4326171875, -0.344268798828125, -0.25592041015625, -0.167572021484375, -0.0792236328125, 0.009124755859375, 0.09747314453125, 0.185821533203125, 0.274169921875, 0.362518310546875, 0.45086669921875, 0.539215087890625, 0.6275634765625, 0.715911865234375, 0.80426025390625, 0.892608642578125, 0.98095703125, 1.069305419921875, 1.15765380859375, 1.246002197265625, 1.3343505859375, 1.422698974609375, 1.51104736328125, 1.599395751953125, 1.687744140625, 1.776092529296875, 1.86444091796875, 1.952789306640625, 2.0411376953125, 2.129486083984375, 2.21783447265625, 2.306182861328125, 2.39453125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 4.0, 2.0, 6.0, 5.0, 7.0, 8.0, 15.0, 10.0, 12.0, 19.0, 12.0, 24.0, 21.0, 32.0, 21.0, 33.0, 35.0, 41.0, 37.0, 46.0, 46.0, 45.0, 42.0, 36.0, 46.0, 35.0, 35.0, 33.0, 29.0, 30.0, 40.0, 29.0, 19.0, 26.0, 21.0, 26.0, 14.0, 12.0, 9.0, 9.0, 8.0, 6.0, 3.0, 7.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3759765625, -1.324981689453125, -1.27398681640625, -1.222991943359375, -1.1719970703125, -1.121002197265625, -1.07000732421875, -1.019012451171875, -0.968017578125, -0.917022705078125, -0.86602783203125, -0.815032958984375, -0.7640380859375, -0.713043212890625, -0.66204833984375, -0.611053466796875, -0.56005859375, -0.509063720703125, -0.45806884765625, -0.407073974609375, -0.3560791015625, -0.305084228515625, -0.25408935546875, -0.203094482421875, -0.152099609375, -0.101104736328125, -0.05010986328125, 0.000885009765625, 0.0518798828125, 0.102874755859375, 0.15386962890625, 0.204864501953125, 0.255859375, 0.306854248046875, 0.35784912109375, 0.408843994140625, 0.4598388671875, 0.510833740234375, 0.56182861328125, 0.612823486328125, 0.663818359375, 0.714813232421875, 0.76580810546875, 0.816802978515625, 0.8677978515625, 0.918792724609375, 0.96978759765625, 1.020782470703125, 1.07177734375, 1.122772216796875, 1.17376708984375, 1.224761962890625, 1.2757568359375, 1.326751708984375, 1.37774658203125, 1.428741455078125, 1.479736328125, 1.530731201171875, 1.58172607421875, 1.632720947265625, 1.6837158203125, 1.734710693359375, 1.78570556640625, 1.836700439453125, 1.8876953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 6.0, 5.0, 8.0, 15.0, 29.0, 19.0, 35.0, 56.0, 74.0, 133.0, 207.0, 360.0, 570.0, 993.0, 1874.0, 3671.0, 7583.0, 17899.0, 46776.0, 145334.0, 624375.0, 2223354.0, 842916.0, 182769.0, 56239.0, 21008.0, 8959.0, 4116.0, 2106.0, 1119.0, 637.0, 382.0, 232.0, 131.0, 72.0, 68.0, 52.0, 33.0, 30.0, 13.0, 7.0, 2.0, 3.0, 6.0, 3.0, 2.0, 2.0, 4.0, 1.0], "bins": [-3.115234375, -3.03009033203125, -2.9449462890625, -2.85980224609375, -2.774658203125, -2.68951416015625, -2.6043701171875, -2.51922607421875, -2.43408203125, -2.34893798828125, -2.2637939453125, -2.17864990234375, -2.093505859375, -2.00836181640625, -1.9232177734375, -1.83807373046875, -1.7529296875, -1.66778564453125, -1.5826416015625, -1.49749755859375, -1.412353515625, -1.32720947265625, -1.2420654296875, -1.15692138671875, -1.07177734375, -0.98663330078125, -0.9014892578125, -0.81634521484375, -0.731201171875, -0.64605712890625, -0.5609130859375, -0.47576904296875, -0.390625, -0.30548095703125, -0.2203369140625, -0.13519287109375, -0.050048828125, 0.03509521484375, 0.1202392578125, 0.20538330078125, 0.29052734375, 0.37567138671875, 0.4608154296875, 0.54595947265625, 0.631103515625, 0.71624755859375, 0.8013916015625, 0.88653564453125, 0.9716796875, 1.05682373046875, 1.1419677734375, 1.22711181640625, 1.312255859375, 1.39739990234375, 1.4825439453125, 1.56768798828125, 1.65283203125, 1.73797607421875, 1.8231201171875, 1.90826416015625, 1.993408203125, 2.07855224609375, 2.1636962890625, 2.24884033203125, 2.333984375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 12.0, 7.0, 15.0, 19.0, 17.0, 16.0, 43.0, 47.0, 70.0, 103.0, 138.0, 194.0, 268.0, 444.0, 526.0, 568.0, 446.0, 304.0, 243.0, 150.0, 128.0, 70.0, 63.0, 37.0, 37.0, 20.0, 21.0, 17.0, 10.0, 7.0, 8.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.87890625, -3.777099609375, -3.67529296875, -3.573486328125, -3.4716796875, -3.369873046875, -3.26806640625, -3.166259765625, -3.064453125, -2.962646484375, -2.86083984375, -2.759033203125, -2.6572265625, -2.555419921875, -2.45361328125, -2.351806640625, -2.25, -2.148193359375, -2.04638671875, -1.944580078125, -1.8427734375, -1.740966796875, -1.63916015625, -1.537353515625, -1.435546875, -1.333740234375, -1.23193359375, -1.130126953125, -1.0283203125, -0.926513671875, -0.82470703125, -0.722900390625, -0.62109375, -0.519287109375, -0.41748046875, -0.315673828125, -0.2138671875, -0.112060546875, -0.01025390625, 0.091552734375, 0.193359375, 0.295166015625, 0.39697265625, 0.498779296875, 0.6005859375, 0.702392578125, 0.80419921875, 0.906005859375, 1.0078125, 1.109619140625, 1.21142578125, 1.313232421875, 1.4150390625, 1.516845703125, 1.61865234375, 1.720458984375, 1.822265625, 1.924072265625, 2.02587890625, 2.127685546875, 2.2294921875, 2.331298828125, 2.43310546875, 2.534912109375, 2.63671875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 12.0, 24.0, 30.0, 60.0, 94.0, 151.0, 159.0, 155.0, 104.0, 95.0, 49.0, 19.0, 15.0, 10.0, 10.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-30.89875030517578, -30.135883331298828, -29.373018264770508, -28.610153198242188, -27.847286224365234, -27.08441925048828, -26.32155418395996, -25.55868911743164, -24.795822143554688, -24.032955169677734, -23.270090103149414, -22.507225036621094, -21.74435806274414, -20.981491088867188, -20.218626022338867, -19.455760955810547, -18.692893981933594, -17.93002700805664, -17.16716194152832, -16.404296875, -15.641429901123047, -14.87856388092041, -14.115697860717773, -13.352831840515137, -12.5899658203125, -11.827099800109863, -11.064233779907227, -10.30136775970459, -9.538501739501953, -8.775635719299316, -8.01276969909668, -7.249903678894043, -6.487039566040039, -5.724173545837402, -4.961307525634766, -4.198441505432129, -3.435575485229492, -2.6727094650268555, -1.9098434448242188, -1.146977424621582, -0.3841114044189453, 0.3787546157836914, 1.1416206359863281, 1.9044866561889648, 2.6673526763916016, 3.4302186965942383, 4.193084716796875, 4.955950736999512, 5.718816757202148, 6.481682777404785, 7.244548797607422, 8.007414817810059, 8.770280838012695, 9.533146858215332, 10.296012878417969, 11.058878898620605, 11.821744918823242, 12.584610939025879, 13.347476959228516, 14.110342979431152, 14.873208999633789, 15.636075019836426, 16.398941040039062, 17.161808013916016, 17.924673080444336]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 5.0, 4.0, 6.0, 11.0, 11.0, 20.0, 11.0, 17.0, 30.0, 28.0, 33.0, 37.0, 41.0, 50.0, 39.0, 50.0, 63.0, 57.0, 52.0, 55.0, 50.0, 47.0, 45.0, 43.0, 35.0, 28.0, 27.0, 27.0, 19.0, 14.0, 18.0, 9.0, 5.0, 4.0, 3.0, 7.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.302630424499512, -9.956604957580566, -9.610579490661621, -9.264554023742676, -8.918529510498047, -8.572504043579102, -8.226478576660156, -7.880453109741211, -7.534427642822266, -7.18840217590332, -6.842376708984375, -6.496351718902588, -6.150326251983643, -5.804300785064697, -5.45827579498291, -5.112250328063965, -4.7662248611450195, -4.420199394226074, -4.074173927307129, -3.728148937225342, -3.3821234703063965, -3.036098003387451, -2.690072774887085, -2.3440475463867188, -1.9980220794677734, -1.6519967317581177, -1.305971384048462, -0.9599460363388062, -0.6139206886291504, -0.26789534091949463, 0.07813000679016113, 0.42415523529052734, 0.7701816558837891, 1.1162070035934448, 1.4622323513031006, 1.8082576990127563, 2.154283046722412, 2.5003085136413574, 2.8463337421417236, 3.19235897064209, 3.538384437561035, 3.8844099044799805, 4.230435371398926, 4.576460361480713, 4.922485828399658, 5.2685112953186035, 5.614536285400391, 5.960561752319336, 6.306587219238281, 6.652612686157227, 6.998638153076172, 7.344663143157959, 7.690688610076904, 8.036713600158691, 8.382739067077637, 8.728764533996582, 9.074790000915527, 9.420815467834473, 9.766840934753418, 10.112866401672363, 10.458890914916992, 10.804916381835938, 11.150941848754883, 11.496967315673828, 11.842992782592773]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 13.0, 12.0, 28.0, 27.0, 38.0, 61.0, 73.0, 105.0, 161.0, 240.0, 320.0, 467.0, 742.0, 1073.0, 1540.0, 2533.0, 4214.0, 8182.0, 18820.0, 58555.0, 201034.0, 394668.0, 239518.0, 72091.0, 22299.0, 9030.0, 4694.0, 2795.0, 1710.0, 1095.0, 779.0, 485.0, 334.0, 243.0, 164.0, 113.0, 88.0, 54.0, 41.0, 39.0, 30.0, 20.0, 8.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.052734375, -2.952911376953125, -2.85308837890625, -2.753265380859375, -2.6534423828125, -2.553619384765625, -2.45379638671875, -2.353973388671875, -2.254150390625, -2.154327392578125, -2.05450439453125, -1.954681396484375, -1.8548583984375, -1.755035400390625, -1.65521240234375, -1.555389404296875, -1.45556640625, -1.355743408203125, -1.25592041015625, -1.156097412109375, -1.0562744140625, -0.956451416015625, -0.85662841796875, -0.756805419921875, -0.656982421875, -0.557159423828125, -0.45733642578125, -0.357513427734375, -0.2576904296875, -0.157867431640625, -0.05804443359375, 0.041778564453125, 0.1416015625, 0.241424560546875, 0.34124755859375, 0.441070556640625, 0.5408935546875, 0.640716552734375, 0.74053955078125, 0.840362548828125, 0.940185546875, 1.040008544921875, 1.13983154296875, 1.239654541015625, 1.3394775390625, 1.439300537109375, 1.53912353515625, 1.638946533203125, 1.73876953125, 1.838592529296875, 1.93841552734375, 2.038238525390625, 2.1380615234375, 2.237884521484375, 2.33770751953125, 2.437530517578125, 2.537353515625, 2.637176513671875, 2.73699951171875, 2.836822509765625, 2.9366455078125, 3.036468505859375, 3.13629150390625, 3.236114501953125, 3.3359375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 8.0, 6.0, 7.0, 4.0, 11.0, 11.0, 9.0, 17.0, 13.0, 12.0, 16.0, 22.0, 26.0, 23.0, 32.0, 25.0, 38.0, 34.0, 40.0, 52.0, 39.0, 48.0, 32.0, 40.0, 43.0, 39.0, 38.0, 33.0, 31.0, 25.0, 31.0, 20.0, 34.0, 18.0, 27.0, 14.0, 17.0, 14.0, 12.0, 3.0, 9.0, 6.0, 5.0, 5.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.6513671875, -1.5969696044921875, -1.542572021484375, -1.4881744384765625, -1.43377685546875, -1.3793792724609375, -1.324981689453125, -1.2705841064453125, -1.2161865234375, -1.1617889404296875, -1.107391357421875, -1.0529937744140625, -0.99859619140625, -0.9441986083984375, -0.889801025390625, -0.8354034423828125, -0.781005859375, -0.7266082763671875, -0.672210693359375, -0.6178131103515625, -0.56341552734375, -0.5090179443359375, -0.454620361328125, -0.4002227783203125, -0.3458251953125, -0.2914276123046875, -0.237030029296875, -0.1826324462890625, -0.12823486328125, -0.0738372802734375, -0.019439697265625, 0.0349578857421875, 0.08935546875, 0.1437530517578125, 0.198150634765625, 0.2525482177734375, 0.30694580078125, 0.3613433837890625, 0.415740966796875, 0.4701385498046875, 0.5245361328125, 0.5789337158203125, 0.633331298828125, 0.6877288818359375, 0.74212646484375, 0.7965240478515625, 0.850921630859375, 0.9053192138671875, 0.959716796875, 1.0141143798828125, 1.068511962890625, 1.1229095458984375, 1.17730712890625, 1.2317047119140625, 1.286102294921875, 1.3404998779296875, 1.3948974609375, 1.4492950439453125, 1.503692626953125, 1.5580902099609375, 1.61248779296875, 1.6668853759765625, 1.721282958984375, 1.7756805419921875, 1.830078125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 1.0, 3.0, 9.0, 11.0, 22.0, 31.0, 57.0, 93.0, 166.0, 275.0, 462.0, 793.0, 1482.0, 2783.0, 6007.0, 14555.0, 49253.0, 237978.0, 508666.0, 167457.0, 36152.0, 11689.0, 5103.0, 2441.0, 1309.0, 740.0, 429.0, 247.0, 144.0, 69.0, 40.0, 37.0, 24.0, 9.0, 10.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.638671875, -3.514862060546875, -3.39105224609375, -3.267242431640625, -3.1434326171875, -3.019622802734375, -2.89581298828125, -2.772003173828125, -2.648193359375, -2.524383544921875, -2.40057373046875, -2.276763916015625, -2.1529541015625, -2.029144287109375, -1.90533447265625, -1.781524658203125, -1.65771484375, -1.533905029296875, -1.41009521484375, -1.286285400390625, -1.1624755859375, -1.038665771484375, -0.91485595703125, -0.791046142578125, -0.667236328125, -0.543426513671875, -0.41961669921875, -0.295806884765625, -0.1719970703125, -0.048187255859375, 0.07562255859375, 0.199432373046875, 0.3232421875, 0.447052001953125, 0.57086181640625, 0.694671630859375, 0.8184814453125, 0.942291259765625, 1.06610107421875, 1.189910888671875, 1.313720703125, 1.437530517578125, 1.56134033203125, 1.685150146484375, 1.8089599609375, 1.932769775390625, 2.05657958984375, 2.180389404296875, 2.30419921875, 2.428009033203125, 2.55181884765625, 2.675628662109375, 2.7994384765625, 2.923248291015625, 3.04705810546875, 3.170867919921875, 3.294677734375, 3.418487548828125, 3.54229736328125, 3.666107177734375, 3.7899169921875, 3.913726806640625, 4.03753662109375, 4.161346435546875, 4.28515625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 10.0, 8.0, 11.0, 11.0, 11.0, 10.0, 16.0, 31.0, 34.0, 22.0, 31.0, 27.0, 44.0, 40.0, 47.0, 44.0, 58.0, 38.0, 56.0, 41.0, 42.0, 41.0, 34.0, 42.0, 45.0, 28.0, 39.0, 17.0, 22.0, 17.0, 23.0, 13.0, 11.0, 9.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.2001953125, -5.029296875, -4.8583984375, -4.6875, -4.5166015625, -4.345703125, -4.1748046875, -4.00390625, -3.8330078125, -3.662109375, -3.4912109375, -3.3203125, -3.1494140625, -2.978515625, -2.8076171875, -2.63671875, -2.4658203125, -2.294921875, -2.1240234375, -1.953125, -1.7822265625, -1.611328125, -1.4404296875, -1.26953125, -1.0986328125, -0.927734375, -0.7568359375, -0.5859375, -0.4150390625, -0.244140625, -0.0732421875, 0.09765625, 0.2685546875, 0.439453125, 0.6103515625, 0.78125, 0.9521484375, 1.123046875, 1.2939453125, 1.46484375, 1.6357421875, 1.806640625, 1.9775390625, 2.1484375, 2.3193359375, 2.490234375, 2.6611328125, 2.83203125, 3.0029296875, 3.173828125, 3.3447265625, 3.515625, 3.6865234375, 3.857421875, 4.0283203125, 4.19921875, 4.3701171875, 4.541015625, 4.7119140625, 4.8828125, 5.0537109375, 5.224609375, 5.3955078125, 5.56640625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 4.0, 12.0, 11.0, 18.0, 22.0, 39.0, 46.0, 86.0, 154.0, 222.0, 376.0, 645.0, 1133.0, 2030.0, 4009.0, 7991.0, 17795.0, 40764.0, 103404.0, 245045.0, 320977.0, 178320.0, 70654.0, 28743.0, 12926.0, 6092.0, 3165.0, 1580.0, 929.0, 520.0, 312.0, 192.0, 118.0, 66.0, 51.0, 29.0, 24.0, 9.0, 13.0, 9.0, 4.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79150390625, -0.765380859375, -0.7392578125, -0.713134765625, -0.68701171875, -0.660888671875, -0.634765625, -0.608642578125, -0.58251953125, -0.556396484375, -0.5302734375, -0.504150390625, -0.47802734375, -0.451904296875, -0.42578125, -0.399658203125, -0.37353515625, -0.347412109375, -0.3212890625, -0.295166015625, -0.26904296875, -0.242919921875, -0.216796875, -0.190673828125, -0.16455078125, -0.138427734375, -0.1123046875, -0.086181640625, -0.06005859375, -0.033935546875, -0.0078125, 0.018310546875, 0.04443359375, 0.070556640625, 0.0966796875, 0.122802734375, 0.14892578125, 0.175048828125, 0.201171875, 0.227294921875, 0.25341796875, 0.279541015625, 0.3056640625, 0.331787109375, 0.35791015625, 0.384033203125, 0.41015625, 0.436279296875, 0.46240234375, 0.488525390625, 0.5146484375, 0.540771484375, 0.56689453125, 0.593017578125, 0.619140625, 0.645263671875, 0.67138671875, 0.697509765625, 0.7236328125, 0.749755859375, 0.77587890625, 0.802001953125, 0.828125, 0.854248046875, 0.88037109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 5.0, 10.0, 7.0, 10.0, 10.0, 12.0, 16.0, 30.0, 44.0, 52.0, 49.0, 85.0, 82.0, 92.0, 92.0, 79.0, 69.0, 57.0, 51.0, 36.0, 20.0, 25.0, 16.0, 16.0, 6.0, 4.0, 1.0, 5.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002980232238769531, -0.00028840452432632446, -0.0002787858247756958, -0.00026916712522506714, -0.0002595484256744385, -0.0002499297261238098, -0.00024031102657318115, -0.0002306923270225525, -0.00022107362747192383, -0.00021145492792129517, -0.0002018362283706665, -0.00019221752882003784, -0.00018259882926940918, -0.00017298012971878052, -0.00016336143016815186, -0.0001537427306175232, -0.00014412403106689453, -0.00013450533151626587, -0.0001248866319656372, -0.00011526793241500854, -0.00010564923286437988, -9.603053331375122e-05, -8.641183376312256e-05, -7.67931342124939e-05, -6.717443466186523e-05, -5.755573511123657e-05, -4.793703556060791e-05, -3.831833600997925e-05, -2.8699636459350586e-05, -1.9080936908721924e-05, -9.462237358093262e-06, 1.564621925354004e-07, 9.775161743164062e-06, 1.9393861293792725e-05, 2.9012560844421387e-05, 3.863126039505005e-05, 4.824995994567871e-05, 5.786865949630737e-05, 6.748735904693604e-05, 7.71060585975647e-05, 8.672475814819336e-05, 9.634345769882202e-05, 0.00010596215724945068, 0.00011558085680007935, 0.000125199556350708, 0.00013481825590133667, 0.00014443695545196533, 0.000154055655002594, 0.00016367435455322266, 0.00017329305410385132, 0.00018291175365447998, 0.00019253045320510864, 0.0002021491527557373, 0.00021176785230636597, 0.00022138655185699463, 0.0002310052514076233, 0.00024062395095825195, 0.0002502426505088806, 0.0002598613500595093, 0.00026948004961013794, 0.0002790987491607666, 0.00028871744871139526, 0.0002983361482620239, 0.0003079548478126526, 0.00031757354736328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 8.0, 2.0, 4.0, 4.0, 4.0, 9.0, 14.0, 20.0, 20.0, 51.0, 71.0, 103.0, 169.0, 285.0, 512.0, 939.0, 1935.0, 3784.0, 7908.0, 17356.0, 40571.0, 96383.0, 208376.0, 294587.0, 207106.0, 94889.0, 40199.0, 17657.0, 7765.0, 3692.0, 1826.0, 982.0, 548.0, 272.0, 180.0, 109.0, 68.0, 38.0, 50.0, 18.0, 15.0, 16.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.80322265625, -0.77850341796875, -0.7537841796875, -0.72906494140625, -0.704345703125, -0.67962646484375, -0.6549072265625, -0.63018798828125, -0.60546875, -0.58074951171875, -0.5560302734375, -0.53131103515625, -0.506591796875, -0.48187255859375, -0.4571533203125, -0.43243408203125, -0.40771484375, -0.38299560546875, -0.3582763671875, -0.33355712890625, -0.308837890625, -0.28411865234375, -0.2593994140625, -0.23468017578125, -0.2099609375, -0.18524169921875, -0.1605224609375, -0.13580322265625, -0.111083984375, -0.08636474609375, -0.0616455078125, -0.03692626953125, -0.01220703125, 0.01251220703125, 0.0372314453125, 0.06195068359375, 0.086669921875, 0.11138916015625, 0.1361083984375, 0.16082763671875, 0.185546875, 0.21026611328125, 0.2349853515625, 0.25970458984375, 0.284423828125, 0.30914306640625, 0.3338623046875, 0.35858154296875, 0.38330078125, 0.40802001953125, 0.4327392578125, 0.45745849609375, 0.482177734375, 0.50689697265625, 0.5316162109375, 0.55633544921875, 0.5810546875, 0.60577392578125, 0.6304931640625, 0.65521240234375, 0.679931640625, 0.70465087890625, 0.7293701171875, 0.75408935546875, 0.77880859375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 5.0, 6.0, 6.0, 15.0, 23.0, 22.0, 27.0, 50.0, 45.0, 52.0, 67.0, 59.0, 67.0, 65.0, 75.0, 67.0, 66.0, 46.0, 39.0, 35.0, 36.0, 23.0, 24.0, 10.0, 16.0, 8.0, 16.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0693359375, -1.036773681640625, -1.00421142578125, -0.971649169921875, -0.9390869140625, -0.906524658203125, -0.87396240234375, -0.841400146484375, -0.808837890625, -0.776275634765625, -0.74371337890625, -0.711151123046875, -0.6785888671875, -0.646026611328125, -0.61346435546875, -0.580902099609375, -0.54833984375, -0.515777587890625, -0.48321533203125, -0.450653076171875, -0.4180908203125, -0.385528564453125, -0.35296630859375, -0.320404052734375, -0.287841796875, -0.255279541015625, -0.22271728515625, -0.190155029296875, -0.1575927734375, -0.125030517578125, -0.09246826171875, -0.059906005859375, -0.02734375, 0.005218505859375, 0.03778076171875, 0.070343017578125, 0.1029052734375, 0.135467529296875, 0.16802978515625, 0.200592041015625, 0.233154296875, 0.265716552734375, 0.29827880859375, 0.330841064453125, 0.3634033203125, 0.395965576171875, 0.42852783203125, 0.461090087890625, 0.49365234375, 0.526214599609375, 0.55877685546875, 0.591339111328125, 0.6239013671875, 0.656463623046875, 0.68902587890625, 0.721588134765625, 0.754150390625, 0.786712646484375, 0.81927490234375, 0.851837158203125, 0.8843994140625, 0.916961669921875, 0.94952392578125, 0.982086181640625, 1.0146484375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 9.0, 17.0, 27.0, 58.0, 80.0, 126.0, 170.0, 157.0, 154.0, 83.0, 48.0, 25.0, 13.0, 6.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.245893478393555, -21.448122024536133, -20.650352478027344, -19.852581024169922, -19.054811477661133, -18.25704002380371, -17.459270477294922, -16.6614990234375, -15.863728523254395, -15.065958023071289, -14.268187522888184, -13.470417022705078, -12.672645568847656, -11.874876022338867, -11.077104568481445, -10.27933406829834, -9.481563568115234, -8.683793067932129, -7.886022567749023, -7.08825159072876, -6.290481090545654, -5.492710590362549, -4.694939613342285, -3.8971691131591797, -3.099398612976074, -2.3016281127929688, -1.5038573741912842, -0.7060866355895996, 0.09168386459350586, 0.8894543647766113, 1.687225341796875, 2.4849958419799805, 3.282764434814453, 4.080534934997559, 4.878305435180664, 5.676076412200928, 6.473846912384033, 7.271617412567139, 8.069388389587402, 8.867158889770508, 9.664929389953613, 10.462699890136719, 11.260470390319824, 12.05824089050293, 12.856012344360352, 13.65378189086914, 14.451553344726562, 15.249323844909668, 16.047094345092773, 16.844865798950195, 17.642635345458984, 18.440406799316406, 19.238176345825195, 20.035947799682617, 20.833717346191406, 21.631488800048828, 22.42926025390625, 23.227031707763672, 24.02480125427246, 24.822572708129883, 25.620342254638672, 26.418113708496094, 27.215885162353516, 28.013654708862305, 28.811424255371094]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 5.0, 0.0, 4.0, 11.0, 6.0, 11.0, 13.0, 7.0, 18.0, 19.0, 24.0, 24.0, 25.0, 22.0, 28.0, 40.0, 39.0, 45.0, 41.0, 43.0, 57.0, 40.0, 39.0, 46.0, 38.0, 36.0, 44.0, 31.0, 31.0, 27.0, 29.0, 28.0, 22.0, 22.0, 16.0, 17.0, 7.0, 7.0, 10.0, 9.0, 5.0, 5.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.220782279968262, -10.84721851348877, -10.473653793334961, -10.100090026855469, -9.726526260375977, -9.352962493896484, -8.979398727416992, -8.605834007263184, -8.232270240783691, -7.858706474304199, -7.485142230987549, -7.111577987670898, -6.738014221191406, -6.364450454711914, -5.990886211395264, -5.617321968078613, -5.243758201599121, -4.870194435119629, -4.4966301918029785, -4.123065948486328, -3.749502182006836, -3.3759381771087646, -3.0023741722106934, -2.628810167312622, -2.255246162414551, -1.8816821575164795, -1.5081181526184082, -1.134554147720337, -0.7609901428222656, -0.38742613792419434, -0.013862133026123047, 0.35970187187194824, 0.7332658767700195, 1.1068298816680908, 1.480393886566162, 1.8539578914642334, 2.2275218963623047, 2.601085901260376, 2.9746499061584473, 3.3482139110565186, 3.72177791595459, 4.095341682434082, 4.468905925750732, 4.842470169067383, 5.216033935546875, 5.589597702026367, 5.963161945343018, 6.336726188659668, 6.71028995513916, 7.083853721618652, 7.457417964935303, 7.830982208251953, 8.204545974731445, 8.578109741210938, 8.95167350769043, 9.325238227844238, 9.69880199432373, 10.072365760803223, 10.445930480957031, 10.819494247436523, 11.193058013916016, 11.566621780395508, 11.940185546875, 12.313750267028809, 12.6873140335083]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 6.0, 5.0, 10.0, 13.0, 22.0, 33.0, 40.0, 76.0, 90.0, 166.0, 244.0, 433.0, 703.0, 1270.0, 2336.0, 4744.0, 10855.0, 28409.0, 94199.0, 379487.0, 1233344.0, 1592546.0, 623098.0, 151829.0, 41984.0, 14790.0, 6494.0, 3148.0, 1573.0, 900.0, 550.0, 304.0, 195.0, 111.0, 91.0, 56.0, 38.0, 30.0, 14.0, 20.0, 14.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.341796875, -2.26904296875, -2.1962890625, -2.12353515625, -2.05078125, -1.97802734375, -1.9052734375, -1.83251953125, -1.759765625, -1.68701171875, -1.6142578125, -1.54150390625, -1.46875, -1.39599609375, -1.3232421875, -1.25048828125, -1.177734375, -1.10498046875, -1.0322265625, -0.95947265625, -0.88671875, -0.81396484375, -0.7412109375, -0.66845703125, -0.595703125, -0.52294921875, -0.4501953125, -0.37744140625, -0.3046875, -0.23193359375, -0.1591796875, -0.08642578125, -0.013671875, 0.05908203125, 0.1318359375, 0.20458984375, 0.27734375, 0.35009765625, 0.4228515625, 0.49560546875, 0.568359375, 0.64111328125, 0.7138671875, 0.78662109375, 0.859375, 0.93212890625, 1.0048828125, 1.07763671875, 1.150390625, 1.22314453125, 1.2958984375, 1.36865234375, 1.44140625, 1.51416015625, 1.5869140625, 1.65966796875, 1.732421875, 1.80517578125, 1.8779296875, 1.95068359375, 2.0234375, 2.09619140625, 2.1689453125, 2.24169921875, 2.314453125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 14.0, 6.0, 9.0, 10.0, 8.0, 18.0, 30.0, 24.0, 18.0, 28.0, 34.0, 36.0, 31.0, 27.0, 34.0, 45.0, 38.0, 35.0, 30.0, 34.0, 34.0, 35.0, 36.0, 35.0, 25.0, 31.0, 36.0, 33.0, 19.0, 35.0, 18.0, 24.0, 18.0, 22.0, 11.0, 16.0, 17.0, 14.0, 5.0, 5.0, 8.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.310546875, -1.263092041015625, -1.21563720703125, -1.168182373046875, -1.1207275390625, -1.073272705078125, -1.02581787109375, -0.978363037109375, -0.930908203125, -0.883453369140625, -0.83599853515625, -0.788543701171875, -0.7410888671875, -0.693634033203125, -0.64617919921875, -0.598724365234375, -0.55126953125, -0.503814697265625, -0.45635986328125, -0.408905029296875, -0.3614501953125, -0.313995361328125, -0.26654052734375, -0.219085693359375, -0.171630859375, -0.124176025390625, -0.07672119140625, -0.029266357421875, 0.0181884765625, 0.065643310546875, 0.11309814453125, 0.160552978515625, 0.2080078125, 0.255462646484375, 0.30291748046875, 0.350372314453125, 0.3978271484375, 0.445281982421875, 0.49273681640625, 0.540191650390625, 0.587646484375, 0.635101318359375, 0.68255615234375, 0.730010986328125, 0.7774658203125, 0.824920654296875, 0.87237548828125, 0.919830322265625, 0.96728515625, 1.014739990234375, 1.06219482421875, 1.109649658203125, 1.1571044921875, 1.204559326171875, 1.25201416015625, 1.299468994140625, 1.346923828125, 1.394378662109375, 1.44183349609375, 1.489288330078125, 1.5367431640625, 1.584197998046875, 1.63165283203125, 1.679107666015625, 1.7265625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 0.0, 2.0, 5.0, 14.0, 6.0, 12.0, 13.0, 30.0, 41.0, 51.0, 59.0, 108.0, 116.0, 237.0, 380.0, 570.0, 1045.0, 1768.0, 3339.0, 6769.0, 15243.0, 39581.0, 129832.0, 633776.0, 2390045.0, 749359.0, 146391.0, 43245.0, 16695.0, 7280.0, 3562.0, 1905.0, 1043.0, 621.0, 343.0, 252.0, 167.0, 127.0, 72.0, 54.0, 46.0, 23.0, 24.0, 10.0, 10.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7734375, -2.685516357421875, -2.59759521484375, -2.509674072265625, -2.4217529296875, -2.333831787109375, -2.24591064453125, -2.157989501953125, -2.070068359375, -1.982147216796875, -1.89422607421875, -1.806304931640625, -1.7183837890625, -1.630462646484375, -1.54254150390625, -1.454620361328125, -1.36669921875, -1.278778076171875, -1.19085693359375, -1.102935791015625, -1.0150146484375, -0.927093505859375, -0.83917236328125, -0.751251220703125, -0.663330078125, -0.575408935546875, -0.48748779296875, -0.399566650390625, -0.3116455078125, -0.223724365234375, -0.13580322265625, -0.047882080078125, 0.0400390625, 0.127960205078125, 0.21588134765625, 0.303802490234375, 0.3917236328125, 0.479644775390625, 0.56756591796875, 0.655487060546875, 0.743408203125, 0.831329345703125, 0.91925048828125, 1.007171630859375, 1.0950927734375, 1.183013916015625, 1.27093505859375, 1.358856201171875, 1.44677734375, 1.534698486328125, 1.62261962890625, 1.710540771484375, 1.7984619140625, 1.886383056640625, 1.97430419921875, 2.062225341796875, 2.150146484375, 2.238067626953125, 2.32598876953125, 2.413909912109375, 2.5018310546875, 2.589752197265625, 2.67767333984375, 2.765594482421875, 2.853515625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 9.0, 18.0, 22.0, 22.0, 32.0, 42.0, 45.0, 91.0, 133.0, 191.0, 319.0, 457.0, 619.0, 585.0, 505.0, 293.0, 224.0, 135.0, 85.0, 65.0, 44.0, 35.0, 28.0, 17.0, 5.0, 11.0, 8.0, 7.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.970703125, -3.85736083984375, -3.7440185546875, -3.63067626953125, -3.517333984375, -3.40399169921875, -3.2906494140625, -3.17730712890625, -3.06396484375, -2.95062255859375, -2.8372802734375, -2.72393798828125, -2.610595703125, -2.49725341796875, -2.3839111328125, -2.27056884765625, -2.1572265625, -2.04388427734375, -1.9305419921875, -1.81719970703125, -1.703857421875, -1.59051513671875, -1.4771728515625, -1.36383056640625, -1.25048828125, -1.13714599609375, -1.0238037109375, -0.91046142578125, -0.797119140625, -0.68377685546875, -0.5704345703125, -0.45709228515625, -0.34375, -0.23040771484375, -0.1170654296875, -0.00372314453125, 0.109619140625, 0.22296142578125, 0.3363037109375, 0.44964599609375, 0.56298828125, 0.67633056640625, 0.7896728515625, 0.90301513671875, 1.016357421875, 1.12969970703125, 1.2430419921875, 1.35638427734375, 1.4697265625, 1.58306884765625, 1.6964111328125, 1.80975341796875, 1.923095703125, 2.03643798828125, 2.1497802734375, 2.26312255859375, 2.37646484375, 2.48980712890625, 2.6031494140625, 2.71649169921875, 2.829833984375, 2.94317626953125, 3.0565185546875, 3.16986083984375, 3.283203125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 8.0, 10.0, 21.0, 46.0, 126.0, 192.0, 209.0, 173.0, 103.0, 55.0, 33.0, 13.0, 7.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-54.64356994628906, -53.56089401245117, -52.478214263916016, -51.395538330078125, -50.312862396240234, -49.230186462402344, -48.14750671386719, -47.0648307800293, -45.982154846191406, -44.899478912353516, -43.81679916381836, -42.73412322998047, -41.65144729614258, -40.56877136230469, -39.48609161376953, -38.40341567993164, -37.32073974609375, -36.23806381225586, -35.1553840637207, -34.07270812988281, -32.99003219604492, -31.9073543548584, -30.824676513671875, -29.742000579833984, -28.659320831298828, -27.576642990112305, -26.493967056274414, -25.41128921508789, -24.32861328125, -23.245935440063477, -22.163257598876953, -21.080581665039062, -19.997909545898438, -18.915231704711914, -17.832555770874023, -16.7498779296875, -15.66720199584961, -14.584524154663086, -13.501847267150879, -12.419170379638672, -11.336492538452148, -10.253815650939941, -9.171138763427734, -8.088460922241211, -7.005784511566162, -5.923107624053955, -4.84043025970459, -3.757753372192383, -2.675076484680176, -1.5923994779586792, -0.5097224712371826, 0.5729546546936035, 1.6556315422058105, 2.7383084297180176, 3.820985794067383, 4.90366268157959, 5.986339569091797, 7.069016456604004, 8.151693344116211, 9.234371185302734, 10.317047119140625, 11.399724960327148, 12.482401847839355, 13.565078735351562, 14.64775562286377]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 5.0, 6.0, 12.0, 9.0, 16.0, 13.0, 4.0, 13.0, 23.0, 23.0, 31.0, 36.0, 26.0, 29.0, 23.0, 36.0, 39.0, 44.0, 47.0, 50.0, 48.0, 54.0, 53.0, 41.0, 44.0, 35.0, 29.0, 26.0, 32.0, 21.0, 29.0, 18.0, 20.0, 22.0, 14.0, 5.0, 9.0, 7.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.718246459960938, -8.39199447631836, -8.065743446350098, -7.7394914627075195, -7.4132399559021, -7.08698844909668, -6.760736465454102, -6.434484958648682, -6.108233451843262, -5.781981945037842, -5.455730438232422, -5.129478454589844, -4.803226947784424, -4.476975440979004, -4.150723457336426, -3.824471950531006, -3.498220443725586, -3.171968936920166, -2.845717191696167, -2.519465446472168, -2.193213939666748, -1.8669623136520386, -1.540710687637329, -1.21445894241333, -0.8882074356079102, -0.5619558095932007, -0.2357041835784912, 0.09054744243621826, 0.41679906845092773, 0.7430506944656372, 1.0693023204803467, 1.3955540657043457, 1.7218055725097656, 2.0480570793151855, 2.3743088245391846, 2.7005605697631836, 3.0268120765686035, 3.3530635833740234, 3.6793153285980225, 4.0055670738220215, 4.331818580627441, 4.658070087432861, 4.984321594238281, 5.310573577880859, 5.636825084686279, 5.963076591491699, 6.289328575134277, 6.615580081939697, 6.941831588745117, 7.268083095550537, 7.594334602355957, 7.920586585998535, 8.246837615966797, 8.573089599609375, 8.899341583251953, 9.225593566894531, 9.551844596862793, 9.878096580505371, 10.204347610473633, 10.530599594116211, 10.856851577758789, 11.18310260772705, 11.509354591369629, 11.83560562133789, 12.161857604980469]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 12.0, 18.0, 13.0, 35.0, 42.0, 46.0, 94.0, 128.0, 217.0, 275.0, 490.0, 726.0, 1169.0, 1913.0, 3094.0, 5133.0, 8311.0, 14327.0, 24280.0, 41107.0, 68925.0, 109316.0, 156807.0, 182875.0, 155027.0, 107083.0, 67193.0, 40613.0, 23885.0, 14226.0, 8365.0, 4881.0, 2913.0, 1843.0, 1153.0, 716.0, 451.0, 312.0, 183.0, 122.0, 74.0, 62.0, 35.0, 22.0, 12.0, 13.0, 7.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2861328125, -1.2465362548828125, -1.206939697265625, -1.1673431396484375, -1.12774658203125, -1.0881500244140625, -1.048553466796875, -1.0089569091796875, -0.9693603515625, -0.9297637939453125, -0.890167236328125, -0.8505706787109375, -0.81097412109375, -0.7713775634765625, -0.731781005859375, -0.6921844482421875, -0.652587890625, -0.6129913330078125, -0.573394775390625, -0.5337982177734375, -0.49420166015625, -0.4546051025390625, -0.415008544921875, -0.3754119873046875, -0.3358154296875, -0.2962188720703125, -0.256622314453125, -0.2170257568359375, -0.17742919921875, -0.1378326416015625, -0.098236083984375, -0.0586395263671875, -0.01904296875, 0.0205535888671875, 0.060150146484375, 0.0997467041015625, 0.13934326171875, 0.1789398193359375, 0.218536376953125, 0.2581329345703125, 0.2977294921875, 0.3373260498046875, 0.376922607421875, 0.4165191650390625, 0.45611572265625, 0.4957122802734375, 0.535308837890625, 0.5749053955078125, 0.614501953125, 0.6540985107421875, 0.693695068359375, 0.7332916259765625, 0.77288818359375, 0.8124847412109375, 0.852081298828125, 0.8916778564453125, 0.9312744140625, 0.9708709716796875, 1.010467529296875, 1.0500640869140625, 1.08966064453125, 1.1292572021484375, 1.168853759765625, 1.2084503173828125, 1.248046875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 4.0, 8.0, 11.0, 9.0, 16.0, 17.0, 24.0, 19.0, 31.0, 31.0, 26.0, 27.0, 33.0, 40.0, 35.0, 47.0, 28.0, 44.0, 44.0, 43.0, 51.0, 27.0, 38.0, 38.0, 30.0, 36.0, 29.0, 30.0, 9.0, 24.0, 22.0, 20.0, 15.0, 13.0, 14.0, 14.0, 16.0, 6.0, 9.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0], "bins": [-2.0625, -2.00579833984375, -1.9490966796875, -1.89239501953125, -1.835693359375, -1.77899169921875, -1.7222900390625, -1.66558837890625, -1.60888671875, -1.55218505859375, -1.4954833984375, -1.43878173828125, -1.382080078125, -1.32537841796875, -1.2686767578125, -1.21197509765625, -1.1552734375, -1.09857177734375, -1.0418701171875, -0.98516845703125, -0.928466796875, -0.87176513671875, -0.8150634765625, -0.75836181640625, -0.70166015625, -0.64495849609375, -0.5882568359375, -0.53155517578125, -0.474853515625, -0.41815185546875, -0.3614501953125, -0.30474853515625, -0.248046875, -0.19134521484375, -0.1346435546875, -0.07794189453125, -0.021240234375, 0.03546142578125, 0.0921630859375, 0.14886474609375, 0.20556640625, 0.26226806640625, 0.3189697265625, 0.37567138671875, 0.432373046875, 0.48907470703125, 0.5457763671875, 0.60247802734375, 0.6591796875, 0.71588134765625, 0.7725830078125, 0.82928466796875, 0.885986328125, 0.94268798828125, 0.9993896484375, 1.05609130859375, 1.11279296875, 1.16949462890625, 1.2261962890625, 1.28289794921875, 1.339599609375, 1.39630126953125, 1.4530029296875, 1.50970458984375, 1.56640625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 11.0, 6.0, 26.0, 32.0, 59.0, 104.0, 188.0, 422.0, 933.0, 2066.0, 4835.0, 12602.0, 34830.0, 100387.0, 257762.0, 370316.0, 168241.0, 60844.0, 21278.0, 7853.0, 3203.0, 1316.0, 626.0, 299.0, 164.0, 72.0, 34.0, 18.0, 15.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.599609375, -2.52587890625, -2.4521484375, -2.37841796875, -2.3046875, -2.23095703125, -2.1572265625, -2.08349609375, -2.009765625, -1.93603515625, -1.8623046875, -1.78857421875, -1.71484375, -1.64111328125, -1.5673828125, -1.49365234375, -1.419921875, -1.34619140625, -1.2724609375, -1.19873046875, -1.125, -1.05126953125, -0.9775390625, -0.90380859375, -0.830078125, -0.75634765625, -0.6826171875, -0.60888671875, -0.53515625, -0.46142578125, -0.3876953125, -0.31396484375, -0.240234375, -0.16650390625, -0.0927734375, -0.01904296875, 0.0546875, 0.12841796875, 0.2021484375, 0.27587890625, 0.349609375, 0.42333984375, 0.4970703125, 0.57080078125, 0.64453125, 0.71826171875, 0.7919921875, 0.86572265625, 0.939453125, 1.01318359375, 1.0869140625, 1.16064453125, 1.234375, 1.30810546875, 1.3818359375, 1.45556640625, 1.529296875, 1.60302734375, 1.6767578125, 1.75048828125, 1.82421875, 1.89794921875, 1.9716796875, 2.04541015625, 2.119140625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 3.0, 7.0, 4.0, 5.0, 3.0, 11.0, 10.0, 17.0, 20.0, 21.0, 20.0, 25.0, 39.0, 36.0, 26.0, 35.0, 35.0, 44.0, 34.0, 41.0, 46.0, 40.0, 52.0, 47.0, 44.0, 39.0, 55.0, 32.0, 38.0, 22.0, 27.0, 21.0, 13.0, 15.0, 11.0, 13.0, 11.0, 10.0, 8.0, 4.0, 0.0, 2.0, 7.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.7890625, -4.6383056640625, -4.487548828125, -4.3367919921875, -4.18603515625, -4.0352783203125, -3.884521484375, -3.7337646484375, -3.5830078125, -3.4322509765625, -3.281494140625, -3.1307373046875, -2.97998046875, -2.8292236328125, -2.678466796875, -2.5277099609375, -2.376953125, -2.2261962890625, -2.075439453125, -1.9246826171875, -1.77392578125, -1.6231689453125, -1.472412109375, -1.3216552734375, -1.1708984375, -1.0201416015625, -0.869384765625, -0.7186279296875, -0.56787109375, -0.4171142578125, -0.266357421875, -0.1156005859375, 0.03515625, 0.1859130859375, 0.336669921875, 0.4874267578125, 0.63818359375, 0.7889404296875, 0.939697265625, 1.0904541015625, 1.2412109375, 1.3919677734375, 1.542724609375, 1.6934814453125, 1.84423828125, 1.9949951171875, 2.145751953125, 2.2965087890625, 2.447265625, 2.5980224609375, 2.748779296875, 2.8995361328125, 3.05029296875, 3.2010498046875, 3.351806640625, 3.5025634765625, 3.6533203125, 3.8040771484375, 3.954833984375, 4.1055908203125, 4.25634765625, 4.4071044921875, 4.557861328125, 4.7086181640625, 4.859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 6.0, 11.0, 23.0, 20.0, 23.0, 42.0, 63.0, 114.0, 174.0, 305.0, 567.0, 967.0, 1845.0, 3496.0, 7146.0, 15044.0, 32136.0, 71483.0, 152066.0, 292232.0, 238475.0, 124519.0, 57527.0, 25921.0, 12169.0, 5802.0, 2846.0, 1534.0, 837.0, 457.0, 269.0, 166.0, 95.0, 60.0, 35.0, 20.0, 23.0, 5.0, 12.0, 9.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51318359375, -0.4980278015136719, -0.48287200927734375, -0.4677162170410156, -0.4525604248046875, -0.4374046325683594, -0.42224884033203125, -0.4070930480957031, -0.391937255859375, -0.3767814636230469, -0.36162567138671875, -0.3464698791503906, -0.3313140869140625, -0.3161582946777344, -0.30100250244140625, -0.2858467102050781, -0.27069091796875, -0.2555351257324219, -0.24037933349609375, -0.22522354125976562, -0.2100677490234375, -0.19491195678710938, -0.17975616455078125, -0.16460037231445312, -0.149444580078125, -0.13428878784179688, -0.11913299560546875, -0.10397720336914062, -0.0888214111328125, -0.07366561889648438, -0.05850982666015625, -0.043354034423828125, -0.0281982421875, -0.013042449951171875, 0.00211334228515625, 0.017269134521484375, 0.0324249267578125, 0.047580718994140625, 0.06273651123046875, 0.07789230346679688, 0.093048095703125, 0.10820388793945312, 0.12335968017578125, 0.13851547241210938, 0.1536712646484375, 0.16882705688476562, 0.18398284912109375, 0.19913864135742188, 0.21429443359375, 0.22945022583007812, 0.24460601806640625, 0.2597618103027344, 0.2749176025390625, 0.2900733947753906, 0.30522918701171875, 0.3203849792480469, 0.335540771484375, 0.3506965637207031, 0.36585235595703125, 0.3810081481933594, 0.3961639404296875, 0.4113197326660156, 0.42647552490234375, 0.4416313171386719, 0.456787109375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 4.0, 6.0, 8.0, 1.0, 3.0, 3.0, 4.0, 7.0, 14.0, 13.0, 13.0, 14.0, 26.0, 29.0, 28.0, 38.0, 45.0, 41.0, 57.0, 70.0, 87.0, 70.0, 74.0, 59.0, 46.0, 40.0, 27.0, 32.0, 22.0, 21.0, 21.0, 13.0, 11.0, 13.0, 7.0, 8.0, 6.0, 1.0, 8.0, 4.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00017642974853515625, -0.0001703612506389618, -0.00016429275274276733, -0.00015822425484657288, -0.00015215575695037842, -0.00014608725905418396, -0.0001400187611579895, -0.00013395026326179504, -0.00012788176536560059, -0.00012181326746940613, -0.00011574476957321167, -0.00010967627167701721, -0.00010360777378082275, -9.75392758846283e-05, -9.147077798843384e-05, -8.540228009223938e-05, -7.933378219604492e-05, -7.326528429985046e-05, -6.7196786403656e-05, -6.112828850746155e-05, -5.505979061126709e-05, -4.899129271507263e-05, -4.2922794818878174e-05, -3.6854296922683716e-05, -3.078579902648926e-05, -2.47173011302948e-05, -1.8648803234100342e-05, -1.2580305337905884e-05, -6.511807441711426e-06, -4.4330954551696777e-07, 5.62518835067749e-06, 1.1693686246871948e-05, 1.7762184143066406e-05, 2.3830682039260864e-05, 2.9899179935455322e-05, 3.596767783164978e-05, 4.203617572784424e-05, 4.8104673624038696e-05, 5.4173171520233154e-05, 6.024166941642761e-05, 6.631016731262207e-05, 7.237866520881653e-05, 7.844716310501099e-05, 8.451566100120544e-05, 9.05841588973999e-05, 9.665265679359436e-05, 0.00010272115468978882, 0.00010878965258598328, 0.00011485815048217773, 0.00012092664837837219, 0.00012699514627456665, 0.0001330636441707611, 0.00013913214206695557, 0.00014520063996315002, 0.00015126913785934448, 0.00015733763575553894, 0.0001634061336517334, 0.00016947463154792786, 0.00017554312944412231, 0.00018161162734031677, 0.00018768012523651123, 0.0001937486231327057, 0.00019981712102890015, 0.0002058856189250946, 0.00021195411682128906]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 0.0, 2.0, 6.0, 3.0, 4.0, 2.0, 4.0, 6.0, 13.0, 19.0, 24.0, 34.0, 72.0, 112.0, 206.0, 379.0, 695.0, 1464.0, 3113.0, 7300.0, 18539.0, 51252.0, 138360.0, 333102.0, 292729.0, 125502.0, 46027.0, 17081.0, 6773.0, 2841.0, 1415.0, 658.0, 354.0, 202.0, 100.0, 67.0, 26.0, 18.0, 14.0, 10.0, 6.0, 6.0, 5.0, 9.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59619140625, -0.574859619140625, -0.55352783203125, -0.532196044921875, -0.5108642578125, -0.489532470703125, -0.46820068359375, -0.446868896484375, -0.425537109375, -0.404205322265625, -0.38287353515625, -0.361541748046875, -0.3402099609375, -0.318878173828125, -0.29754638671875, -0.276214599609375, -0.2548828125, -0.233551025390625, -0.21221923828125, -0.190887451171875, -0.1695556640625, -0.148223876953125, -0.12689208984375, -0.105560302734375, -0.084228515625, -0.062896728515625, -0.04156494140625, -0.020233154296875, 0.0010986328125, 0.022430419921875, 0.04376220703125, 0.065093994140625, 0.08642578125, 0.107757568359375, 0.12908935546875, 0.150421142578125, 0.1717529296875, 0.193084716796875, 0.21441650390625, 0.235748291015625, 0.257080078125, 0.278411865234375, 0.29974365234375, 0.321075439453125, 0.3424072265625, 0.363739013671875, 0.38507080078125, 0.406402587890625, 0.427734375, 0.449066162109375, 0.47039794921875, 0.491729736328125, 0.5130615234375, 0.534393310546875, 0.55572509765625, 0.577056884765625, 0.598388671875, 0.619720458984375, 0.64105224609375, 0.662384033203125, 0.6837158203125, 0.705047607421875, 0.72637939453125, 0.747711181640625, 0.76904296875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 5.0, 1.0, 5.0, 9.0, 11.0, 3.0, 11.0, 12.0, 15.0, 23.0, 34.0, 46.0, 54.0, 75.0, 83.0, 100.0, 75.0, 69.0, 75.0, 53.0, 43.0, 54.0, 28.0, 32.0, 17.0, 8.0, 9.0, 12.0, 9.0, 5.0, 1.0, 7.0, 6.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7275390625, -0.700775146484375, -0.67401123046875, -0.647247314453125, -0.6204833984375, -0.593719482421875, -0.56695556640625, -0.540191650390625, -0.513427734375, -0.486663818359375, -0.45989990234375, -0.433135986328125, -0.4063720703125, -0.379608154296875, -0.35284423828125, -0.326080322265625, -0.29931640625, -0.272552490234375, -0.24578857421875, -0.219024658203125, -0.1922607421875, -0.165496826171875, -0.13873291015625, -0.111968994140625, -0.085205078125, -0.058441162109375, -0.03167724609375, -0.004913330078125, 0.0218505859375, 0.048614501953125, 0.07537841796875, 0.102142333984375, 0.12890625, 0.155670166015625, 0.18243408203125, 0.209197998046875, 0.2359619140625, 0.262725830078125, 0.28948974609375, 0.316253662109375, 0.343017578125, 0.369781494140625, 0.39654541015625, 0.423309326171875, 0.4500732421875, 0.476837158203125, 0.50360107421875, 0.530364990234375, 0.55712890625, 0.583892822265625, 0.61065673828125, 0.637420654296875, 0.6641845703125, 0.690948486328125, 0.71771240234375, 0.744476318359375, 0.771240234375, 0.798004150390625, 0.82476806640625, 0.851531982421875, 0.8782958984375, 0.905059814453125, 0.93182373046875, 0.958587646484375, 0.9853515625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 2.0, 4.0, 9.0, 12.0, 34.0, 52.0, 143.0, 223.0, 232.0, 174.0, 70.0, 21.0, 14.0, 8.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.539241790771484, -38.65019607543945, -37.76115036010742, -36.87210464477539, -35.98305892944336, -35.09400939941406, -34.20496368408203, -33.31591796875, -32.42687225341797, -31.537826538085938, -30.648780822753906, -29.759735107421875, -28.87068748474121, -27.98164176940918, -27.09259605407715, -26.203550338745117, -25.314504623413086, -24.425458908081055, -23.536413192749023, -22.64736557006836, -21.758319854736328, -20.869274139404297, -19.980228424072266, -19.091182708740234, -18.202136993408203, -17.313091278076172, -16.42404556274414, -15.534998893737793, -14.645952224731445, -13.756906509399414, -12.867860794067383, -11.978815078735352, -11.089767456054688, -10.200721740722656, -9.311675071716309, -8.422629356384277, -7.533583164215088, -6.644536972045898, -5.755491256713867, -4.866445064544678, -3.9773988723754883, -3.088352680206299, -2.1993067264556885, -1.3102607727050781, -0.42121458053588867, 0.4678316116333008, 1.356877326965332, 2.2459235191345215, 3.134969711303711, 4.0240159034729, 4.91306209564209, 5.802107810974121, 6.6911540031433105, 7.5802001953125, 8.469245910644531, 9.358291625976562, 10.24733829498291, 11.136384010314941, 12.025430679321289, 12.91447639465332, 13.803522109985352, 14.6925687789917, 15.58161449432373, 16.470661163330078, 17.35970687866211]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 4.0, 5.0, 7.0, 4.0, 7.0, 7.0, 13.0, 7.0, 19.0, 14.0, 23.0, 22.0, 27.0, 31.0, 30.0, 31.0, 35.0, 35.0, 44.0, 45.0, 30.0, 51.0, 42.0, 31.0, 41.0, 32.0, 33.0, 31.0, 38.0, 21.0, 34.0, 28.0, 16.0, 29.0, 22.0, 16.0, 18.0, 16.0, 16.0, 7.0, 8.0, 10.0, 6.0, 4.0, 3.0, 7.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.169981002807617, -10.834380149841309, -10.498779296875, -10.163177490234375, -9.827576637268066, -9.491975784301758, -9.156373977661133, -8.820773124694824, -8.485172271728516, -8.149571418762207, -7.81397008895874, -7.478368759155273, -7.142767906188965, -6.807167053222656, -6.4715657234191895, -6.135964393615723, -5.800363540649414, -5.4647626876831055, -5.129161357879639, -4.793560028076172, -4.457959175109863, -4.122358322143555, -3.786756992340088, -3.4511559009552, -3.1155548095703125, -2.779953718185425, -2.444352626800537, -2.1087515354156494, -1.7731504440307617, -1.437549352645874, -1.1019482612609863, -0.7663471698760986, -0.43074607849121094, -0.09514498710632324, 0.24045610427856445, 0.5760571956634521, 0.9116582870483398, 1.2472593784332275, 1.5828604698181152, 1.918461561203003, 2.2540626525878906, 2.5896637439727783, 2.925264835357666, 3.2608659267425537, 3.5964670181274414, 3.932068109512329, 4.267669200897217, 4.603270530700684, 4.938871383666992, 5.274472236633301, 5.610073566436768, 5.945674896240234, 6.281275749206543, 6.616876602172852, 6.952477931976318, 7.288079261779785, 7.623680114746094, 7.959280967712402, 8.294881820678711, 8.630483627319336, 8.966084480285645, 9.301685333251953, 9.637287139892578, 9.972887992858887, 10.308488845825195]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 11.0, 13.0, 22.0, 37.0, 49.0, 80.0, 149.0, 288.0, 444.0, 802.0, 1704.0, 3287.0, 7357.0, 19788.0, 63355.0, 211403.0, 604601.0, 1172053.0, 1183315.0, 626819.0, 209585.0, 57103.0, 17982.0, 7185.0, 3149.0, 1696.0, 809.0, 482.0, 277.0, 160.0, 103.0, 61.0, 27.0, 23.0, 19.0, 13.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8154296875, -1.7505950927734375, -1.685760498046875, -1.6209259033203125, -1.55609130859375, -1.4912567138671875, -1.426422119140625, -1.3615875244140625, -1.2967529296875, -1.2319183349609375, -1.167083740234375, -1.1022491455078125, -1.03741455078125, -0.9725799560546875, -0.907745361328125, -0.8429107666015625, -0.778076171875, -0.7132415771484375, -0.648406982421875, -0.5835723876953125, -0.51873779296875, -0.4539031982421875, -0.389068603515625, -0.3242340087890625, -0.2593994140625, -0.1945648193359375, -0.129730224609375, -0.0648956298828125, -6.103515625e-05, 0.0647735595703125, 0.129608154296875, 0.1944427490234375, 0.25927734375, 0.3241119384765625, 0.388946533203125, 0.4537811279296875, 0.51861572265625, 0.5834503173828125, 0.648284912109375, 0.7131195068359375, 0.7779541015625, 0.8427886962890625, 0.907623291015625, 0.9724578857421875, 1.03729248046875, 1.1021270751953125, 1.166961669921875, 1.2317962646484375, 1.296630859375, 1.3614654541015625, 1.426300048828125, 1.4911346435546875, 1.55596923828125, 1.6208038330078125, 1.685638427734375, 1.7504730224609375, 1.8153076171875, 1.8801422119140625, 1.944976806640625, 2.0098114013671875, 2.07464599609375, 2.1394805908203125, 2.204315185546875, 2.2691497802734375, 2.333984375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 5.0, 10.0, 9.0, 3.0, 13.0, 17.0, 26.0, 24.0, 14.0, 22.0, 25.0, 42.0, 25.0, 37.0, 38.0, 49.0, 36.0, 59.0, 44.0, 49.0, 44.0, 37.0, 47.0, 38.0, 40.0, 37.0, 33.0, 23.0, 30.0, 18.0, 12.0, 16.0, 9.0, 16.0, 14.0, 7.0, 4.0, 12.0, 4.0, 1.0, 3.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6669921875, -1.6116485595703125, -1.556304931640625, -1.5009613037109375, -1.44561767578125, -1.3902740478515625, -1.334930419921875, -1.2795867919921875, -1.2242431640625, -1.1688995361328125, -1.113555908203125, -1.0582122802734375, -1.00286865234375, -0.9475250244140625, -0.892181396484375, -0.8368377685546875, -0.781494140625, -0.7261505126953125, -0.670806884765625, -0.6154632568359375, -0.56011962890625, -0.5047760009765625, -0.449432373046875, -0.3940887451171875, -0.3387451171875, -0.2834014892578125, -0.228057861328125, -0.1727142333984375, -0.11737060546875, -0.0620269775390625, -0.006683349609375, 0.0486602783203125, 0.10400390625, 0.1593475341796875, 0.214691162109375, 0.2700347900390625, 0.32537841796875, 0.3807220458984375, 0.436065673828125, 0.4914093017578125, 0.5467529296875, 0.6020965576171875, 0.657440185546875, 0.7127838134765625, 0.76812744140625, 0.8234710693359375, 0.878814697265625, 0.9341583251953125, 0.989501953125, 1.0448455810546875, 1.100189208984375, 1.1555328369140625, 1.21087646484375, 1.2662200927734375, 1.321563720703125, 1.3769073486328125, 1.4322509765625, 1.4875946044921875, 1.542938232421875, 1.5982818603515625, 1.65362548828125, 1.7089691162109375, 1.764312744140625, 1.8196563720703125, 1.875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 8.0, 15.0, 19.0, 27.0, 47.0, 47.0, 92.0, 141.0, 235.0, 350.0, 628.0, 1216.0, 2623.0, 6761.0, 21273.0, 93534.0, 649007.0, 2718261.0, 582243.0, 86046.0, 20156.0, 6373.0, 2562.0, 1118.0, 609.0, 369.0, 174.0, 115.0, 73.0, 48.0, 34.0, 20.0, 11.0, 8.0, 10.0, 10.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.931640625, -3.8238525390625, -3.716064453125, -3.6082763671875, -3.50048828125, -3.3927001953125, -3.284912109375, -3.1771240234375, -3.0693359375, -2.9615478515625, -2.853759765625, -2.7459716796875, -2.63818359375, -2.5303955078125, -2.422607421875, -2.3148193359375, -2.20703125, -2.0992431640625, -1.991455078125, -1.8836669921875, -1.77587890625, -1.6680908203125, -1.560302734375, -1.4525146484375, -1.3447265625, -1.2369384765625, -1.129150390625, -1.0213623046875, -0.91357421875, -0.8057861328125, -0.697998046875, -0.5902099609375, -0.482421875, -0.3746337890625, -0.266845703125, -0.1590576171875, -0.05126953125, 0.0565185546875, 0.164306640625, 0.2720947265625, 0.3798828125, 0.4876708984375, 0.595458984375, 0.7032470703125, 0.81103515625, 0.9188232421875, 1.026611328125, 1.1343994140625, 1.2421875, 1.3499755859375, 1.457763671875, 1.5655517578125, 1.67333984375, 1.7811279296875, 1.888916015625, 1.9967041015625, 2.1044921875, 2.2122802734375, 2.320068359375, 2.4278564453125, 2.53564453125, 2.6434326171875, 2.751220703125, 2.8590087890625, 2.966796875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 2.0, 4.0, 2.0, 8.0, 16.0, 20.0, 24.0, 34.0, 48.0, 81.0, 83.0, 146.0, 191.0, 282.0, 381.0, 448.0, 494.0, 436.0, 391.0, 272.0, 210.0, 149.0, 112.0, 64.0, 40.0, 45.0, 28.0, 16.0, 14.0, 11.0, 9.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.826171875, -3.696136474609375, -3.56610107421875, -3.436065673828125, -3.3060302734375, -3.175994873046875, -3.04595947265625, -2.915924072265625, -2.785888671875, -2.655853271484375, -2.52581787109375, -2.395782470703125, -2.2657470703125, -2.135711669921875, -2.00567626953125, -1.875640869140625, -1.74560546875, -1.615570068359375, -1.48553466796875, -1.355499267578125, -1.2254638671875, -1.095428466796875, -0.96539306640625, -0.835357666015625, -0.705322265625, -0.575286865234375, -0.44525146484375, -0.315216064453125, -0.1851806640625, -0.055145263671875, 0.07489013671875, 0.204925537109375, 0.3349609375, 0.464996337890625, 0.59503173828125, 0.725067138671875, 0.8551025390625, 0.985137939453125, 1.11517333984375, 1.245208740234375, 1.375244140625, 1.505279541015625, 1.63531494140625, 1.765350341796875, 1.8953857421875, 2.025421142578125, 2.15545654296875, 2.285491943359375, 2.41552734375, 2.545562744140625, 2.67559814453125, 2.805633544921875, 2.9356689453125, 3.065704345703125, 3.19573974609375, 3.325775146484375, 3.455810546875, 3.585845947265625, 3.71588134765625, 3.845916748046875, 3.9759521484375, 4.105987548828125, 4.23602294921875, 4.366058349609375, 4.49609375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 13.0, 18.0, 52.0, 68.0, 121.0, 148.0, 189.0, 139.0, 96.0, 56.0, 31.0, 23.0, 17.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.293617248535156, -56.54188919067383, -54.7901611328125, -53.03843307495117, -51.286705017089844, -49.53497314453125, -47.78324890136719, -46.031517028808594, -44.279788970947266, -42.52806091308594, -40.77633285522461, -39.02460479736328, -37.27287673950195, -35.521148681640625, -33.76941680908203, -32.0176887512207, -30.265962600708008, -28.51423454284668, -26.76250648498535, -25.01077651977539, -23.259048461914062, -21.507320404052734, -19.755592346191406, -18.003864288330078, -16.25213623046875, -14.500408172607422, -12.748679161071777, -10.99695110321045, -9.245222091674805, -7.493494033813477, -5.741765975952148, -3.990036964416504, -2.2383079528808594, -0.4865795373916626, 1.2651488780975342, 3.0168771743774414, 4.768605709075928, 6.520334243774414, 8.272062301635742, 10.023791313171387, 11.775519371032715, 13.527247428894043, 15.278976440429688, 17.030704498291016, 18.782432556152344, 20.534160614013672, 22.285888671875, 24.03761863708496, 25.78934669494629, 27.541074752807617, 29.292802810668945, 31.044532775878906, 32.796260833740234, 34.54798889160156, 36.29971694946289, 38.05144500732422, 39.80317306518555, 41.554901123046875, 43.3066291809082, 45.05835723876953, 46.81008529663086, 48.56181335449219, 50.31354522705078, 52.06527328491211, 53.81700134277344]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 8.0, 13.0, 10.0, 15.0, 19.0, 16.0, 15.0, 25.0, 26.0, 20.0, 31.0, 33.0, 35.0, 47.0, 45.0, 54.0, 50.0, 44.0, 48.0, 34.0, 39.0, 41.0, 36.0, 34.0, 39.0, 33.0, 26.0, 25.0, 24.0, 16.0, 15.0, 13.0, 15.0, 18.0, 10.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-17.511730194091797, -17.03697967529297, -16.56222915649414, -16.087478637695312, -15.6127290725708, -15.137979507446289, -14.663228988647461, -14.188478469848633, -13.713727951049805, -13.238977432250977, -12.764227867126465, -12.289477348327637, -11.814726829528809, -11.339977264404297, -10.865226745605469, -10.39047622680664, -9.915725708007812, -9.440975189208984, -8.966225624084473, -8.491475105285645, -8.016724586486816, -7.5419745445251465, -7.067224502563477, -6.592473983764648, -6.117724418640137, -5.642974376678467, -5.168223857879639, -4.693473815917969, -4.218723297119141, -3.7439732551574707, -3.2692229747772217, -2.7944726943969727, -2.3197221755981445, -1.8449718952178955, -1.3702216148376465, -0.895471453666687, -0.420721173286438, 0.054028987884521484, 0.5287792682647705, 1.0035295486450195, 1.4782798290252686, 1.9530301094055176, 2.4277803897857666, 2.9025306701660156, 3.3772807121276855, 3.8520309925079346, 4.326781272888184, 4.801531791687012, 5.276281833648682, 5.751031875610352, 6.22578239440918, 6.70053243637085, 7.175282955169678, 7.650032997131348, 8.124783515930176, 8.599533081054688, 9.074283599853516, 9.549034118652344, 10.023783683776855, 10.498534202575684, 10.973284721374512, 11.448034286499023, 11.922784805297852, 12.39753532409668, 12.872285842895508]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 6.0, 9.0, 13.0, 18.0, 18.0, 30.0, 40.0, 71.0, 75.0, 99.0, 170.0, 225.0, 315.0, 440.0, 705.0, 1134.0, 1710.0, 3060.0, 5253.0, 9652.0, 18970.0, 40304.0, 93632.0, 223291.0, 329154.0, 178497.0, 73811.0, 32560.0, 15567.0, 8048.0, 4393.0, 2720.0, 1587.0, 975.0, 648.0, 395.0, 267.0, 214.0, 133.0, 97.0, 66.0, 55.0, 37.0, 21.0, 16.0, 12.0, 14.0, 6.0, 6.0, 2.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.3681640625, -1.3245391845703125, -1.280914306640625, -1.2372894287109375, -1.19366455078125, -1.1500396728515625, -1.106414794921875, -1.0627899169921875, -1.0191650390625, -0.9755401611328125, -0.931915283203125, -0.8882904052734375, -0.84466552734375, -0.8010406494140625, -0.757415771484375, -0.7137908935546875, -0.670166015625, -0.6265411376953125, -0.582916259765625, -0.5392913818359375, -0.49566650390625, -0.4520416259765625, -0.408416748046875, -0.3647918701171875, -0.3211669921875, -0.2775421142578125, -0.233917236328125, -0.1902923583984375, -0.14666748046875, -0.1030426025390625, -0.059417724609375, -0.0157928466796875, 0.02783203125, 0.0714569091796875, 0.115081787109375, 0.1587066650390625, 0.20233154296875, 0.2459564208984375, 0.289581298828125, 0.3332061767578125, 0.3768310546875, 0.4204559326171875, 0.464080810546875, 0.5077056884765625, 0.55133056640625, 0.5949554443359375, 0.638580322265625, 0.6822052001953125, 0.725830078125, 0.7694549560546875, 0.813079833984375, 0.8567047119140625, 0.90032958984375, 0.9439544677734375, 0.987579345703125, 1.0312042236328125, 1.0748291015625, 1.1184539794921875, 1.162078857421875, 1.2057037353515625, 1.24932861328125, 1.2929534912109375, 1.336578369140625, 1.3802032470703125, 1.423828125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 0.0, 6.0, 4.0, 7.0, 2.0, 5.0, 10.0, 9.0, 13.0, 18.0, 12.0, 25.0, 26.0, 20.0, 20.0, 28.0, 37.0, 36.0, 31.0, 47.0, 44.0, 54.0, 60.0, 46.0, 28.0, 46.0, 45.0, 45.0, 37.0, 34.0, 28.0, 22.0, 21.0, 31.0, 16.0, 20.0, 9.0, 10.0, 14.0, 4.0, 11.0, 6.0, 2.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.501953125, -2.4256591796875, -2.349365234375, -2.2730712890625, -2.19677734375, -2.1204833984375, -2.044189453125, -1.9678955078125, -1.8916015625, -1.8153076171875, -1.739013671875, -1.6627197265625, -1.58642578125, -1.5101318359375, -1.433837890625, -1.3575439453125, -1.28125, -1.2049560546875, -1.128662109375, -1.0523681640625, -0.97607421875, -0.8997802734375, -0.823486328125, -0.7471923828125, -0.6708984375, -0.5946044921875, -0.518310546875, -0.4420166015625, -0.36572265625, -0.2894287109375, -0.213134765625, -0.1368408203125, -0.060546875, 0.0157470703125, 0.092041015625, 0.1683349609375, 0.24462890625, 0.3209228515625, 0.397216796875, 0.4735107421875, 0.5498046875, 0.6260986328125, 0.702392578125, 0.7786865234375, 0.85498046875, 0.9312744140625, 1.007568359375, 1.0838623046875, 1.16015625, 1.2364501953125, 1.312744140625, 1.3890380859375, 1.46533203125, 1.5416259765625, 1.617919921875, 1.6942138671875, 1.7705078125, 1.8468017578125, 1.923095703125, 1.9993896484375, 2.07568359375, 2.1519775390625, 2.228271484375, 2.3045654296875, 2.380859375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 6.0, 7.0, 9.0, 9.0, 14.0, 26.0, 29.0, 53.0, 88.0, 126.0, 244.0, 330.0, 723.0, 1455.0, 3331.0, 7798.0, 21698.0, 73276.0, 338759.0, 474260.0, 85876.0, 24394.0, 8817.0, 3657.0, 1711.0, 855.0, 457.0, 222.0, 138.0, 75.0, 44.0, 29.0, 16.0, 10.0, 7.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8271484375, -1.7642669677734375, -1.701385498046875, -1.6385040283203125, -1.57562255859375, -1.5127410888671875, -1.449859619140625, -1.3869781494140625, -1.3240966796875, -1.2612152099609375, -1.198333740234375, -1.1354522705078125, -1.07257080078125, -1.0096893310546875, -0.946807861328125, -0.8839263916015625, -0.821044921875, -0.7581634521484375, -0.695281982421875, -0.6324005126953125, -0.56951904296875, -0.5066375732421875, -0.443756103515625, -0.3808746337890625, -0.3179931640625, -0.2551116943359375, -0.192230224609375, -0.1293487548828125, -0.06646728515625, -0.0035858154296875, 0.059295654296875, 0.1221771240234375, 0.18505859375, 0.2479400634765625, 0.310821533203125, 0.3737030029296875, 0.43658447265625, 0.4994659423828125, 0.562347412109375, 0.6252288818359375, 0.6881103515625, 0.7509918212890625, 0.813873291015625, 0.8767547607421875, 0.93963623046875, 1.0025177001953125, 1.065399169921875, 1.1282806396484375, 1.191162109375, 1.2540435791015625, 1.316925048828125, 1.3798065185546875, 1.44268798828125, 1.5055694580078125, 1.568450927734375, 1.6313323974609375, 1.6942138671875, 1.7570953369140625, 1.819976806640625, 1.8828582763671875, 1.94573974609375, 2.0086212158203125, 2.071502685546875, 2.1343841552734375, 2.197265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 9.0, 7.0, 8.0, 9.0, 20.0, 17.0, 23.0, 22.0, 24.0, 44.0, 45.0, 68.0, 73.0, 71.0, 79.0, 59.0, 60.0, 68.0, 54.0, 58.0, 26.0, 30.0, 36.0, 26.0, 19.0, 15.0, 4.0, 4.0, 8.0, 2.0, 1.0, 5.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.14495849609375, -4.9188232421875, -4.69268798828125, -4.466552734375, -4.24041748046875, -4.0142822265625, -3.78814697265625, -3.56201171875, -3.33587646484375, -3.1097412109375, -2.88360595703125, -2.657470703125, -2.43133544921875, -2.2052001953125, -1.97906494140625, -1.7529296875, -1.52679443359375, -1.3006591796875, -1.07452392578125, -0.848388671875, -0.62225341796875, -0.3961181640625, -0.16998291015625, 0.05615234375, 0.28228759765625, 0.5084228515625, 0.73455810546875, 0.960693359375, 1.18682861328125, 1.4129638671875, 1.63909912109375, 1.865234375, 2.09136962890625, 2.3175048828125, 2.54364013671875, 2.769775390625, 2.99591064453125, 3.2220458984375, 3.44818115234375, 3.67431640625, 3.90045166015625, 4.1265869140625, 4.35272216796875, 4.578857421875, 4.80499267578125, 5.0311279296875, 5.25726318359375, 5.4833984375, 5.70953369140625, 5.9356689453125, 6.16180419921875, 6.387939453125, 6.61407470703125, 6.8402099609375, 7.06634521484375, 7.29248046875, 7.51861572265625, 7.7447509765625, 7.97088623046875, 8.197021484375, 8.42315673828125, 8.6492919921875, 8.87542724609375, 9.1015625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 7.0, 9.0, 10.0, 13.0, 25.0, 23.0, 34.0, 61.0, 102.0, 180.0, 342.0, 945.0, 2315.0, 7242.0, 34184.0, 234676.0, 651418.0, 93438.0, 16484.0, 4285.0, 1446.0, 606.0, 288.0, 151.0, 87.0, 42.0, 32.0, 26.0, 18.0, 11.0, 8.0, 8.0, 10.0, 7.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63134765625, -0.611785888671875, -0.59222412109375, -0.572662353515625, -0.5531005859375, -0.533538818359375, -0.51397705078125, -0.494415283203125, -0.474853515625, -0.455291748046875, -0.43572998046875, -0.416168212890625, -0.3966064453125, -0.377044677734375, -0.35748291015625, -0.337921142578125, -0.318359375, -0.298797607421875, -0.27923583984375, -0.259674072265625, -0.2401123046875, -0.220550537109375, -0.20098876953125, -0.181427001953125, -0.161865234375, -0.142303466796875, -0.12274169921875, -0.103179931640625, -0.0836181640625, -0.064056396484375, -0.04449462890625, -0.024932861328125, -0.00537109375, 0.014190673828125, 0.03375244140625, 0.053314208984375, 0.0728759765625, 0.092437744140625, 0.11199951171875, 0.131561279296875, 0.151123046875, 0.170684814453125, 0.19024658203125, 0.209808349609375, 0.2293701171875, 0.248931884765625, 0.26849365234375, 0.288055419921875, 0.3076171875, 0.327178955078125, 0.34674072265625, 0.366302490234375, 0.3858642578125, 0.405426025390625, 0.42498779296875, 0.444549560546875, 0.464111328125, 0.483673095703125, 0.50323486328125, 0.522796630859375, 0.5423583984375, 0.561920166015625, 0.58148193359375, 0.601043701171875, 0.62060546875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 10.0, 4.0, 8.0, 14.0, 18.0, 18.0, 16.0, 42.0, 42.0, 70.0, 82.0, 87.0, 109.0, 117.0, 75.0, 56.0, 53.0, 39.0, 21.0, 27.0, 22.0, 8.0, 9.0, 11.0, 10.0, 7.0, 3.0, 2.0, 1.0, 4.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00018084049224853516, -0.00017603673040866852, -0.00017123296856880188, -0.00016642920672893524, -0.0001616254448890686, -0.00015682168304920197, -0.00015201792120933533, -0.0001472141593694687, -0.00014241039752960205, -0.0001376066356897354, -0.00013280287384986877, -0.00012799911201000214, -0.0001231953501701355, -0.00011839158833026886, -0.00011358782649040222, -0.00010878406465053558, -0.00010398030281066895, -9.917654097080231e-05, -9.437277913093567e-05, -8.956901729106903e-05, -8.476525545120239e-05, -7.996149361133575e-05, -7.515773177146912e-05, -7.035396993160248e-05, -6.555020809173584e-05, -6.07464462518692e-05, -5.5942684412002563e-05, -5.1138922572135925e-05, -4.633516073226929e-05, -4.153139889240265e-05, -3.672763705253601e-05, -3.192387521266937e-05, -2.7120113372802734e-05, -2.2316351532936096e-05, -1.7512589693069458e-05, -1.270882785320282e-05, -7.905066013336182e-06, -3.1013041734695435e-06, 1.7024576663970947e-06, 6.506219506263733e-06, 1.1309981346130371e-05, 1.611374318599701e-05, 2.0917505025863647e-05, 2.5721266865730286e-05, 3.0525028705596924e-05, 3.532879054546356e-05, 4.01325523853302e-05, 4.493631422519684e-05, 4.9740076065063477e-05, 5.4543837904930115e-05, 5.934759974479675e-05, 6.415136158466339e-05, 6.895512342453003e-05, 7.375888526439667e-05, 7.85626471042633e-05, 8.336640894412994e-05, 8.817017078399658e-05, 9.297393262386322e-05, 9.777769446372986e-05, 0.0001025814563035965, 0.00010738521814346313, 0.00011218897998332977, 0.00011699274182319641, 0.00012179650366306305, 0.0001266002655029297]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 5.0, 2.0, 3.0, 7.0, 6.0, 15.0, 26.0, 35.0, 52.0, 70.0, 115.0, 183.0, 385.0, 704.0, 1602.0, 3646.0, 11266.0, 42156.0, 209956.0, 597906.0, 136984.0, 29461.0, 8457.0, 2873.0, 1236.0, 597.0, 331.0, 182.0, 104.0, 72.0, 38.0, 15.0, 16.0, 13.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.755859375, -0.7356338500976562, -0.7154083251953125, -0.6951828002929688, -0.674957275390625, -0.6547317504882812, -0.6345062255859375, -0.6142807006835938, -0.59405517578125, -0.5738296508789062, -0.5536041259765625, -0.5333786010742188, -0.513153076171875, -0.49292755126953125, -0.4727020263671875, -0.45247650146484375, -0.4322509765625, -0.41202545166015625, -0.3917999267578125, -0.37157440185546875, -0.351348876953125, -0.33112335205078125, -0.3108978271484375, -0.29067230224609375, -0.27044677734375, -0.25022125244140625, -0.2299957275390625, -0.20977020263671875, -0.189544677734375, -0.16931915283203125, -0.1490936279296875, -0.12886810302734375, -0.108642578125, -0.08841705322265625, -0.0681915283203125, -0.04796600341796875, -0.027740478515625, -0.00751495361328125, 0.0127105712890625, 0.03293609619140625, 0.05316162109375, 0.07338714599609375, 0.0936126708984375, 0.11383819580078125, 0.134063720703125, 0.15428924560546875, 0.1745147705078125, 0.19474029541015625, 0.2149658203125, 0.23519134521484375, 0.2554168701171875, 0.27564239501953125, 0.295867919921875, 0.31609344482421875, 0.3363189697265625, 0.35654449462890625, 0.37677001953125, 0.39699554443359375, 0.4172210693359375, 0.43744659423828125, 0.457672119140625, 0.47789764404296875, 0.4981231689453125, 0.5183486938476562, 0.53857421875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 5.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 14.0, 15.0, 27.0, 29.0, 35.0, 39.0, 48.0, 50.0, 66.0, 81.0, 66.0, 71.0, 67.0, 84.0, 46.0, 49.0, 35.0, 37.0, 24.0, 18.0, 15.0, 12.0, 10.0, 6.0, 5.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.60498046875, -0.586181640625, -0.5673828125, -0.548583984375, -0.52978515625, -0.510986328125, -0.4921875, -0.473388671875, -0.45458984375, -0.435791015625, -0.4169921875, -0.398193359375, -0.37939453125, -0.360595703125, -0.341796875, -0.322998046875, -0.30419921875, -0.285400390625, -0.2666015625, -0.247802734375, -0.22900390625, -0.210205078125, -0.19140625, -0.172607421875, -0.15380859375, -0.135009765625, -0.1162109375, -0.097412109375, -0.07861328125, -0.059814453125, -0.041015625, -0.022216796875, -0.00341796875, 0.015380859375, 0.0341796875, 0.052978515625, 0.07177734375, 0.090576171875, 0.109375, 0.128173828125, 0.14697265625, 0.165771484375, 0.1845703125, 0.203369140625, 0.22216796875, 0.240966796875, 0.259765625, 0.278564453125, 0.29736328125, 0.316162109375, 0.3349609375, 0.353759765625, 0.37255859375, 0.391357421875, 0.41015625, 0.428955078125, 0.44775390625, 0.466552734375, 0.4853515625, 0.504150390625, 0.52294921875, 0.541748046875, 0.560546875, 0.579345703125, 0.59814453125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 9.0, 11.0, 7.0, 17.0, 25.0, 48.0, 61.0, 94.0, 142.0, 168.0, 157.0, 84.0, 68.0, 44.0, 19.0, 16.0, 7.0, 5.0, 7.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.344114303588867, -10.865782737731934, -10.387450218200684, -9.90911865234375, -9.430787086486816, -8.952454566955566, -8.474123001098633, -7.995790958404541, -7.517458915710449, -7.039126873016357, -6.560795307159424, -6.082463264465332, -5.60413122177124, -5.125799179077148, -4.647467613220215, -4.169135570526123, -3.6908040046691895, -3.2124722003936768, -2.734140157699585, -2.2558083534240723, -1.77747642993927, -1.2991445064544678, -0.8208127021789551, -0.3424806594848633, 0.13585114479064941, 0.6141830682754517, 1.092514991760254, 1.5708467960357666, 2.0491786003112793, 2.527510643005371, 3.005842447280884, 3.4841744899749756, 3.9625062942504883, 4.44083833694458, 4.919169902801514, 5.3975019454956055, 5.875833988189697, 6.354166030883789, 6.832497596740723, 7.3108296394348145, 7.789161682128906, 8.26749324798584, 8.74582576751709, 9.224157333374023, 9.702488899230957, 10.180821418762207, 10.65915298461914, 11.13748550415039, 11.615816116333008, 12.094147682189941, 12.572480201721191, 13.050811767578125, 13.529143333435059, 14.007475852966309, 14.485807418823242, 14.964139938354492, 15.442471504211426, 15.92080307006836, 16.39913558959961, 16.87746810913086, 17.355798721313477, 17.834131240844727, 18.312461853027344, 18.790794372558594, 19.269126892089844]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 8.0, 12.0, 4.0, 12.0, 10.0, 12.0, 16.0, 17.0, 28.0, 25.0, 28.0, 28.0, 26.0, 36.0, 48.0, 50.0, 43.0, 62.0, 66.0, 60.0, 59.0, 45.0, 41.0, 32.0, 27.0, 30.0, 37.0, 26.0, 27.0, 14.0, 14.0, 16.0, 8.0, 7.0, 8.0, 7.0, 4.0, 1.0, 6.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-17.014812469482422, -16.573213577270508, -16.131614685058594, -15.69001579284668, -15.248416900634766, -14.806818008422852, -14.365218162536621, -13.923619270324707, -13.482020378112793, -13.040421485900879, -12.598822593688965, -12.15722370147705, -11.71562385559082, -11.274024963378906, -10.832426071166992, -10.390827178955078, -9.949228286743164, -9.50762939453125, -9.066030502319336, -8.624431610107422, -8.182832717895508, -7.7412333488464355, -7.299633979797363, -6.858035087585449, -6.416436195373535, -5.974837303161621, -5.533238410949707, -5.091639041900635, -4.650040149688721, -4.208441257476807, -3.7668421268463135, -3.3252429962158203, -2.88364315032959, -2.442044258117676, -2.0004451274871826, -1.558846116065979, -1.1172471046447754, -0.6756482124328613, -0.23404908180236816, 0.207550048828125, 0.6491489410400391, 1.0907479524612427, 1.5323469638824463, 1.97394597530365, 2.4155449867248535, 2.8571438789367676, 3.2987430095672607, 3.740342140197754, 4.181941032409668, 4.623539924621582, 5.065138816833496, 5.506738185882568, 5.948337078094482, 6.3899359703063965, 6.831535339355469, 7.273134231567383, 7.714733123779297, 8.156332015991211, 8.597930908203125, 9.039529800415039, 9.481128692626953, 9.922727584838867, 10.364327430725098, 10.805926322937012, 11.247525215148926]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 4.0, 3.0, 3.0, 2.0, 3.0, 12.0, 8.0, 9.0, 9.0, 8.0, 10.0, 15.0, 20.0, 23.0, 28.0, 21.0, 29.0, 56.0, 132.0, 235.0, 97.0, 53.0, 34.0, 26.0, 24.0, 25.0, 19.0, 25.0, 15.0, 6.0, 11.0, 9.0, 5.0, 4.0, 2.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.29296875, -2.20941162109375, -2.1258544921875, -2.04229736328125, -1.958740234375, -1.87518310546875, -1.7916259765625, -1.70806884765625, -1.62451171875, -1.54095458984375, -1.4573974609375, -1.37384033203125, -1.290283203125, -1.20672607421875, -1.1231689453125, -1.03961181640625, -0.9560546875, -0.87249755859375, -0.7889404296875, -0.70538330078125, -0.621826171875, -0.53826904296875, -0.4547119140625, -0.37115478515625, -0.28759765625, -0.20404052734375, -0.1204833984375, -0.03692626953125, 0.046630859375, 0.13018798828125, 0.2137451171875, 0.29730224609375, 0.380859375, 0.46441650390625, 0.5479736328125, 0.63153076171875, 0.715087890625, 0.79864501953125, 0.8822021484375, 0.96575927734375, 1.04931640625, 1.13287353515625, 1.2164306640625, 1.29998779296875, 1.383544921875, 1.46710205078125, 1.5506591796875, 1.63421630859375, 1.7177734375, 1.80133056640625, 1.8848876953125, 1.96844482421875, 2.052001953125, 2.13555908203125, 2.2191162109375, 2.30267333984375, 2.38623046875, 2.46978759765625, 2.5533447265625, 2.63690185546875, 2.720458984375, 2.80401611328125, 2.8875732421875, 2.97113037109375, 3.0546875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 5.0, 10.0, 14.0, 20.0, 17.0, 31.0, 52.0, 72.0, 113.0, 209.0, 306.0, 616.0, 1184.0, 2482.0, 6369.0, 23912.0, 8082352.0, 247563.0, 14286.0, 4666.0, 2030.0, 930.0, 521.0, 275.0, 184.0, 110.0, 70.0, 48.0, 33.0, 25.0, 12.0, 14.0, 13.0, 12.0, 10.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.297609806060791, -5.0753374099731445, -4.853065013885498, -4.630792617797852, -4.408519744873047, -4.1862473487854, -3.963974952697754, -3.7417025566101074, -3.519429922103882, -3.2971575260162354, -3.0748848915100098, -2.8526124954223633, -2.630340099334717, -2.408067464828491, -2.1857950687408447, -1.9635225534439087, -1.7412500381469727, -1.5189775228500366, -1.2967050075531006, -1.074432611465454, -0.8521600961685181, -0.629887580871582, -0.40761518478393555, -0.1853426694869995, 0.03692984580993652, 0.25920233130455017, 0.4814748167991638, 0.7037472724914551, 0.9260197877883911, 1.1482923030853271, 1.3705646991729736, 1.5928372144699097, 1.815110206604004, 2.0373826026916504, 2.259655237197876, 2.4819276332855225, 2.704200267791748, 2.9264726638793945, 3.148745059967041, 3.3710174560546875, 3.593290090560913, 3.8155624866485596, 4.037835121154785, 4.260107517242432, 4.482379913330078, 4.704652786254883, 4.926924705505371, 5.149197578430176, 5.371469974517822, 5.593742370605469, 5.816014766693115, 6.038287162780762, 6.260560035705566, 6.482832431793213, 6.705104827880859, 6.927377223968506, 7.149649620056152, 7.371922016143799, 7.594194412231445, 7.81646728515625, 8.038739204406738, 8.261012077331543, 8.483283996582031, 8.705556869506836, 8.92782974243164]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 7.0, 4.0, 2.0, 5.0, 3.0, 4.0, 7.0, 4.0, 8.0, 2.0, 10.0, 5.0, 2.0, 1.0, 2.0, 5.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.423004150390625, -14.056509971618652, -13.690014839172363, -13.32352066040039, -12.957025527954102, -12.590531349182129, -12.224037170410156, -11.857542037963867, -11.491046905517578, -11.124552726745605, -10.758057594299316, -10.391563415527344, -10.025068283081055, -9.658574104309082, -9.29207992553711, -8.92558479309082, -8.559090614318848, -8.192596435546875, -7.826101303100586, -7.459607124328613, -7.093111991882324, -6.726617813110352, -6.360123157501221, -5.99362850189209, -5.627133846282959, -5.260639190673828, -4.894144535064697, -4.527649879455566, -4.161155700683594, -3.794660806655884, -3.428166389465332, -3.061671733856201, -2.695176124572754, -2.328681468963623, -1.9621869325637817, -1.5956923961639404, -1.2291977405548096, -0.8627030849456787, -0.49620866775512695, -0.1297140121459961, 0.23678064346313477, 0.6032752394676208, 0.9697698354721069, 1.3362643718719482, 1.702759027481079, 2.06925368309021, 2.4357481002807617, 2.8022427558898926, 3.1687374114990234, 3.5352320671081543, 3.901726722717285, 4.268220901489258, 4.634716033935547, 5.0012102127075195, 5.36770486831665, 5.734199523925781, 6.100694179534912, 6.467188835144043, 6.833683490753174, 7.200178146362305, 7.566672325134277, 7.933167457580566, 8.299661636352539, 8.666156768798828, 9.0326509475708]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 3.0, 9.0, 10.0, 12.0, 10.0, 24.0, 20.0, 26.0, 29.0, 36.0, 52.0, 38.0, 62.0, 55.0, 66.0, 53.0, 69.0, 64.0, 56.0, 43.0, 50.0, 41.0, 32.0, 33.0, 24.0, 19.0, 17.0, 17.0, 7.0, 11.0, 9.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.166015625, -2.0966796875, -2.02734375, -1.9580078125, -1.888671875, -1.8193359375, -1.75, -1.6806640625, -1.611328125, -1.5419921875, -1.47265625, -1.4033203125, -1.333984375, -1.2646484375, -1.1953125, -1.1259765625, -1.056640625, -0.9873046875, -0.91796875, -0.8486328125, -0.779296875, -0.7099609375, -0.640625, -0.5712890625, -0.501953125, -0.4326171875, -0.36328125, -0.2939453125, -0.224609375, -0.1552734375, -0.0859375, -0.0166015625, 0.052734375, 0.1220703125, 0.19140625, 0.2607421875, 0.330078125, 0.3994140625, 0.46875, 0.5380859375, 0.607421875, 0.6767578125, 0.74609375, 0.8154296875, 0.884765625, 0.9541015625, 1.0234375, 1.0927734375, 1.162109375, 1.2314453125, 1.30078125, 1.3701171875, 1.439453125, 1.5087890625, 1.578125, 1.6474609375, 1.716796875, 1.7861328125, 1.85546875, 1.9248046875, 1.994140625, 2.0634765625, 2.1328125, 2.2021484375, 2.271484375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 10.0, 21.0, 13.0, 27.0, 27.0, 50.0, 69.0, 92.0, 126.0, 194.0, 262.0, 384.0, 590.0, 909.0, 1593.0, 2691.0, 5343.0, 11715.0, 29861.0, 101588.0, 233130.0, 87293.0, 26239.0, 10527.0, 4842.0, 2529.0, 1424.0, 868.0, 542.0, 417.0, 262.0, 141.0, 129.0, 100.0, 64.0, 52.0, 36.0, 29.0, 16.0, 13.0, 9.0, 6.0, 6.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.484375, -24.673828125, -23.86328125, -23.052734375, -22.2421875, -21.431640625, -20.62109375, -19.810546875, -19.0, -18.189453125, -17.37890625, -16.568359375, -15.7578125, -14.947265625, -14.13671875, -13.326171875, -12.515625, -11.705078125, -10.89453125, -10.083984375, -9.2734375, -8.462890625, -7.65234375, -6.841796875, -6.03125, -5.220703125, -4.41015625, -3.599609375, -2.7890625, -1.978515625, -1.16796875, -0.357421875, 0.453125, 1.263671875, 2.07421875, 2.884765625, 3.6953125, 4.505859375, 5.31640625, 6.126953125, 6.9375, 7.748046875, 8.55859375, 9.369140625, 10.1796875, 10.990234375, 11.80078125, 12.611328125, 13.421875, 14.232421875, 15.04296875, 15.853515625, 16.6640625, 17.474609375, 18.28515625, 19.095703125, 19.90625, 20.716796875, 21.52734375, 22.337890625, 23.1484375, 23.958984375, 24.76953125, 25.580078125, 26.390625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 9.0, 11.0, 15.0, 12.0, 12.0, 17.0, 24.0, 21.0, 25.0, 24.0, 47.0, 41.0, 38.0, 44.0, 45.0, 50.0, 46.0, 45.0, 50.0, 52.0, 52.0, 52.0, 40.0, 33.0, 36.0, 17.0, 33.0, 21.0, 13.0, 14.0, 10.0, 3.0, 7.0, 8.0, 5.0, 8.0, 9.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.138671875, -2.067535400390625, -1.99639892578125, -1.925262451171875, -1.8541259765625, -1.782989501953125, -1.71185302734375, -1.640716552734375, -1.569580078125, -1.498443603515625, -1.42730712890625, -1.356170654296875, -1.2850341796875, -1.213897705078125, -1.14276123046875, -1.071624755859375, -1.00048828125, -0.929351806640625, -0.85821533203125, -0.787078857421875, -0.7159423828125, -0.644805908203125, -0.57366943359375, -0.502532958984375, -0.431396484375, -0.360260009765625, -0.28912353515625, -0.217987060546875, -0.1468505859375, -0.075714111328125, -0.00457763671875, 0.066558837890625, 0.1376953125, 0.208831787109375, 0.27996826171875, 0.351104736328125, 0.4222412109375, 0.493377685546875, 0.56451416015625, 0.635650634765625, 0.706787109375, 0.777923583984375, 0.84906005859375, 0.920196533203125, 0.9913330078125, 1.062469482421875, 1.13360595703125, 1.204742431640625, 1.27587890625, 1.347015380859375, 1.41815185546875, 1.489288330078125, 1.5604248046875, 1.631561279296875, 1.70269775390625, 1.773834228515625, 1.844970703125, 1.916107177734375, 1.98724365234375, 2.058380126953125, 2.1295166015625, 2.200653076171875, 2.27178955078125, 2.342926025390625, 2.4140625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 8.0, 4.0, 9.0, 9.0, 12.0, 17.0, 23.0, 30.0, 47.0, 51.0, 60.0, 43.0, 41.0, 22.0, 15.0, 12.0, 9.0, 10.0, 6.0, 8.0, 3.0, 3.0, 5.0, 6.0, 7.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-8.499866485595703, -8.27392292022705, -8.047980308532715, -7.822037220001221, -7.596094131469727, -7.370150566101074, -7.144207954406738, -6.918264389038086, -6.692321300506592, -6.466378211975098, -6.2404351234436035, -6.014492034912109, -5.788548946380615, -5.562605857849121, -5.336662292480469, -5.110719203948975, -4.8847761154174805, -4.658833026885986, -4.432889938354492, -4.206946849822998, -3.981003522872925, -3.7550604343414307, -3.5291173458099365, -3.3031740188598633, -3.0772314071655273, -2.851288318634033, -2.625345230102539, -2.399402141571045, -2.1734588146209717, -1.9475157260894775, -1.7215726375579834, -1.4956294298171997, -1.269686222076416, -1.0437431335449219, -0.8177999258041382, -0.591856837272644, -0.3659136891365051, -0.1399705410003662, 0.08597254753112793, 0.3119157552719116, 0.5378588438034058, 0.7638019919395447, 0.9897451400756836, 1.2156882286071777, 1.4416313171386719, 1.6675745248794556, 1.8935176134109497, 2.1194608211517334, 2.3454039096832275, 2.5713469982147217, 2.797290086746216, 3.023233413696289, 3.249176502227783, 3.4751195907592773, 3.7010626792907715, 3.9270057678222656, 4.15294885635376, 4.378891944885254, 4.604835033416748, 4.830778121948242, 5.056721210479736, 5.2826642990112305, 5.508607864379883, 5.734550952911377, 5.960494041442871]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 4.0, 2.0, 4.0, 0.0, 5.0, 9.0, 8.0, 7.0, 8.0, 9.0, 16.0, 31.0, 77.0, 108.0, 64.0, 33.0, 20.0, 6.0, 3.0, 11.0, 9.0, 5.0, 8.0, 6.0, 2.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.064303398132324, -8.723264694213867, -8.382225036621094, -8.04118537902832, -7.700146675109863, -7.359107494354248, -7.018068313598633, -6.677029132843018, -6.335989952087402, -5.994950771331787, -5.653911590576172, -5.312872409820557, -4.971833229064941, -4.630794048309326, -4.289754867553711, -3.9487156867980957, -3.6076765060424805, -3.2666373252868652, -2.92559814453125, -2.5845589637756348, -2.2435197830200195, -1.9024806022644043, -1.561441421508789, -1.2204022407531738, -0.8793630599975586, -0.5383238792419434, -0.19728469848632812, 0.1437544822692871, 0.48479366302490234, 0.8258328437805176, 1.1668720245361328, 1.507911205291748, 1.8489503860473633, 2.1899895668029785, 2.5310287475585938, 2.872067928314209, 3.213107109069824, 3.5541462898254395, 3.8951854705810547, 4.23622465133667, 4.577263832092285, 4.9183030128479, 5.259342193603516, 5.600381374359131, 5.941420555114746, 6.282459735870361, 6.623498916625977, 6.964538097381592, 7.305577278137207, 7.646616458892822, 7.9876556396484375, 8.328695297241211, 8.669734001159668, 9.010772705078125, 9.351812362670898, 9.692852020263672, 10.033890724182129, 10.374929428100586, 10.71596908569336, 11.057008743286133, 11.39804744720459, 11.739086151123047, 12.08012580871582, 12.421165466308594, 12.76220417022705]}, "eval/loss": 1.642454743385315, "eval/bleu": 2.691896075803751e-15, "eval/runtime": 2632.4174, "eval/samples_per_second": 5.607, "eval/steps_per_second": 0.701} \ No newline at end of file