diff --git "a/wandb/run-20220505_173748-b097rk18/files/wandb-summary.json" "b/wandb/run-20220505_173748-b097rk18/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220505_173748-b097rk18/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 2.6458, "train/learning_rate": 2.9520000000000002e-05, "train/epoch": 0.31, "train/global_step": 500, "_runtime": 7074, "_timestamp": 1651779342, "_step": 500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 14.0, 65.0, 316.0, 493.0, 106.0, 15.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3495769500732422, -1.285817265510559, -1.222057580947876, -1.1582978963851929, -1.0945382118225098, -1.0307785272598267, -0.9670188426971436, -0.9032591581344604, -0.8394994735717773, -0.7757397890090942, -0.7119801044464111, -0.648220419883728, -0.5844607353210449, -0.5207010507583618, -0.4569413661956787, -0.3931816816329956, -0.3294219970703125, -0.2656623125076294, -0.2019026279449463, -0.13814294338226318, -0.07438325881958008, -0.010623574256896973, 0.05313611030578613, 0.11689579486846924, 0.18065547943115234, 0.24441516399383545, 0.30817484855651855, 0.37193453311920166, 0.43569421768188477, 0.49945390224456787, 0.563213586807251, 0.6269732713699341, 0.6907331943511963, 0.7544928789138794, 0.8182525634765625, 0.8820122480392456, 0.9457719326019287, 1.0095316171646118, 1.073291301727295, 1.137050986289978, 1.2008106708526611, 1.2645703554153442, 1.3283300399780273, 1.3920897245407104, 1.4558494091033936, 1.5196090936660767, 1.5833687782287598, 1.6471284627914429, 1.710888147354126, 1.774647831916809, 1.8384075164794922, 1.9021672010421753, 1.9659268856048584, 2.029686450958252, 2.0934462547302246, 2.1572060585021973, 2.220965623855591, 2.2847251892089844, 2.348484992980957, 2.4122447967529297, 2.4760043621063232, 2.539763927459717, 2.6035237312316895, 2.667283535003662, 2.7310431003570557]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 7.0, 5.0, 4.0, 8.0, 9.0, 27.0, 30.0, 32.0, 38.0, 35.0, 44.0, 50.0, 56.0, 68.0, 69.0, 74.0, 65.0, 65.0, 53.0, 50.0, 46.0, 37.0, 40.0, 21.0, 20.0, 12.0, 14.0, 11.0, 5.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5811864137649536, -0.5565242767333984, -0.5318621397018433, -0.5072000026702881, -0.4825378954410553, -0.4578757584095001, -0.43321365118026733, -0.40855151414871216, -0.383889377117157, -0.3592272400856018, -0.33456510305404663, -0.30990299582481384, -0.28524085879325867, -0.2605787217617035, -0.2359165996313095, -0.21125447750091553, -0.18659234046936035, -0.16193020343780518, -0.1372680813074112, -0.11260595172643661, -0.08794382214546204, -0.06328169256448746, -0.03861956298351288, -0.013957440853118896, 0.01070469617843628, 0.03536682575941086, 0.06002895534038544, 0.08469108492136002, 0.1093532145023346, 0.13401535153388977, 0.15867747366428375, 0.18333959579467773, 0.2080017328262329, 0.23266386985778809, 0.25732600688934326, 0.28198811411857605, 0.3066502511501312, 0.3313123881816864, 0.3559744954109192, 0.38063663244247437, 0.40529876947402954, 0.4299609065055847, 0.4546230435371399, 0.4792851507663727, 0.5039472579956055, 0.5286093950271606, 0.5532715320587158, 0.577933669090271, 0.6025958061218262, 0.6272579431533813, 0.6519200801849365, 0.6765822172164917, 0.7012443542480469, 0.7259064316749573, 0.7505685687065125, 0.7752307057380676, 0.7998928427696228, 0.824554979801178, 0.8492171168327332, 0.8738792538642883, 0.8985413312911987, 0.9232034683227539, 0.9478656053543091, 0.9725277423858643, 0.9971898794174194]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 8.0, 3.0, 6.0, 10.0, 9.0, 12.0, 8.0, 10.0, 17.0, 39.0, 34.0, 49.0, 55.0, 79.0, 135.0, 178.0, 487.0, 1697.0, 2789.0, 5429.0, 19231.0, 145835.0, 1098518.0, 2307316.0, 546421.0, 55085.0, 7382.0, 1498.0, 710.0, 396.0, 245.0, 151.0, 101.0, 68.0, 67.0, 51.0, 35.0, 31.0, 24.0, 15.0, 5.0, 4.0, 14.0, 10.0, 5.0, 8.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.025390625, -0.991546630859375, -0.95770263671875, -0.923858642578125, -0.8900146484375, -0.856170654296875, -0.82232666015625, -0.788482666015625, -0.754638671875, -0.720794677734375, -0.68695068359375, -0.653106689453125, -0.6192626953125, -0.585418701171875, -0.55157470703125, -0.517730712890625, -0.48388671875, -0.450042724609375, -0.41619873046875, -0.382354736328125, -0.3485107421875, -0.314666748046875, -0.28082275390625, -0.246978759765625, -0.213134765625, -0.179290771484375, -0.14544677734375, -0.111602783203125, -0.0777587890625, -0.043914794921875, -0.01007080078125, 0.023773193359375, 0.0576171875, 0.091461181640625, 0.12530517578125, 0.159149169921875, 0.1929931640625, 0.226837158203125, 0.26068115234375, 0.294525146484375, 0.328369140625, 0.362213134765625, 0.39605712890625, 0.429901123046875, 0.4637451171875, 0.497589111328125, 0.53143310546875, 0.565277099609375, 0.59912109375, 0.632965087890625, 0.66680908203125, 0.700653076171875, 0.7344970703125, 0.768341064453125, 0.80218505859375, 0.836029052734375, 0.869873046875, 0.903717041015625, 0.93756103515625, 0.971405029296875, 1.0052490234375, 1.039093017578125, 1.07293701171875, 1.106781005859375, 1.140625]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 19.0, 3.0, 11.0, 25.0, 32.0, 30.0, 38.0, 41.0, 68.0, 50.0, 55.0, 72.0, 53.0, 60.0, 74.0, 70.0, 55.0, 55.0, 33.0, 21.0, 32.0, 34.0, 20.0, 11.0, 14.0, 11.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.65380859375, -0.6241073608398438, -0.5944061279296875, -0.5647048950195312, -0.535003662109375, -0.5053024291992188, -0.4756011962890625, -0.44589996337890625, -0.41619873046875, -0.38649749755859375, -0.3567962646484375, -0.32709503173828125, -0.297393798828125, -0.26769256591796875, -0.2379913330078125, -0.20829010009765625, -0.1785888671875, -0.14888763427734375, -0.1191864013671875, -0.08948516845703125, -0.059783935546875, -0.03008270263671875, -0.0003814697265625, 0.02931976318359375, 0.05902099609375, 0.08872222900390625, 0.1184234619140625, 0.14812469482421875, 0.177825927734375, 0.20752716064453125, 0.2372283935546875, 0.26692962646484375, 0.296630859375, 0.32633209228515625, 0.3560333251953125, 0.38573455810546875, 0.415435791015625, 0.44513702392578125, 0.4748382568359375, 0.5045394897460938, 0.53424072265625, 0.5639419555664062, 0.5936431884765625, 0.6233444213867188, 0.653045654296875, 0.6827468872070312, 0.7124481201171875, 0.7421493530273438, 0.7718505859375, 0.8015518188476562, 0.8312530517578125, 0.8609542846679688, 0.890655517578125, 0.9203567504882812, 0.9500579833984375, 0.9797592163085938, 1.00946044921875, 1.0391616821289062, 1.0688629150390625, 1.0985641479492188, 1.128265380859375, 1.1579666137695312, 1.1876678466796875, 1.2173690795898438, 1.2470703125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 0.0, 0.0, 5.0, 8.0, 13.0, 4.0, 19.0, 31.0, 78.0, 174.0, 1101.0, 4189799.0, 2562.0, 278.0, 83.0, 51.0, 26.0, 11.0, 11.0, 9.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.3125, -16.747314453125, -16.18212890625, -15.616943359375, -15.0517578125, -14.486572265625, -13.92138671875, -13.356201171875, -12.791015625, -12.225830078125, -11.66064453125, -11.095458984375, -10.5302734375, -9.965087890625, -9.39990234375, -8.834716796875, -8.26953125, -7.704345703125, -7.13916015625, -6.573974609375, -6.0087890625, -5.443603515625, -4.87841796875, -4.313232421875, -3.748046875, -3.182861328125, -2.61767578125, -2.052490234375, -1.4873046875, -0.922119140625, -0.35693359375, 0.208251953125, 0.7734375, 1.338623046875, 1.90380859375, 2.468994140625, 3.0341796875, 3.599365234375, 4.16455078125, 4.729736328125, 5.294921875, 5.860107421875, 6.42529296875, 6.990478515625, 7.5556640625, 8.120849609375, 8.68603515625, 9.251220703125, 9.81640625, 10.381591796875, 10.94677734375, 11.511962890625, 12.0771484375, 12.642333984375, 13.20751953125, 13.772705078125, 14.337890625, 14.903076171875, 15.46826171875, 16.033447265625, 16.5986328125, 17.163818359375, 17.72900390625, 18.294189453125, 18.859375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 6.0, 7.0, 13.0, 24.0, 45.0, 89.0, 445.0, 1807.0, 1225.0, 226.0, 68.0, 45.0, 21.0, 11.0, 12.0, 6.0, 9.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53662109375, -0.5192108154296875, -0.501800537109375, -0.4843902587890625, -0.46697998046875, -0.4495697021484375, -0.432159423828125, -0.4147491455078125, -0.3973388671875, -0.3799285888671875, -0.362518310546875, -0.3451080322265625, -0.32769775390625, -0.3102874755859375, -0.292877197265625, -0.2754669189453125, -0.258056640625, -0.2406463623046875, -0.223236083984375, -0.2058258056640625, -0.18841552734375, -0.1710052490234375, -0.153594970703125, -0.1361846923828125, -0.1187744140625, -0.1013641357421875, -0.083953857421875, -0.0665435791015625, -0.04913330078125, -0.0317230224609375, -0.014312744140625, 0.0030975341796875, 0.0205078125, 0.0379180908203125, 0.055328369140625, 0.0727386474609375, 0.09014892578125, 0.1075592041015625, 0.124969482421875, 0.1423797607421875, 0.1597900390625, 0.1772003173828125, 0.194610595703125, 0.2120208740234375, 0.22943115234375, 0.2468414306640625, 0.264251708984375, 0.2816619873046875, 0.299072265625, 0.3164825439453125, 0.333892822265625, 0.3513031005859375, 0.36871337890625, 0.3861236572265625, 0.403533935546875, 0.4209442138671875, 0.4383544921875, 0.4557647705078125, 0.473175048828125, 0.4905853271484375, 0.50799560546875, 0.5254058837890625, 0.542816162109375, 0.5602264404296875, 0.57763671875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 15.0, 18.0, 17.0, 42.0, 54.0, 126.0, 125.0, 160.0, 160.0, 95.0, 72.0, 55.0, 21.0, 18.0, 9.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9502484798431396, -0.9117231369018555, -0.8731978535652161, -0.8346725106239319, -0.7961471676826477, -0.7576218843460083, -0.7190965414047241, -0.6805711984634399, -0.6420458555221558, -0.6035205125808716, -0.5649952292442322, -0.526469886302948, -0.4879445433616638, -0.449419230222702, -0.41089391708374023, -0.37236857414245605, -0.33384329080581665, -0.29531797766685486, -0.2567926347255707, -0.2182673215866089, -0.1797419935464859, -0.14121666550636292, -0.10269135236740112, -0.06416600942611694, -0.02564069628715515, 0.012884628027677536, 0.05140995234251022, 0.08993527293205261, 0.1284606009721756, 0.16698592901229858, 0.20551124215126038, 0.24403658509254456, 0.28256189823150635, 0.32108721137046814, 0.3596125543117523, 0.3981378674507141, 0.4366632103919983, 0.4751885235309601, 0.5137138366699219, 0.552239179611206, 0.5907645225524902, 0.6292898654937744, 0.6678151488304138, 0.706340491771698, 0.7448658347129822, 0.7833911180496216, 0.8219164609909058, 0.8604418039321899, 0.8989670872688293, 0.9374924302101135, 0.9760177135467529, 1.014543056488037, 1.0530683994293213, 1.0915937423706055, 1.1301190853118896, 1.1686444282531738, 1.2071696519851685, 1.2456949949264526, 1.2842203378677368, 1.3227455615997314, 1.3612709045410156, 1.3997962474822998, 1.438321590423584, 1.4768469333648682, 1.5153722763061523]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 8.0, 9.0, 9.0, 4.0, 13.0, 21.0, 25.0, 29.0, 37.0, 30.0, 42.0, 42.0, 48.0, 50.0, 45.0, 71.0, 60.0, 61.0, 66.0, 39.0, 44.0, 47.0, 40.0, 38.0, 31.0, 30.0, 17.0, 9.0, 11.0, 10.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6284670233726501, -0.6051810383796692, -0.581895112991333, -0.558609127998352, -0.5353231430053711, -0.5120371580123901, -0.48875123262405396, -0.465465247631073, -0.44217929244041443, -0.41889333724975586, -0.3956073522567749, -0.37232139706611633, -0.34903544187545776, -0.3257494568824768, -0.30246350169181824, -0.27917754650115967, -0.2558915615081787, -0.23260559141635895, -0.20931962132453918, -0.18603366613388062, -0.16274769604206085, -0.1394617259502411, -0.11617577075958252, -0.09288980066776276, -0.069603830575943, -0.04631786420941353, -0.023031897842884064, 0.00025406479835510254, 0.023540034890174866, 0.04682600498199463, 0.0701119601726532, 0.09339793026447296, 0.11668384075164795, 0.1399698108434677, 0.16325578093528748, 0.18654173612594604, 0.2098277062177658, 0.23311367630958557, 0.25639963150024414, 0.2796856164932251, 0.30297157168388367, 0.32625752687454224, 0.3495435118675232, 0.37282946705818176, 0.39611542224884033, 0.4194014072418213, 0.44268736243247986, 0.4659733176231384, 0.4892593026161194, 0.5125452876091003, 0.5358312129974365, 0.5591171979904175, 0.5824031829833984, 0.6056891679763794, 0.6289750933647156, 0.6522610783576965, 0.6755470037460327, 0.6988329887390137, 0.7221189141273499, 0.7454048991203308, 0.7686908841133118, 0.791976809501648, 0.8152627944946289, 0.8385487794876099, 0.8618347644805908]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 7.0, 21.0, 32.0, 41.0, 63.0, 113.0, 194.0, 339.0, 648.0, 1326.0, 3263.0, 8845.0, 30277.0, 135098.0, 534028.0, 259591.0, 52414.0, 13958.0, 4616.0, 1862.0, 838.0, 383.0, 231.0, 146.0, 74.0, 44.0, 27.0, 22.0, 19.0, 9.0, 9.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.317138671875, -0.30872535705566406, -0.3003120422363281, -0.2918987274169922, -0.28348541259765625, -0.2750720977783203, -0.2666587829589844, -0.25824546813964844, -0.2498321533203125, -0.24141883850097656, -0.23300552368164062, -0.2245922088623047, -0.21617889404296875, -0.2077655792236328, -0.19935226440429688, -0.19093894958496094, -0.182525634765625, -0.17411231994628906, -0.16569900512695312, -0.1572856903076172, -0.14887237548828125, -0.1404590606689453, -0.13204574584960938, -0.12363243103027344, -0.1152191162109375, -0.10680580139160156, -0.09839248657226562, -0.08997917175292969, -0.08156585693359375, -0.07315254211425781, -0.06473922729492188, -0.05632591247558594, -0.04791259765625, -0.03949928283691406, -0.031085968017578125, -0.022672653198242188, -0.01425933837890625, -0.0058460235595703125, 0.002567291259765625, 0.010980606079101562, 0.0193939208984375, 0.027807235717773438, 0.036220550537109375, 0.04463386535644531, 0.05304718017578125, 0.06146049499511719, 0.06987380981445312, 0.07828712463378906, 0.086700439453125, 0.09511375427246094, 0.10352706909179688, 0.11194038391113281, 0.12035369873046875, 0.1287670135498047, 0.13718032836914062, 0.14559364318847656, 0.1540069580078125, 0.16242027282714844, 0.17083358764648438, 0.1792469024658203, 0.18766021728515625, 0.1960735321044922, 0.20448684692382812, 0.21290016174316406, 0.2213134765625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 7.0, 11.0, 15.0, 23.0, 20.0, 30.0, 33.0, 37.0, 47.0, 50.0, 55.0, 51.0, 55.0, 68.0, 69.0, 54.0, 76.0, 50.0, 54.0, 45.0, 34.0, 20.0, 27.0, 20.0, 17.0, 4.0, 9.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5458984375, -0.5254669189453125, -0.505035400390625, -0.4846038818359375, -0.46417236328125, -0.4437408447265625, -0.423309326171875, -0.4028778076171875, -0.3824462890625, -0.3620147705078125, -0.341583251953125, -0.3211517333984375, -0.30072021484375, -0.2802886962890625, -0.259857177734375, -0.2394256591796875, -0.218994140625, -0.1985626220703125, -0.178131103515625, -0.1576995849609375, -0.13726806640625, -0.1168365478515625, -0.096405029296875, -0.0759735107421875, -0.0555419921875, -0.0351104736328125, -0.014678955078125, 0.0057525634765625, 0.02618408203125, 0.0466156005859375, 0.067047119140625, 0.0874786376953125, 0.10791015625, 0.1283416748046875, 0.148773193359375, 0.1692047119140625, 0.18963623046875, 0.2100677490234375, 0.230499267578125, 0.2509307861328125, 0.2713623046875, 0.2917938232421875, 0.312225341796875, 0.3326568603515625, 0.35308837890625, 0.3735198974609375, 0.393951416015625, 0.4143829345703125, 0.434814453125, 0.4552459716796875, 0.475677490234375, 0.4961090087890625, 0.51654052734375, 0.5369720458984375, 0.557403564453125, 0.5778350830078125, 0.5982666015625, 0.6186981201171875, 0.639129638671875, 0.6595611572265625, 0.67999267578125, 0.7004241943359375, 0.720855712890625, 0.7412872314453125, 0.76171875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 18.0, 10.0, 16.0, 32.0, 38.0, 51.0, 78.0, 116.0, 172.0, 227.0, 324.0, 503.0, 751.0, 1104.0, 1726.0, 2659.0, 4131.0, 6599.0, 10752.0, 17692.0, 30981.0, 55518.0, 103484.0, 183751.0, 235429.0, 172390.0, 95962.0, 51000.0, 28658.0, 16902.0, 10001.0, 6015.0, 3908.0, 2504.0, 1678.0, 1037.0, 763.0, 488.0, 347.0, 222.0, 168.0, 109.0, 76.0, 48.0, 34.0, 22.0, 18.0, 14.0, 7.0, 3.0, 2.0, 4.0, 5.0, 3.0, 0.0, 2.0], "bins": [-0.08660888671875, -0.0839385986328125, -0.081268310546875, -0.0785980224609375, -0.075927734375, -0.0732574462890625, -0.070587158203125, -0.0679168701171875, -0.06524658203125, -0.0625762939453125, -0.059906005859375, -0.0572357177734375, -0.0545654296875, -0.0518951416015625, -0.049224853515625, -0.0465545654296875, -0.04388427734375, -0.0412139892578125, -0.038543701171875, -0.0358734130859375, -0.033203125, -0.0305328369140625, -0.027862548828125, -0.0251922607421875, -0.02252197265625, -0.0198516845703125, -0.017181396484375, -0.0145111083984375, -0.0118408203125, -0.0091705322265625, -0.006500244140625, -0.0038299560546875, -0.00115966796875, 0.0015106201171875, 0.004180908203125, 0.0068511962890625, 0.009521484375, 0.0121917724609375, 0.014862060546875, 0.0175323486328125, 0.02020263671875, 0.0228729248046875, 0.025543212890625, 0.0282135009765625, 0.0308837890625, 0.0335540771484375, 0.036224365234375, 0.0388946533203125, 0.04156494140625, 0.0442352294921875, 0.046905517578125, 0.0495758056640625, 0.05224609375, 0.0549163818359375, 0.057586669921875, 0.0602569580078125, 0.06292724609375, 0.0655975341796875, 0.068267822265625, 0.0709381103515625, 0.0736083984375, 0.0762786865234375, 0.078948974609375, 0.0816192626953125, 0.08428955078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 1.0, 1.0, 10.0, 8.0, 5.0, 8.0, 17.0, 17.0, 19.0, 20.0, 21.0, 23.0, 41.0, 40.0, 42.0, 51.0, 48.0, 37.0, 39.0, 35.0, 53.0, 51.0, 54.0, 55.0, 35.0, 42.0, 35.0, 32.0, 27.0, 33.0, 22.0, 19.0, 15.0, 14.0, 5.0, 7.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.94287109375, -0.9125137329101562, -0.8821563720703125, -0.8517990112304688, -0.821441650390625, -0.7910842895507812, -0.7607269287109375, -0.7303695678710938, -0.70001220703125, -0.6696548461914062, -0.6392974853515625, -0.6089401245117188, -0.578582763671875, -0.5482254028320312, -0.5178680419921875, -0.48751068115234375, -0.4571533203125, -0.42679595947265625, -0.3964385986328125, -0.36608123779296875, -0.335723876953125, -0.30536651611328125, -0.2750091552734375, -0.24465179443359375, -0.21429443359375, -0.18393707275390625, -0.1535797119140625, -0.12322235107421875, -0.092864990234375, -0.06250762939453125, -0.0321502685546875, -0.00179290771484375, 0.028564453125, 0.05892181396484375, 0.0892791748046875, 0.11963653564453125, 0.149993896484375, 0.18035125732421875, 0.2107086181640625, 0.24106597900390625, 0.27142333984375, 0.30178070068359375, 0.3321380615234375, 0.36249542236328125, 0.392852783203125, 0.42321014404296875, 0.4535675048828125, 0.48392486572265625, 0.5142822265625, 0.5446395874023438, 0.5749969482421875, 0.6053543090820312, 0.635711669921875, 0.6660690307617188, 0.6964263916015625, 0.7267837524414062, 0.75714111328125, 0.7874984741210938, 0.8178558349609375, 0.8482131958007812, 0.878570556640625, 0.9089279174804688, 0.9392852783203125, 0.9696426391601562, 1.0]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 10.0, 6.0, 15.0, 19.0, 14.0, 45.0, 54.0, 77.0, 102.0, 171.0, 269.0, 442.0, 668.0, 1066.0, 1776.0, 2969.0, 5151.0, 9712.0, 18705.0, 38328.0, 81622.0, 165692.0, 254566.0, 223397.0, 124287.0, 59251.0, 28302.0, 14012.0, 7433.0, 4103.0, 2370.0, 1429.0, 858.0, 567.0, 350.0, 226.0, 147.0, 90.0, 76.0, 53.0, 30.0, 23.0, 18.0, 16.0, 9.0, 7.0, 7.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.007076263427734375, -0.006853640079498291, -0.006631016731262207, -0.006408393383026123, -0.006185770034790039, -0.005963146686553955, -0.005740523338317871, -0.005517899990081787, -0.005295276641845703, -0.005072653293609619, -0.004850029945373535, -0.004627406597137451, -0.004404783248901367, -0.004182159900665283, -0.003959536552429199, -0.0037369132041931152, -0.0035142898559570312, -0.0032916665077209473, -0.0030690431594848633, -0.0028464198112487793, -0.0026237964630126953, -0.0024011731147766113, -0.0021785497665405273, -0.0019559264183044434, -0.0017333030700683594, -0.0015106797218322754, -0.0012880563735961914, -0.0010654330253601074, -0.0008428096771240234, -0.0006201863288879395, -0.00039756298065185547, -0.00017493963241577148, 4.76837158203125e-05, 0.0002703070640563965, 0.0004929304122924805, 0.0007155537605285645, 0.0009381771087646484, 0.0011608004570007324, 0.0013834238052368164, 0.0016060471534729004, 0.0018286705017089844, 0.0020512938499450684, 0.0022739171981811523, 0.0024965405464172363, 0.0027191638946533203, 0.0029417872428894043, 0.0031644105911254883, 0.0033870339393615723, 0.0036096572875976562, 0.0038322806358337402, 0.004054903984069824, 0.004277527332305908, 0.004500150680541992, 0.004722774028778076, 0.00494539737701416, 0.005168020725250244, 0.005390644073486328, 0.005613267421722412, 0.005835890769958496, 0.00605851411819458, 0.006281137466430664, 0.006503760814666748, 0.006726384162902832, 0.006949007511138916, 0.007171630859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 10.0, 16.0, 13.0, 21.0, 22.0, 35.0, 47.0, 60.0, 82.0, 95.0, 103.0, 82.0, 86.0, 67.0, 60.0, 34.0, 38.0, 32.0, 22.0, 12.0, 11.0, 15.0, 6.0, 1.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.47955322265625e-05, -2.410542219877243e-05, -2.341531217098236e-05, -2.272520214319229e-05, -2.203509211540222e-05, -2.1344982087612152e-05, -2.0654872059822083e-05, -1.9964762032032013e-05, -1.9274652004241943e-05, -1.8584541976451874e-05, -1.7894431948661804e-05, -1.7204321920871735e-05, -1.6514211893081665e-05, -1.5824101865291595e-05, -1.5133991837501526e-05, -1.4443881809711456e-05, -1.3753771781921387e-05, -1.3063661754131317e-05, -1.2373551726341248e-05, -1.1683441698551178e-05, -1.0993331670761108e-05, -1.0303221642971039e-05, -9.61311161518097e-06, -8.9230015873909e-06, -8.23289155960083e-06, -7.5427815318107605e-06, -6.852671504020691e-06, -6.162561476230621e-06, -5.472451448440552e-06, -4.782341420650482e-06, -4.092231392860413e-06, -3.402121365070343e-06, -2.7120113372802734e-06, -2.021901309490204e-06, -1.3317912817001343e-06, -6.416812539100647e-07, 4.842877388000488e-08, 7.385388016700745e-07, 1.428648829460144e-06, 2.1187588572502136e-06, 2.808868885040283e-06, 3.4989789128303528e-06, 4.189088940620422e-06, 4.879198968410492e-06, 5.5693089962005615e-06, 6.259419023990631e-06, 6.949529051780701e-06, 7.63963907957077e-06, 8.32974910736084e-06, 9.01985913515091e-06, 9.709969162940979e-06, 1.0400079190731049e-05, 1.1090189218521118e-05, 1.1780299246311188e-05, 1.2470409274101257e-05, 1.3160519301891327e-05, 1.3850629329681396e-05, 1.4540739357471466e-05, 1.5230849385261536e-05, 1.5920959413051605e-05, 1.6611069440841675e-05, 1.7301179468631744e-05, 1.7991289496421814e-05, 1.8681399524211884e-05, 1.9371509552001953e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 7.0, 9.0, 4.0, 12.0, 8.0, 9.0, 13.0, 22.0, 25.0, 17.0, 25.0, 33.0, 37.0, 44.0, 58.0, 64.0, 84.0, 91.0, 131.0, 236.0, 725.0, 7133.0, 265056.0, 743605.0, 28565.0, 1439.0, 311.0, 162.0, 98.0, 84.0, 58.0, 52.0, 39.0, 47.0, 43.0, 48.0, 34.0, 41.0, 18.0, 11.0, 18.0, 13.0, 11.0, 4.0, 1.0, 8.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.021728515625, -0.020929813385009766, -0.02013111114501953, -0.019332408905029297, -0.018533706665039062, -0.017735004425048828, -0.016936302185058594, -0.01613759994506836, -0.015338897705078125, -0.01454019546508789, -0.013741493225097656, -0.012942790985107422, -0.012144088745117188, -0.011345386505126953, -0.010546684265136719, -0.009747982025146484, -0.00894927978515625, -0.008150577545166016, -0.007351875305175781, -0.006553173065185547, -0.0057544708251953125, -0.004955768585205078, -0.004157066345214844, -0.0033583641052246094, -0.002559661865234375, -0.0017609596252441406, -0.0009622573852539062, -0.00016355514526367188, 0.0006351470947265625, 0.0014338493347167969, 0.0022325515747070312, 0.0030312538146972656, 0.0038299560546875, 0.004628658294677734, 0.005427360534667969, 0.006226062774658203, 0.0070247650146484375, 0.007823467254638672, 0.008622169494628906, 0.00942087173461914, 0.010219573974609375, 0.01101827621459961, 0.011816978454589844, 0.012615680694580078, 0.013414382934570312, 0.014213085174560547, 0.015011787414550781, 0.015810489654541016, 0.01660919189453125, 0.017407894134521484, 0.01820659637451172, 0.019005298614501953, 0.019804000854492188, 0.020602703094482422, 0.021401405334472656, 0.02220010757446289, 0.022998809814453125, 0.02379751205444336, 0.024596214294433594, 0.025394916534423828, 0.026193618774414062, 0.026992321014404297, 0.02779102325439453, 0.028589725494384766, 0.029388427734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 6.0, 6.0, 4.0, 7.0, 11.0, 10.0, 7.0, 10.0, 13.0, 16.0, 27.0, 29.0, 25.0, 36.0, 43.0, 34.0, 36.0, 42.0, 41.0, 47.0, 35.0, 41.0, 46.0, 41.0, 58.0, 40.0, 31.0, 31.0, 29.0, 24.0, 18.0, 25.0, 14.0, 20.0, 25.0, 19.0, 16.0, 7.0, 5.0, 10.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002010345458984375, -0.001935720443725586, -0.0018610954284667969, -0.0017864704132080078, -0.0017118453979492188, -0.0016372203826904297, -0.0015625953674316406, -0.0014879703521728516, -0.0014133453369140625, -0.0013387203216552734, -0.0012640953063964844, -0.0011894702911376953, -0.0011148452758789062, -0.0010402202606201172, -0.0009655952453613281, -0.0008909702301025391, -0.00081634521484375, -0.0007417201995849609, -0.0006670951843261719, -0.0005924701690673828, -0.0005178451538085938, -0.0004432201385498047, -0.0003685951232910156, -0.00029397010803222656, -0.0002193450927734375, -0.00014472007751464844, -7.009506225585938e-05, 4.5299530029296875e-06, 7.915496826171875e-05, 0.0001537799835205078, 0.00022840499877929688, 0.00030303001403808594, 0.000377655029296875, 0.00045228004455566406, 0.0005269050598144531, 0.0006015300750732422, 0.0006761550903320312, 0.0007507801055908203, 0.0008254051208496094, 0.0009000301361083984, 0.0009746551513671875, 0.0010492801666259766, 0.0011239051818847656, 0.0011985301971435547, 0.0012731552124023438, 0.0013477802276611328, 0.0014224052429199219, 0.001497030258178711, 0.0015716552734375, 0.001646280288696289, 0.0017209053039550781, 0.0017955303192138672, 0.0018701553344726562, 0.0019447803497314453, 0.0020194053649902344, 0.0020940303802490234, 0.0021686553955078125, 0.0022432804107666016, 0.0023179054260253906, 0.0023925304412841797, 0.0024671554565429688, 0.002541780471801758, 0.002616405487060547, 0.002691030502319336, 0.002765655517578125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 15.0, 49.0, 87.0, 307.0, 330.0, 140.0, 49.0, 14.0, 9.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0766605138778687, -1.0138804912567139, -0.9511003494262695, -0.88832026720047, -0.8255401849746704, -0.7627601027488708, -0.6999800205230713, -0.6371999382972717, -0.5744198560714722, -0.5116397738456726, -0.44885969161987305, -0.3860796093940735, -0.3232995271682739, -0.26051944494247437, -0.1977393627166748, -0.13495928049087524, -0.07217919826507568, -0.009399116039276123, 0.05338096618652344, 0.116161048412323, 0.17894113063812256, 0.24172121286392212, 0.3045012950897217, 0.36728137731552124, 0.4300614595413208, 0.49284154176712036, 0.5556216239929199, 0.6184017062187195, 0.681181788444519, 0.7439618706703186, 0.8067419528961182, 0.8695220351219177, 0.9323019981384277, 0.9950820803642273, 1.0578621625900269, 1.1206421852111816, 1.183422327041626, 1.2462024688720703, 1.308982491493225, 1.3717625141143799, 1.4345426559448242, 1.4973227977752686, 1.5601028203964233, 1.6228828430175781, 1.6856629848480225, 1.7484431266784668, 1.8112231492996216, 1.8740031719207764, 1.9367833137512207, 1.999563455581665, 2.0623435974121094, 2.1251235008239746, 2.187903642654419, 2.2506837844848633, 2.3134636878967285, 2.376243829727173, 2.439023971557617, 2.5018041133880615, 2.564584255218506, 2.627364158630371, 2.6901443004608154, 2.7529244422912598, 2.815704345703125, 2.8784844875335693, 2.9412646293640137]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 8.0, 10.0, 13.0, 27.0, 34.0, 36.0, 32.0, 30.0, 60.0, 62.0, 48.0, 62.0, 71.0, 76.0, 71.0, 48.0, 60.0, 44.0, 46.0, 35.0, 35.0, 28.0, 18.0, 7.0, 7.0, 10.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5167196989059448, -0.49668681621551514, -0.47665393352508545, -0.4566210210323334, -0.4365881383419037, -0.416555255651474, -0.3965223431587219, -0.37648946046829224, -0.35645657777786255, -0.33642369508743286, -0.3163908123970032, -0.2963578999042511, -0.2763250172138214, -0.2562921345233917, -0.23625923693180084, -0.21622633934020996, -0.19619345664978027, -0.17616057395935059, -0.1561276763677597, -0.13609477877616882, -0.11606189608573914, -0.09602900594472885, -0.07599611580371857, -0.055963218212127686, -0.035930335521698, -0.015897445380687714, 0.004135444760322571, 0.024168334901332855, 0.04420122504234314, 0.06423411518335342, 0.08426700532436371, 0.10429990291595459, 0.12433284521102905, 0.14436572790145874, 0.16439862549304962, 0.1844315230846405, 0.2044644057750702, 0.22449728846549988, 0.24453018605709076, 0.26456308364868164, 0.28459596633911133, 0.304628849029541, 0.3246617317199707, 0.3446946442127228, 0.36472752690315247, 0.38476040959358215, 0.40479332208633423, 0.4248262047767639, 0.4448590874671936, 0.4648919701576233, 0.484924852848053, 0.5049577355384827, 0.5249906778335571, 0.5450235605239868, 0.5650564432144165, 0.5850893259048462, 0.6051222085952759, 0.6251550912857056, 0.6451879739761353, 0.6652208566665649, 0.6852537393569946, 0.7052866816520691, 0.7253195643424988, 0.7453524470329285, 0.7653853297233582]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 6.0, 8.0, 9.0, 11.0, 7.0, 12.0, 30.0, 37.0, 41.0, 51.0, 70.0, 106.0, 130.0, 217.0, 286.0, 445.0, 632.0, 928.0, 1566.0, 2436.0, 4101.0, 7223.0, 13351.0, 26951.0, 58750.0, 139844.0, 286137.0, 268768.0, 127638.0, 54310.0, 24929.0, 12350.0, 6687.0, 3833.0, 2285.0, 1388.0, 921.0, 604.0, 429.0, 277.0, 197.0, 158.0, 109.0, 67.0, 67.0, 49.0, 32.0, 15.0, 18.0, 12.0, 13.0, 2.0, 9.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.313232421875, -0.30277252197265625, -0.2923126220703125, -0.28185272216796875, -0.271392822265625, -0.26093292236328125, -0.2504730224609375, -0.24001312255859375, -0.22955322265625, -0.21909332275390625, -0.2086334228515625, -0.19817352294921875, -0.187713623046875, -0.17725372314453125, -0.1667938232421875, -0.15633392333984375, -0.1458740234375, -0.13541412353515625, -0.1249542236328125, -0.11449432373046875, -0.104034423828125, -0.09357452392578125, -0.0831146240234375, -0.07265472412109375, -0.06219482421875, -0.05173492431640625, -0.0412750244140625, -0.03081512451171875, -0.020355224609375, -0.00989532470703125, 0.0005645751953125, 0.01102447509765625, 0.021484375, 0.03194427490234375, 0.0424041748046875, 0.05286407470703125, 0.063323974609375, 0.07378387451171875, 0.0842437744140625, 0.09470367431640625, 0.10516357421875, 0.11562347412109375, 0.1260833740234375, 0.13654327392578125, 0.147003173828125, 0.15746307373046875, 0.1679229736328125, 0.17838287353515625, 0.1888427734375, 0.19930267333984375, 0.2097625732421875, 0.22022247314453125, 0.230682373046875, 0.24114227294921875, 0.2516021728515625, 0.26206207275390625, 0.27252197265625, 0.28298187255859375, 0.2934417724609375, 0.30390167236328125, 0.314361572265625, 0.32482147216796875, 0.3352813720703125, 0.34574127197265625, 0.356201171875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 4.0, 6.0, 6.0, 6.0, 9.0, 9.0, 12.0, 9.0, 9.0, 17.0, 15.0, 17.0, 19.0, 20.0, 36.0, 29.0, 26.0, 28.0, 36.0, 32.0, 32.0, 37.0, 37.0, 39.0, 46.0, 30.0, 41.0, 31.0, 29.0, 28.0, 33.0, 29.0, 28.0, 21.0, 16.0, 24.0, 24.0, 19.0, 12.0, 14.0, 14.0, 11.0, 11.0, 11.0, 9.0, 4.0, 5.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-6.4765625, -6.27984619140625, -6.0831298828125, -5.88641357421875, -5.689697265625, -5.49298095703125, -5.2962646484375, -5.09954833984375, -4.90283203125, -4.70611572265625, -4.5093994140625, -4.31268310546875, -4.115966796875, -3.91925048828125, -3.7225341796875, -3.52581787109375, -3.3291015625, -3.13238525390625, -2.9356689453125, -2.73895263671875, -2.542236328125, -2.34552001953125, -2.1488037109375, -1.95208740234375, -1.75537109375, -1.55865478515625, -1.3619384765625, -1.16522216796875, -0.968505859375, -0.77178955078125, -0.5750732421875, -0.37835693359375, -0.181640625, 0.01507568359375, 0.2117919921875, 0.40850830078125, 0.605224609375, 0.80194091796875, 0.9986572265625, 1.19537353515625, 1.39208984375, 1.58880615234375, 1.7855224609375, 1.98223876953125, 2.178955078125, 2.37567138671875, 2.5723876953125, 2.76910400390625, 2.9658203125, 3.16253662109375, 3.3592529296875, 3.55596923828125, 3.752685546875, 3.94940185546875, 4.1461181640625, 4.34283447265625, 4.53955078125, 4.73626708984375, 4.9329833984375, 5.12969970703125, 5.326416015625, 5.52313232421875, 5.7198486328125, 5.91656494140625, 6.11328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 11.0, 17.0, 11.0, 18.0, 26.0, 41.0, 50.0, 72.0, 80.0, 114.0, 175.0, 248.0, 392.0, 713.0, 2714.0, 889534.0, 151112.0, 1446.0, 586.0, 342.0, 222.0, 141.0, 109.0, 78.0, 56.0, 49.0, 42.0, 29.0, 22.0, 20.0, 22.0, 12.0, 6.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.11328125, -3.015533447265625, -2.91778564453125, -2.820037841796875, -2.7222900390625, -2.624542236328125, -2.52679443359375, -2.429046630859375, -2.331298828125, -2.233551025390625, -2.13580322265625, -2.038055419921875, -1.9403076171875, -1.842559814453125, -1.74481201171875, -1.647064208984375, -1.54931640625, -1.451568603515625, -1.35382080078125, -1.256072998046875, -1.1583251953125, -1.060577392578125, -0.96282958984375, -0.865081787109375, -0.767333984375, -0.669586181640625, -0.57183837890625, -0.474090576171875, -0.3763427734375, -0.278594970703125, -0.18084716796875, -0.083099365234375, 0.0146484375, 0.112396240234375, 0.21014404296875, 0.307891845703125, 0.4056396484375, 0.503387451171875, 0.60113525390625, 0.698883056640625, 0.796630859375, 0.894378662109375, 0.99212646484375, 1.089874267578125, 1.1876220703125, 1.285369873046875, 1.38311767578125, 1.480865478515625, 1.57861328125, 1.676361083984375, 1.77410888671875, 1.871856689453125, 1.9696044921875, 2.067352294921875, 2.16510009765625, 2.262847900390625, 2.360595703125, 2.458343505859375, 2.55609130859375, 2.653839111328125, 2.7515869140625, 2.849334716796875, 2.94708251953125, 3.044830322265625, 3.142578125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 9.0, 11.0, 7.0, 11.0, 13.0, 27.0, 27.0, 32.0, 38.0, 39.0, 35.0, 48.0, 42.0, 63.0, 43.0, 50.0, 47.0, 59.0, 49.0, 54.0, 39.0, 34.0, 30.0, 36.0, 15.0, 26.0, 17.0, 17.0, 14.0, 15.0, 14.0, 9.0, 4.0, 4.0, 7.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.390625, -8.1263427734375, -7.862060546875, -7.5977783203125, -7.33349609375, -7.0692138671875, -6.804931640625, -6.5406494140625, -6.2763671875, -6.0120849609375, -5.747802734375, -5.4835205078125, -5.21923828125, -4.9549560546875, -4.690673828125, -4.4263916015625, -4.162109375, -3.8978271484375, -3.633544921875, -3.3692626953125, -3.10498046875, -2.8406982421875, -2.576416015625, -2.3121337890625, -2.0478515625, -1.7835693359375, -1.519287109375, -1.2550048828125, -0.99072265625, -0.7264404296875, -0.462158203125, -0.1978759765625, 0.06640625, 0.3306884765625, 0.594970703125, 0.8592529296875, 1.12353515625, 1.3878173828125, 1.652099609375, 1.9163818359375, 2.1806640625, 2.4449462890625, 2.709228515625, 2.9735107421875, 3.23779296875, 3.5020751953125, 3.766357421875, 4.0306396484375, 4.294921875, 4.5592041015625, 4.823486328125, 5.0877685546875, 5.35205078125, 5.6163330078125, 5.880615234375, 6.1448974609375, 6.4091796875, 6.6734619140625, 6.937744140625, 7.2020263671875, 7.46630859375, 7.7305908203125, 7.994873046875, 8.2591552734375, 8.5234375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 6.0, 5.0, 17.0, 12.0, 25.0, 58.0, 177.0, 1112.0, 66895.0, 978082.0, 1762.0, 247.0, 59.0, 31.0, 17.0, 8.0, 8.0, 4.0, 8.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5458984375, -0.5307731628417969, -0.5156478881835938, -0.5005226135253906, -0.4853973388671875, -0.4702720642089844, -0.45514678955078125, -0.4400215148925781, -0.424896240234375, -0.4097709655761719, -0.39464569091796875, -0.3795204162597656, -0.3643951416015625, -0.3492698669433594, -0.33414459228515625, -0.3190193176269531, -0.30389404296875, -0.2887687683105469, -0.27364349365234375, -0.2585182189941406, -0.2433929443359375, -0.22826766967773438, -0.21314239501953125, -0.19801712036132812, -0.182891845703125, -0.16776657104492188, -0.15264129638671875, -0.13751602172851562, -0.1223907470703125, -0.10726547241210938, -0.09214019775390625, -0.07701492309570312, -0.0618896484375, -0.046764373779296875, -0.03163909912109375, -0.016513824462890625, -0.0013885498046875, 0.013736724853515625, 0.02886199951171875, 0.043987274169921875, 0.059112548828125, 0.07423782348632812, 0.08936309814453125, 0.10448837280273438, 0.1196136474609375, 0.13473892211914062, 0.14986419677734375, 0.16498947143554688, 0.18011474609375, 0.19524002075195312, 0.21036529541015625, 0.22549057006835938, 0.2406158447265625, 0.2557411193847656, 0.27086639404296875, 0.2859916687011719, 0.301116943359375, 0.3162422180175781, 0.33136749267578125, 0.3464927673339844, 0.3616180419921875, 0.3767433166503906, 0.39186859130859375, 0.4069938659667969, 0.422119140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 3.0, 15.0, 51.0, 92.0, 356.0, 309.0, 88.0, 42.0, 25.0, 12.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.208087921142578e-05, -4.125572741031647e-05, -4.043057560920715e-05, -3.960542380809784e-05, -3.8780272006988525e-05, -3.795512020587921e-05, -3.71299684047699e-05, -3.6304816603660583e-05, -3.547966480255127e-05, -3.4654513001441956e-05, -3.382936120033264e-05, -3.300420939922333e-05, -3.2179057598114014e-05, -3.13539057970047e-05, -3.0528753995895386e-05, -2.9703602194786072e-05, -2.8878450393676758e-05, -2.8053298592567444e-05, -2.722814679145813e-05, -2.6402994990348816e-05, -2.5577843189239502e-05, -2.4752691388130188e-05, -2.3927539587020874e-05, -2.310238778591156e-05, -2.2277235984802246e-05, -2.1452084183692932e-05, -2.0626932382583618e-05, -1.9801780581474304e-05, -1.897662878036499e-05, -1.8151476979255676e-05, -1.7326325178146362e-05, -1.650117337703705e-05, -1.5676021575927734e-05, -1.485086977481842e-05, -1.4025717973709106e-05, -1.3200566172599792e-05, -1.2375414371490479e-05, -1.1550262570381165e-05, -1.072511076927185e-05, -9.899958968162537e-06, -9.074807167053223e-06, -8.249655365943909e-06, -7.424503564834595e-06, -6.599351763725281e-06, -5.774199962615967e-06, -4.949048161506653e-06, -4.123896360397339e-06, -3.298744559288025e-06, -2.473592758178711e-06, -1.648440957069397e-06, -8.23289155960083e-07, 1.862645149230957e-09, 8.270144462585449e-07, 1.6521662473678589e-06, 2.477318048477173e-06, 3.302469849586487e-06, 4.127621650695801e-06, 4.952773451805115e-06, 5.777925252914429e-06, 6.603077054023743e-06, 7.428228855133057e-06, 8.25338065624237e-06, 9.078532457351685e-06, 9.903684258460999e-06, 1.0728836059570312e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 12.0, 8.0, 35.0, 75.0, 377.0, 2858.0, 1023427.0, 20580.0, 918.0, 153.0, 40.0, 27.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45068359375, -0.436492919921875, -0.42230224609375, -0.408111572265625, -0.3939208984375, -0.379730224609375, -0.36553955078125, -0.351348876953125, -0.337158203125, -0.322967529296875, -0.30877685546875, -0.294586181640625, -0.2803955078125, -0.266204833984375, -0.25201416015625, -0.237823486328125, -0.2236328125, -0.209442138671875, -0.19525146484375, -0.181060791015625, -0.1668701171875, -0.152679443359375, -0.13848876953125, -0.124298095703125, -0.110107421875, -0.095916748046875, -0.08172607421875, -0.067535400390625, -0.0533447265625, -0.039154052734375, -0.02496337890625, -0.010772705078125, 0.00341796875, 0.017608642578125, 0.03179931640625, 0.045989990234375, 0.0601806640625, 0.074371337890625, 0.08856201171875, 0.102752685546875, 0.116943359375, 0.131134033203125, 0.14532470703125, 0.159515380859375, 0.1737060546875, 0.187896728515625, 0.20208740234375, 0.216278076171875, 0.23046875, 0.244659423828125, 0.25885009765625, 0.273040771484375, 0.2872314453125, 0.301422119140625, 0.31561279296875, 0.329803466796875, 0.343994140625, 0.358184814453125, 0.37237548828125, 0.386566162109375, 0.4007568359375, 0.414947509765625, 0.42913818359375, 0.443328857421875, 0.45751953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 9.0, 8.0, 10.0, 30.0, 62.0, 156.0, 461.0, 152.0, 60.0, 12.0, 11.0, 13.0, 6.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061859130859375, -0.059893131256103516, -0.05792713165283203, -0.05596113204956055, -0.05399513244628906, -0.05202913284301758, -0.050063133239746094, -0.04809713363647461, -0.046131134033203125, -0.04416513442993164, -0.042199134826660156, -0.04023313522338867, -0.03826713562011719, -0.0363011360168457, -0.03433513641357422, -0.032369136810302734, -0.03040313720703125, -0.028437137603759766, -0.02647113800048828, -0.024505138397216797, -0.022539138793945312, -0.020573139190673828, -0.018607139587402344, -0.01664113998413086, -0.014675140380859375, -0.01270914077758789, -0.010743141174316406, -0.008777141571044922, -0.0068111419677734375, -0.004845142364501953, -0.0028791427612304688, -0.0009131431579589844, 0.0010528564453125, 0.0030188560485839844, 0.004984855651855469, 0.006950855255126953, 0.008916854858398438, 0.010882854461669922, 0.012848854064941406, 0.01481485366821289, 0.016780853271484375, 0.01874685287475586, 0.020712852478027344, 0.022678852081298828, 0.024644851684570312, 0.026610851287841797, 0.02857685089111328, 0.030542850494384766, 0.03250885009765625, 0.034474849700927734, 0.03644084930419922, 0.0384068489074707, 0.04037284851074219, 0.04233884811401367, 0.044304847717285156, 0.04627084732055664, 0.048236846923828125, 0.05020284652709961, 0.052168846130371094, 0.05413484573364258, 0.05610084533691406, 0.05806684494018555, 0.06003284454345703, 0.061998844146728516, 0.06396484375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 12.0, 61.0, 184.0, 399.0, 268.0, 69.0, 17.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6388486623764038, -1.485108733177185, -1.3313688039779663, -1.1776288747787476, -1.0238889455795288, -0.8701490163803101, -0.7164090871810913, -0.5626691579818726, -0.4089292287826538, -0.25518929958343506, -0.10144937038421631, 0.05229055881500244, 0.2060304880142212, 0.35977041721343994, 0.5135103464126587, 0.6672502756118774, 0.8209902048110962, 0.9747301340103149, 1.1284700632095337, 1.2822099924087524, 1.4359499216079712, 1.58968985080719, 1.7434297800064087, 1.8971697092056274, 2.0509095191955566, 2.2046494483947754, 2.358389377593994, 2.512129306793213, 2.6658692359924316, 2.8196091651916504, 2.973349094390869, 3.127089023590088, 3.280829429626465, 3.4345693588256836, 3.5883092880249023, 3.742049217224121, 3.89578914642334, 4.049529075622559, 4.203269004821777, 4.357008934020996, 4.510748863220215, 4.664488792419434, 4.818228721618652, 4.971968650817871, 5.12570858001709, 5.279448509216309, 5.433188438415527, 5.586928367614746, 5.740668296813965, 5.894408226013184, 6.048148155212402, 6.201888084411621, 6.35562801361084, 6.509367942810059, 6.663107872009277, 6.816847801208496, 6.970587730407715, 7.124327659606934, 7.278067588806152, 7.431807518005371, 7.58554744720459, 7.739287376403809, 7.893027305603027, 8.046767234802246, 8.200507164001465]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 1.0, 5.0, 9.0, 3.0, 4.0, 2.0, 11.0, 14.0, 9.0, 16.0, 10.0, 19.0, 20.0, 21.0, 32.0, 26.0, 33.0, 25.0, 42.0, 29.0, 25.0, 37.0, 35.0, 47.0, 42.0, 31.0, 47.0, 31.0, 45.0, 32.0, 31.0, 21.0, 25.0, 18.0, 21.0, 30.0, 27.0, 17.0, 21.0, 17.0, 13.0, 8.0, 9.0, 10.0, 9.0, 8.0, 2.0, 5.0, 6.0, 1.0, 4.0, 0.0, 1.0, 3.0], "bins": [-11.181366920471191, -10.854825019836426, -10.528284072875977, -10.201742172241211, -9.875201225280762, -9.548659324645996, -9.222118377685547, -8.895576477050781, -8.569034576416016, -8.24249267578125, -7.915951728820801, -7.589410305023193, -7.262868881225586, -6.93632698059082, -6.609785556793213, -6.2832441329956055, -5.956703186035156, -5.630161762237549, -5.303620338439941, -4.977078914642334, -4.650537490844727, -4.323995590209961, -3.9974541664123535, -3.670912742614746, -3.3443713188171387, -3.0178298950195312, -2.691288471221924, -2.3647468090057373, -2.03820538520813, -1.7116639614105225, -1.3851224184036255, -1.0585808753967285, -0.7320394515991211, -0.4054979681968689, -0.0789564847946167, 0.2475849986076355, 0.5741264820098877, 0.9006679058074951, 1.227209448814392, 1.553750991821289, 1.8802924156188965, 2.206833839416504, 2.5333752632141113, 2.859916925430298, 3.1864583492279053, 3.5129997730255127, 3.839541435241699, 4.166082859039307, 4.492624282836914, 4.8191657066345215, 5.145707130432129, 5.472248554229736, 5.798789978027344, 6.125331878662109, 6.451873302459717, 6.778414726257324, 7.104956150054932, 7.431497573852539, 7.7580389976501465, 8.084580421447754, 8.41112232208252, 8.737663269042969, 9.064205169677734, 9.3907470703125, 9.71728801727295]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 4.0, 3.0, 11.0, 12.0, 20.0, 10.0, 11.0, 24.0, 23.0, 28.0, 28.0, 32.0, 32.0, 39.0, 67.0, 79.0, 301.0, 3007.0, 660412.0, 3521931.0, 7157.0, 543.0, 121.0, 70.0, 34.0, 41.0, 31.0, 29.0, 25.0, 17.0, 23.0, 21.0, 15.0, 11.0, 17.0, 7.0, 8.0, 4.0, 6.0, 7.0, 1.0, 7.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.40234375, -3.299652099609375, -3.19696044921875, -3.094268798828125, -2.9915771484375, -2.888885498046875, -2.78619384765625, -2.683502197265625, -2.580810546875, -2.478118896484375, -2.37542724609375, -2.272735595703125, -2.1700439453125, -2.067352294921875, -1.96466064453125, -1.861968994140625, -1.75927734375, -1.656585693359375, -1.55389404296875, -1.451202392578125, -1.3485107421875, -1.245819091796875, -1.14312744140625, -1.040435791015625, -0.937744140625, -0.835052490234375, -0.73236083984375, -0.629669189453125, -0.5269775390625, -0.424285888671875, -0.32159423828125, -0.218902587890625, -0.1162109375, -0.013519287109375, 0.08917236328125, 0.191864013671875, 0.2945556640625, 0.397247314453125, 0.49993896484375, 0.602630615234375, 0.705322265625, 0.808013916015625, 0.91070556640625, 1.013397216796875, 1.1160888671875, 1.218780517578125, 1.32147216796875, 1.424163818359375, 1.52685546875, 1.629547119140625, 1.73223876953125, 1.834930419921875, 1.9376220703125, 2.040313720703125, 2.14300537109375, 2.245697021484375, 2.348388671875, 2.451080322265625, 2.55377197265625, 2.656463623046875, 2.7591552734375, 2.861846923828125, 2.96453857421875, 3.067230224609375, 3.169921875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 3.0, 6.0, 8.0, 5.0, 6.0, 12.0, 16.0, 13.0, 18.0, 26.0, 34.0, 45.0, 43.0, 46.0, 54.0, 54.0, 42.0, 73.0, 56.0, 60.0, 43.0, 51.0, 41.0, 43.0, 45.0, 47.0, 16.0, 22.0, 17.0, 14.0, 12.0, 7.0, 8.0, 7.0, 6.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6689453125, -0.64215087890625, -0.6153564453125, -0.58856201171875, -0.561767578125, -0.53497314453125, -0.5081787109375, -0.48138427734375, -0.45458984375, -0.42779541015625, -0.4010009765625, -0.37420654296875, -0.347412109375, -0.32061767578125, -0.2938232421875, -0.26702880859375, -0.240234375, -0.21343994140625, -0.1866455078125, -0.15985107421875, -0.133056640625, -0.10626220703125, -0.0794677734375, -0.05267333984375, -0.02587890625, 0.00091552734375, 0.0277099609375, 0.05450439453125, 0.081298828125, 0.10809326171875, 0.1348876953125, 0.16168212890625, 0.1884765625, 0.21527099609375, 0.2420654296875, 0.26885986328125, 0.295654296875, 0.32244873046875, 0.3492431640625, 0.37603759765625, 0.40283203125, 0.42962646484375, 0.4564208984375, 0.48321533203125, 0.510009765625, 0.53680419921875, 0.5635986328125, 0.59039306640625, 0.6171875, 0.64398193359375, 0.6707763671875, 0.69757080078125, 0.724365234375, 0.75115966796875, 0.7779541015625, 0.80474853515625, 0.83154296875, 0.85833740234375, 0.8851318359375, 0.91192626953125, 0.938720703125, 0.96551513671875, 0.9923095703125, 1.01910400390625, 1.0458984375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 6.0, 5.0, 3.0, 7.0, 10.0, 15.0, 57.0, 244.0, 4193605.0, 211.0, 52.0, 21.0, 14.0, 9.0, 8.0, 9.0, 4.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-88.5, -86.63623046875, -84.7724609375, -82.90869140625, -81.044921875, -79.18115234375, -77.3173828125, -75.45361328125, -73.58984375, -71.72607421875, -69.8623046875, -67.99853515625, -66.134765625, -64.27099609375, -62.4072265625, -60.54345703125, -58.6796875, -56.81591796875, -54.9521484375, -53.08837890625, -51.224609375, -49.36083984375, -47.4970703125, -45.63330078125, -43.76953125, -41.90576171875, -40.0419921875, -38.17822265625, -36.314453125, -34.45068359375, -32.5869140625, -30.72314453125, -28.859375, -26.99560546875, -25.1318359375, -23.26806640625, -21.404296875, -19.54052734375, -17.6767578125, -15.81298828125, -13.94921875, -12.08544921875, -10.2216796875, -8.35791015625, -6.494140625, -4.63037109375, -2.7666015625, -0.90283203125, 0.9609375, 2.82470703125, 4.6884765625, 6.55224609375, 8.416015625, 10.27978515625, 12.1435546875, 14.00732421875, 15.87109375, 17.73486328125, 19.5986328125, 21.46240234375, 23.326171875, 25.18994140625, 27.0537109375, 28.91748046875, 30.78125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 8.0, 9.0, 5.0, 7.0, 10.0, 21.0, 26.0, 42.0, 86.0, 233.0, 876.0, 1534.0, 734.0, 238.0, 96.0, 69.0, 31.0, 19.0, 14.0, 4.0, 6.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.47998046875, -0.4671592712402344, -0.45433807373046875, -0.4415168762207031, -0.4286956787109375, -0.4158744812011719, -0.40305328369140625, -0.3902320861816406, -0.377410888671875, -0.3645896911621094, -0.35176849365234375, -0.3389472961425781, -0.3261260986328125, -0.3133049011230469, -0.30048370361328125, -0.2876625061035156, -0.27484130859375, -0.2620201110839844, -0.24919891357421875, -0.23637771606445312, -0.2235565185546875, -0.21073532104492188, -0.19791412353515625, -0.18509292602539062, -0.172271728515625, -0.15945053100585938, -0.14662933349609375, -0.13380813598632812, -0.1209869384765625, -0.10816574096679688, -0.09534454345703125, -0.08252334594726562, -0.0697021484375, -0.056880950927734375, -0.04405975341796875, -0.031238555908203125, -0.0184173583984375, -0.005596160888671875, 0.00722503662109375, 0.020046234130859375, 0.032867431640625, 0.045688629150390625, 0.05850982666015625, 0.07133102416992188, 0.0841522216796875, 0.09697341918945312, 0.10979461669921875, 0.12261581420898438, 0.13543701171875, 0.14825820922851562, 0.16107940673828125, 0.17390060424804688, 0.1867218017578125, 0.19954299926757812, 0.21236419677734375, 0.22518539428710938, 0.238006591796875, 0.2508277893066406, 0.26364898681640625, 0.2764701843261719, 0.2892913818359375, 0.3021125793457031, 0.31493377685546875, 0.3277549743652344, 0.340576171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 5.0, 19.0, 25.0, 55.0, 91.0, 142.0, 224.0, 183.0, 134.0, 72.0, 28.0, 15.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1533504724502563, -1.1101672649383545, -1.066983938217163, -1.0238007307052612, -0.9806175231933594, -0.9374343156814575, -0.8942510485649109, -0.8510677814483643, -0.8078845739364624, -0.7647013664245605, -0.7215180993080139, -0.6783348321914673, -0.6351516246795654, -0.5919684171676636, -0.5487851500511169, -0.5056018829345703, -0.46241867542266846, -0.4192354381084442, -0.37605220079421997, -0.3328689634799957, -0.2896857261657715, -0.24650248885154724, -0.203319251537323, -0.16013601422309875, -0.11695277690887451, -0.07376953959465027, -0.030586302280426025, 0.012596935033798218, 0.05578017234802246, 0.0989634096622467, 0.14214664697647095, 0.1853298842906952, 0.22851300239562988, 0.2716962397098541, 0.31487947702407837, 0.3580627143383026, 0.40124595165252686, 0.4444291889667511, 0.48761242628097534, 0.530795693397522, 0.5739789009094238, 0.6171621084213257, 0.6603453755378723, 0.703528642654419, 0.7467118501663208, 0.7898950576782227, 0.8330783247947693, 0.8762615919113159, 0.9194447994232178, 0.9626280069351196, 1.0058112144470215, 1.048994541168213, 1.0921777486801147, 1.1353609561920166, 1.178544282913208, 1.2217274904251099, 1.2649106979370117, 1.3080939054489136, 1.3512771129608154, 1.3944604396820068, 1.4376436471939087, 1.4808268547058105, 1.524010181427002, 1.5671933889389038, 1.6103765964508057]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 5.0, 6.0, 9.0, 12.0, 15.0, 18.0, 19.0, 26.0, 20.0, 37.0, 33.0, 40.0, 55.0, 42.0, 48.0, 48.0, 40.0, 44.0, 45.0, 51.0, 53.0, 55.0, 57.0, 44.0, 34.0, 19.0, 22.0, 26.0, 19.0, 16.0, 10.0, 9.0, 10.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6667957305908203, -0.64150071144104, -0.6162057518959045, -0.5909107327461243, -0.565615713596344, -0.5403207540512085, -0.5150257349014282, -0.48973071575164795, -0.46443572640419006, -0.4391407370567322, -0.4138457179069519, -0.388550728559494, -0.36325573921203613, -0.33796072006225586, -0.312665730714798, -0.2873707413673401, -0.2620757222175598, -0.23678071796894073, -0.21148571372032166, -0.18619072437286377, -0.1608957201242447, -0.1356007158756256, -0.11030572652816772, -0.08501072227954865, -0.059715718030929565, -0.034420717507600784, -0.009125716984272003, 0.01616927981376648, 0.04146428406238556, 0.06675928831100464, 0.09205427765846252, 0.1173492819070816, 0.1426442265510559, 0.167939230799675, 0.19323423504829407, 0.21852922439575195, 0.24382422864437103, 0.2691192328929901, 0.294414222240448, 0.31970924139022827, 0.34500423073768616, 0.37029922008514404, 0.3955942392349243, 0.4208892285823822, 0.4461842179298401, 0.47147923707962036, 0.49677422642707825, 0.5220692157745361, 0.5473642349243164, 0.5726592540740967, 0.5979542136192322, 0.6232492327690125, 0.6485442519187927, 0.6738392114639282, 0.6991342306137085, 0.7244292497634888, 0.749724268913269, 0.7750192880630493, 0.8003142476081848, 0.8256092667579651, 0.8509042859077454, 0.8761992454528809, 0.9014942646026611, 0.9267892837524414, 0.9520842432975769]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 12.0, 16.0, 22.0, 45.0, 46.0, 63.0, 126.0, 193.0, 300.0, 492.0, 722.0, 1191.0, 2181.0, 4709.0, 13056.0, 45277.0, 209211.0, 553737.0, 160016.0, 36682.0, 11296.0, 4150.0, 2015.0, 1127.0, 614.0, 452.0, 274.0, 179.0, 122.0, 68.0, 43.0, 33.0, 24.0, 13.0, 8.0, 7.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2252197265625, -0.21827316284179688, -0.21132659912109375, -0.20438003540039062, -0.1974334716796875, -0.19048690795898438, -0.18354034423828125, -0.17659378051757812, -0.169647216796875, -0.16270065307617188, -0.15575408935546875, -0.14880752563476562, -0.1418609619140625, -0.13491439819335938, -0.12796783447265625, -0.12102127075195312, -0.11407470703125, -0.10712814331054688, -0.10018157958984375, -0.09323501586914062, -0.0862884521484375, -0.07934188842773438, -0.07239532470703125, -0.06544876098632812, -0.058502197265625, -0.051555633544921875, -0.04460906982421875, -0.037662506103515625, -0.0307159423828125, -0.023769378662109375, -0.01682281494140625, -0.009876251220703125, -0.0029296875, 0.004016876220703125, 0.01096343994140625, 0.017910003662109375, 0.0248565673828125, 0.031803131103515625, 0.03874969482421875, 0.045696258544921875, 0.052642822265625, 0.059589385986328125, 0.06653594970703125, 0.07348251342773438, 0.0804290771484375, 0.08737564086914062, 0.09432220458984375, 0.10126876831054688, 0.10821533203125, 0.11516189575195312, 0.12210845947265625, 0.12905502319335938, 0.1360015869140625, 0.14294815063476562, 0.14989471435546875, 0.15684127807617188, 0.163787841796875, 0.17073440551757812, 0.17768096923828125, 0.18462753295898438, 0.1915740966796875, 0.19852066040039062, 0.20546722412109375, 0.21241378784179688, 0.2193603515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 4.0, 6.0, 8.0, 11.0, 17.0, 20.0, 19.0, 38.0, 28.0, 42.0, 40.0, 53.0, 48.0, 57.0, 61.0, 62.0, 63.0, 58.0, 51.0, 50.0, 57.0, 45.0, 35.0, 25.0, 23.0, 18.0, 29.0, 16.0, 8.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.587890625, -0.5709266662597656, -0.5539627075195312, -0.5369987487792969, -0.5200347900390625, -0.5030708312988281, -0.48610687255859375, -0.4691429138183594, -0.452178955078125, -0.4352149963378906, -0.41825103759765625, -0.4012870788574219, -0.3843231201171875, -0.3673591613769531, -0.35039520263671875, -0.3334312438964844, -0.31646728515625, -0.2995033264160156, -0.28253936767578125, -0.2655754089355469, -0.2486114501953125, -0.23164749145507812, -0.21468353271484375, -0.19771957397460938, -0.180755615234375, -0.16379165649414062, -0.14682769775390625, -0.12986373901367188, -0.1128997802734375, -0.09593582153320312, -0.07897186279296875, -0.062007904052734375, -0.0450439453125, -0.028079986572265625, -0.01111602783203125, 0.005847930908203125, 0.0228118896484375, 0.039775848388671875, 0.05673980712890625, 0.07370376586914062, 0.090667724609375, 0.10763168334960938, 0.12459564208984375, 0.14155960083007812, 0.1585235595703125, 0.17548751831054688, 0.19245147705078125, 0.20941543579101562, 0.22637939453125, 0.24334335327148438, 0.26030731201171875, 0.2772712707519531, 0.2942352294921875, 0.3111991882324219, 0.32816314697265625, 0.3451271057128906, 0.362091064453125, 0.3790550231933594, 0.39601898193359375, 0.4129829406738281, 0.4299468994140625, 0.4469108581542969, 0.46387481689453125, 0.4808387756347656, 0.497802734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 13.0, 23.0, 24.0, 28.0, 52.0, 89.0, 135.0, 203.0, 327.0, 473.0, 771.0, 1253.0, 2087.0, 3398.0, 5739.0, 9563.0, 16681.0, 30443.0, 58028.0, 117119.0, 222667.0, 259243.0, 154331.0, 76045.0, 39285.0, 20982.0, 11980.0, 6921.0, 4031.0, 2482.0, 1458.0, 980.0, 644.0, 385.0, 245.0, 126.0, 123.0, 79.0, 40.0, 21.0, 14.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.083251953125, -0.08066654205322266, -0.07808113098144531, -0.07549571990966797, -0.07291030883789062, -0.07032489776611328, -0.06773948669433594, -0.0651540756225586, -0.06256866455078125, -0.059983253479003906, -0.05739784240722656, -0.05481243133544922, -0.052227020263671875, -0.04964160919189453, -0.04705619812011719, -0.044470787048339844, -0.0418853759765625, -0.039299964904785156, -0.03671455383300781, -0.03412914276123047, -0.031543731689453125, -0.02895832061767578, -0.026372909545898438, -0.023787498474121094, -0.02120208740234375, -0.018616676330566406, -0.016031265258789062, -0.013445854187011719, -0.010860443115234375, -0.008275032043457031, -0.0056896209716796875, -0.0031042098999023438, -0.000518798828125, 0.0020666122436523438, 0.0046520233154296875, 0.007237434387207031, 0.009822845458984375, 0.012408256530761719, 0.014993667602539062, 0.017579078674316406, 0.02016448974609375, 0.022749900817871094, 0.025335311889648438, 0.02792072296142578, 0.030506134033203125, 0.03309154510498047, 0.03567695617675781, 0.038262367248535156, 0.0408477783203125, 0.043433189392089844, 0.04601860046386719, 0.04860401153564453, 0.051189422607421875, 0.05377483367919922, 0.05636024475097656, 0.058945655822753906, 0.06153106689453125, 0.0641164779663086, 0.06670188903808594, 0.06928730010986328, 0.07187271118164062, 0.07445812225341797, 0.07704353332519531, 0.07962894439697266, 0.08221435546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 9.0, 8.0, 14.0, 13.0, 14.0, 15.0, 15.0, 27.0, 35.0, 32.0, 27.0, 47.0, 42.0, 48.0, 51.0, 56.0, 54.0, 50.0, 54.0, 47.0, 43.0, 40.0, 41.0, 35.0, 34.0, 33.0, 24.0, 11.0, 21.0, 17.0, 7.0, 7.0, 5.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.685546875, -0.658782958984375, -0.63201904296875, -0.605255126953125, -0.5784912109375, -0.551727294921875, -0.52496337890625, -0.498199462890625, -0.471435546875, -0.444671630859375, -0.41790771484375, -0.391143798828125, -0.3643798828125, -0.337615966796875, -0.31085205078125, -0.284088134765625, -0.25732421875, -0.230560302734375, -0.20379638671875, -0.177032470703125, -0.1502685546875, -0.123504638671875, -0.09674072265625, -0.069976806640625, -0.043212890625, -0.016448974609375, 0.01031494140625, 0.037078857421875, 0.0638427734375, 0.090606689453125, 0.11737060546875, 0.144134521484375, 0.1708984375, 0.197662353515625, 0.22442626953125, 0.251190185546875, 0.2779541015625, 0.304718017578125, 0.33148193359375, 0.358245849609375, 0.385009765625, 0.411773681640625, 0.43853759765625, 0.465301513671875, 0.4920654296875, 0.518829345703125, 0.54559326171875, 0.572357177734375, 0.59912109375, 0.625885009765625, 0.65264892578125, 0.679412841796875, 0.7061767578125, 0.732940673828125, 0.75970458984375, 0.786468505859375, 0.813232421875, 0.839996337890625, 0.86676025390625, 0.893524169921875, 0.9202880859375, 0.947052001953125, 0.97381591796875, 1.000579833984375, 1.02734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 12.0, 18.0, 13.0, 14.0, 35.0, 43.0, 75.0, 82.0, 152.0, 189.0, 281.0, 426.0, 675.0, 1053.0, 1780.0, 3238.0, 6077.0, 12533.0, 26817.0, 61313.0, 138994.0, 264576.0, 269473.0, 142259.0, 63138.0, 27959.0, 12885.0, 6271.0, 3227.0, 1805.0, 1097.0, 723.0, 460.0, 248.0, 176.0, 134.0, 98.0, 68.0, 32.0, 43.0, 26.0, 11.0, 11.0, 4.0, 8.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00620269775390625, -0.0060027241706848145, -0.005802750587463379, -0.005602777004241943, -0.005402803421020508, -0.005202829837799072, -0.005002856254577637, -0.004802882671356201, -0.004602909088134766, -0.00440293550491333, -0.0042029619216918945, -0.004002988338470459, -0.0038030147552490234, -0.003603041172027588, -0.0034030675888061523, -0.003203094005584717, -0.0030031204223632812, -0.0028031468391418457, -0.00260317325592041, -0.0024031996726989746, -0.002203226089477539, -0.0020032525062561035, -0.001803278923034668, -0.0016033053398132324, -0.0014033317565917969, -0.0012033581733703613, -0.0010033845901489258, -0.0008034110069274902, -0.0006034374237060547, -0.00040346384048461914, -0.0002034902572631836, -3.516674041748047e-06, 0.0001964569091796875, 0.00039643049240112305, 0.0005964040756225586, 0.0007963776588439941, 0.0009963512420654297, 0.0011963248252868652, 0.0013962984085083008, 0.0015962719917297363, 0.0017962455749511719, 0.0019962191581726074, 0.002196192741394043, 0.0023961663246154785, 0.002596139907836914, 0.0027961134910583496, 0.002996087074279785, 0.0031960606575012207, 0.0033960342407226562, 0.003596007823944092, 0.0037959814071655273, 0.003995954990386963, 0.0041959285736083984, 0.004395902156829834, 0.0045958757400512695, 0.004795849323272705, 0.004995822906494141, 0.005195796489715576, 0.005395770072937012, 0.005595743656158447, 0.005795717239379883, 0.005995690822601318, 0.006195664405822754, 0.0063956379890441895, 0.006595611572265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 14.0, 16.0, 25.0, 20.0, 36.0, 54.0, 55.0, 80.0, 106.0, 106.0, 103.0, 88.0, 83.0, 66.0, 32.0, 19.0, 19.0, 18.0, 15.0, 10.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.7179718017578125e-05, -2.652965486049652e-05, -2.5879591703414917e-05, -2.5229528546333313e-05, -2.457946538925171e-05, -2.3929402232170105e-05, -2.32793390750885e-05, -2.2629275918006897e-05, -2.1979212760925293e-05, -2.132914960384369e-05, -2.0679086446762085e-05, -2.002902328968048e-05, -1.9378960132598877e-05, -1.8728896975517273e-05, -1.807883381843567e-05, -1.7428770661354065e-05, -1.677870750427246e-05, -1.6128644347190857e-05, -1.5478581190109253e-05, -1.4828518033027649e-05, -1.4178454875946045e-05, -1.3528391718864441e-05, -1.2878328561782837e-05, -1.2228265404701233e-05, -1.1578202247619629e-05, -1.0928139090538025e-05, -1.0278075933456421e-05, -9.628012776374817e-06, -8.977949619293213e-06, -8.327886462211609e-06, -7.677823305130005e-06, -7.027760148048401e-06, -6.377696990966797e-06, -5.727633833885193e-06, -5.077570676803589e-06, -4.427507519721985e-06, -3.777444362640381e-06, -3.127381205558777e-06, -2.477318048477173e-06, -1.8272548913955688e-06, -1.1771917343139648e-06, -5.271285772323608e-07, 1.2293457984924316e-07, 7.729977369308472e-07, 1.4230608940124512e-06, 2.073124051094055e-06, 2.723187208175659e-06, 3.373250365257263e-06, 4.023313522338867e-06, 4.673376679420471e-06, 5.323439836502075e-06, 5.973502993583679e-06, 6.623566150665283e-06, 7.273629307746887e-06, 7.923692464828491e-06, 8.573755621910095e-06, 9.2238187789917e-06, 9.873881936073303e-06, 1.0523945093154907e-05, 1.1174008250236511e-05, 1.1824071407318115e-05, 1.247413456439972e-05, 1.3124197721481323e-05, 1.3774260878562927e-05, 1.4424324035644531e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 8.0, 18.0, 7.0, 12.0, 13.0, 20.0, 22.0, 25.0, 36.0, 42.0, 26.0, 59.0, 56.0, 80.0, 117.0, 236.0, 3171.0, 999510.0, 43990.0, 392.0, 146.0, 84.0, 79.0, 53.0, 42.0, 41.0, 43.0, 30.0, 37.0, 22.0, 21.0, 12.0, 14.0, 13.0, 8.0, 12.0, 10.0, 5.0, 7.0, 6.0, 9.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.039031982421875, -0.03767204284667969, -0.036312103271484375, -0.03495216369628906, -0.03359222412109375, -0.03223228454589844, -0.030872344970703125, -0.029512405395507812, -0.0281524658203125, -0.026792526245117188, -0.025432586669921875, -0.024072647094726562, -0.02271270751953125, -0.021352767944335938, -0.019992828369140625, -0.018632888793945312, -0.01727294921875, -0.015913009643554688, -0.014553070068359375, -0.013193130493164062, -0.01183319091796875, -0.010473251342773438, -0.009113311767578125, -0.0077533721923828125, -0.0063934326171875, -0.0050334930419921875, -0.003673553466796875, -0.0023136138916015625, -0.00095367431640625, 0.0004062652587890625, 0.001766204833984375, 0.0031261444091796875, 0.004486083984375, 0.0058460235595703125, 0.007205963134765625, 0.008565902709960938, 0.00992584228515625, 0.011285781860351562, 0.012645721435546875, 0.014005661010742188, 0.0153656005859375, 0.016725540161132812, 0.018085479736328125, 0.019445419311523438, 0.02080535888671875, 0.022165298461914062, 0.023525238037109375, 0.024885177612304688, 0.0262451171875, 0.027605056762695312, 0.028964996337890625, 0.030324935913085938, 0.03168487548828125, 0.03304481506347656, 0.034404754638671875, 0.03576469421386719, 0.0371246337890625, 0.03848457336425781, 0.039844512939453125, 0.04120445251464844, 0.04256439208984375, 0.04392433166503906, 0.045284271240234375, 0.04664421081542969, 0.048004150390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 11.0, 9.0, 16.0, 20.0, 16.0, 21.0, 17.0, 34.0, 33.0, 22.0, 25.0, 30.0, 44.0, 36.0, 47.0, 51.0, 49.0, 55.0, 48.0, 52.0, 40.0, 49.0, 32.0, 38.0, 34.0, 28.0, 26.0, 19.0, 21.0, 17.0, 8.0, 13.0, 9.0, 9.0, 6.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00209808349609375, -0.00202903151512146, -0.00195997953414917, -0.0018909275531768799, -0.0018218755722045898, -0.0017528235912322998, -0.0016837716102600098, -0.0016147196292877197, -0.0015456676483154297, -0.0014766156673431396, -0.0014075636863708496, -0.0013385117053985596, -0.0012694597244262695, -0.0012004077434539795, -0.0011313557624816895, -0.0010623037815093994, -0.0009932518005371094, -0.0009241998195648193, -0.0008551478385925293, -0.0007860958576202393, -0.0007170438766479492, -0.0006479918956756592, -0.0005789399147033691, -0.0005098879337310791, -0.00044083595275878906, -0.000371783971786499, -0.000302731990814209, -0.00023368000984191895, -0.0001646280288696289, -9.557604789733887e-05, -2.6524066925048828e-05, 4.252791404724121e-05, 0.00011157989501953125, 0.0001806318759918213, 0.00024968385696411133, 0.00031873583793640137, 0.0003877878189086914, 0.00045683979988098145, 0.0005258917808532715, 0.0005949437618255615, 0.0006639957427978516, 0.0007330477237701416, 0.0008020997047424316, 0.0008711516857147217, 0.0009402036666870117, 0.0010092556476593018, 0.0010783076286315918, 0.0011473596096038818, 0.0012164115905761719, 0.001285463571548462, 0.001354515552520752, 0.001423567533493042, 0.001492619514465332, 0.001561671495437622, 0.0016307234764099121, 0.0016997754573822021, 0.0017688274383544922, 0.0018378794193267822, 0.0019069314002990723, 0.0019759833812713623, 0.0020450353622436523, 0.0021140873432159424, 0.0021831393241882324, 0.0022521913051605225, 0.0023212432861328125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 10.0, 30.0, 78.0, 158.0, 267.0, 257.0, 127.0, 47.0, 12.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9061234593391418, -0.8709312081336975, -0.835739016532898, -0.8005467653274536, -0.7653545141220093, -0.7301623225212097, -0.6949700713157654, -0.6597778797149658, -0.6245856285095215, -0.5893933773040771, -0.5542011857032776, -0.5190089344978333, -0.4838167130947113, -0.44862449169158936, -0.413432240486145, -0.37824001908302307, -0.3430477976799011, -0.3078555762767792, -0.2726633548736572, -0.2374711036682129, -0.20227888226509094, -0.167086660861969, -0.13189442455768585, -0.09670218825340271, -0.06150996685028076, -0.026317737996578217, 0.008874490857124329, 0.044066719710826874, 0.07925894856452942, 0.11445116996765137, 0.1496434062719345, 0.18483564257621765, 0.22002792358398438, 0.2552201449871063, 0.29041236639022827, 0.3256046175956726, 0.36079683899879456, 0.3959890604019165, 0.43118131160736084, 0.4663735330104828, 0.5015657544136047, 0.5367580056190491, 0.5719501972198486, 0.607142448425293, 0.6423346996307373, 0.6775268912315369, 0.7127191424369812, 0.7479113340377808, 0.7831035852432251, 0.8182958364486694, 0.853488028049469, 0.8886802792549133, 0.9238724708557129, 0.9590647220611572, 0.9942569732666016, 1.029449224472046, 1.0646414756774902, 1.0998337268829346, 1.135025978088379, 1.1702181100845337, 1.205410361289978, 1.2406026124954224, 1.2757948637008667, 1.310987114906311, 1.3461792469024658]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 10.0, 11.0, 10.0, 14.0, 20.0, 28.0, 26.0, 31.0, 42.0, 44.0, 61.0, 57.0, 52.0, 62.0, 50.0, 53.0, 54.0, 70.0, 70.0, 52.0, 36.0, 33.0, 28.0, 22.0, 15.0, 12.0, 19.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45151618123054504, -0.4350161552429199, -0.4185160994529724, -0.4020160734653473, -0.38551604747772217, -0.36901599168777466, -0.35251596570014954, -0.3360159397125244, -0.3195158839225769, -0.3030158579349518, -0.2865158021450043, -0.27001577615737915, -0.25351575016975403, -0.2370157092809677, -0.2205156683921814, -0.20401564240455627, -0.18751561641693115, -0.17101557552814484, -0.15451554954051971, -0.1380155086517334, -0.12151547521352768, -0.10501544177532196, -0.08851540088653564, -0.07201536744832993, -0.05551533401012421, -0.03901530057191849, -0.02251526340842247, -0.006015226244926453, 0.010484807193279266, 0.026984840631484985, 0.0434848815202713, 0.05998491495847702, 0.07648497819900513, 0.09298501163721085, 0.10948504507541656, 0.12598508596420288, 0.142485111951828, 0.15898515284061432, 0.17548519372940063, 0.19198521971702576, 0.20848526060581207, 0.2249853014945984, 0.2414853274822235, 0.25798535346984863, 0.27448540925979614, 0.29098543524742126, 0.3074854612350464, 0.3239855170249939, 0.340485543012619, 0.35698556900024414, 0.37348562479019165, 0.3899856507778168, 0.4064856767654419, 0.4229857325553894, 0.4394857585430145, 0.45598578453063965, 0.47248584032058716, 0.4889858663082123, 0.5054858922958374, 0.5219859480857849, 0.5384860038757324, 0.5549860000610352, 0.5714860558509827, 0.5879861116409302, 0.6044861078262329]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 8.0, 22.0, 31.0, 26.0, 40.0, 66.0, 130.0, 220.0, 426.0, 906.0, 2223.0, 5969.0, 18542.0, 75113.0, 370603.0, 445999.0, 93935.0, 22839.0, 7026.0, 2337.0, 1012.0, 481.0, 234.0, 130.0, 98.0, 40.0, 30.0, 23.0, 16.0, 17.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49951171875, -0.48566436767578125, -0.4718170166015625, -0.45796966552734375, -0.444122314453125, -0.43027496337890625, -0.4164276123046875, -0.40258026123046875, -0.38873291015625, -0.37488555908203125, -0.3610382080078125, -0.34719085693359375, -0.333343505859375, -0.31949615478515625, -0.3056488037109375, -0.29180145263671875, -0.2779541015625, -0.26410675048828125, -0.2502593994140625, -0.23641204833984375, -0.222564697265625, -0.20871734619140625, -0.1948699951171875, -0.18102264404296875, -0.16717529296875, -0.15332794189453125, -0.1394805908203125, -0.12563323974609375, -0.111785888671875, -0.09793853759765625, -0.0840911865234375, -0.07024383544921875, -0.056396484375, -0.04254913330078125, -0.0287017822265625, -0.01485443115234375, -0.001007080078125, 0.01284027099609375, 0.0266876220703125, 0.04053497314453125, 0.05438232421875, 0.06822967529296875, 0.0820770263671875, 0.09592437744140625, 0.109771728515625, 0.12361907958984375, 0.1374664306640625, 0.15131378173828125, 0.1651611328125, 0.17900848388671875, 0.1928558349609375, 0.20670318603515625, 0.220550537109375, 0.23439788818359375, 0.2482452392578125, 0.26209259033203125, 0.27593994140625, 0.28978729248046875, 0.3036346435546875, 0.31748199462890625, 0.331329345703125, 0.34517669677734375, 0.3590240478515625, 0.37287139892578125, 0.38671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 1.0, 4.0, 6.0, 17.0, 10.0, 12.0, 12.0, 9.0, 23.0, 26.0, 25.0, 32.0, 32.0, 43.0, 37.0, 31.0, 38.0, 49.0, 36.0, 41.0, 45.0, 38.0, 42.0, 40.0, 40.0, 43.0, 38.0, 34.0, 13.0, 30.0, 21.0, 24.0, 21.0, 17.0, 15.0, 5.0, 14.0, 11.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.533203125, -2.4456787109375, -2.358154296875, -2.2706298828125, -2.18310546875, -2.0955810546875, -2.008056640625, -1.9205322265625, -1.8330078125, -1.7454833984375, -1.657958984375, -1.5704345703125, -1.48291015625, -1.3953857421875, -1.307861328125, -1.2203369140625, -1.1328125, -1.0452880859375, -0.957763671875, -0.8702392578125, -0.78271484375, -0.6951904296875, -0.607666015625, -0.5201416015625, -0.4326171875, -0.3450927734375, -0.257568359375, -0.1700439453125, -0.08251953125, 0.0050048828125, 0.092529296875, 0.1800537109375, 0.267578125, 0.3551025390625, 0.442626953125, 0.5301513671875, 0.61767578125, 0.7052001953125, 0.792724609375, 0.8802490234375, 0.9677734375, 1.0552978515625, 1.142822265625, 1.2303466796875, 1.31787109375, 1.4053955078125, 1.492919921875, 1.5804443359375, 1.66796875, 1.7554931640625, 1.843017578125, 1.9305419921875, 2.01806640625, 2.1055908203125, 2.193115234375, 2.2806396484375, 2.3681640625, 2.4556884765625, 2.543212890625, 2.6307373046875, 2.71826171875, 2.8057861328125, 2.893310546875, 2.9808349609375, 3.068359375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 1.0, 5.0, 4.0, 2.0, 8.0, 17.0, 10.0, 9.0, 14.0, 17.0, 21.0, 31.0, 26.0, 38.0, 40.0, 42.0, 49.0, 94.0, 366.0, 179708.0, 867159.0, 425.0, 122.0, 59.0, 45.0, 38.0, 35.0, 25.0, 23.0, 20.0, 18.0, 12.0, 18.0, 8.0, 9.0, 7.0, 9.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.890625, -8.6214599609375, -8.352294921875, -8.0831298828125, -7.81396484375, -7.5447998046875, -7.275634765625, -7.0064697265625, -6.7373046875, -6.4681396484375, -6.198974609375, -5.9298095703125, -5.66064453125, -5.3914794921875, -5.122314453125, -4.8531494140625, -4.583984375, -4.3148193359375, -4.045654296875, -3.7764892578125, -3.50732421875, -3.2381591796875, -2.968994140625, -2.6998291015625, -2.4306640625, -2.1614990234375, -1.892333984375, -1.6231689453125, -1.35400390625, -1.0848388671875, -0.815673828125, -0.5465087890625, -0.27734375, -0.0081787109375, 0.260986328125, 0.5301513671875, 0.79931640625, 1.0684814453125, 1.337646484375, 1.6068115234375, 1.8759765625, 2.1451416015625, 2.414306640625, 2.6834716796875, 2.95263671875, 3.2218017578125, 3.490966796875, 3.7601318359375, 4.029296875, 4.2984619140625, 4.567626953125, 4.8367919921875, 5.10595703125, 5.3751220703125, 5.644287109375, 5.9134521484375, 6.1826171875, 6.4517822265625, 6.720947265625, 6.9901123046875, 7.25927734375, 7.5284423828125, 7.797607421875, 8.0667724609375, 8.3359375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 1.0, 4.0, 5.0, 2.0, 8.0, 18.0, 10.0, 9.0, 14.0, 16.0, 22.0, 29.0, 31.0, 35.0, 41.0, 42.0, 40.0, 49.0, 44.0, 58.0, 66.0, 60.0, 62.0, 48.0, 46.0, 37.0, 36.0, 28.0, 20.0, 21.0, 16.0, 12.0, 18.0, 9.0, 9.0, 7.0, 9.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.888671875, -3.77093505859375, -3.6531982421875, -3.53546142578125, -3.417724609375, -3.29998779296875, -3.1822509765625, -3.06451416015625, -2.94677734375, -2.82904052734375, -2.7113037109375, -2.59356689453125, -2.475830078125, -2.35809326171875, -2.2403564453125, -2.12261962890625, -2.0048828125, -1.88714599609375, -1.7694091796875, -1.65167236328125, -1.533935546875, -1.41619873046875, -1.2984619140625, -1.18072509765625, -1.06298828125, -0.94525146484375, -0.8275146484375, -0.70977783203125, -0.592041015625, -0.47430419921875, -0.3565673828125, -0.23883056640625, -0.12109375, -0.00335693359375, 0.1143798828125, 0.23211669921875, 0.349853515625, 0.46759033203125, 0.5853271484375, 0.70306396484375, 0.82080078125, 0.93853759765625, 1.0562744140625, 1.17401123046875, 1.291748046875, 1.40948486328125, 1.5272216796875, 1.64495849609375, 1.7626953125, 1.88043212890625, 1.9981689453125, 2.11590576171875, 2.233642578125, 2.35137939453125, 2.4691162109375, 2.58685302734375, 2.70458984375, 2.82232666015625, 2.9400634765625, 3.05780029296875, 3.175537109375, 3.29327392578125, 3.4110107421875, 3.52874755859375, 3.646484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 13.0, 9.0, 4.0, 8.0, 7.0, 25.0, 31.0, 46.0, 162.0, 484.0, 2115.0, 25768.0, 1001149.0, 16356.0, 1691.0, 379.0, 134.0, 58.0, 39.0, 17.0, 12.0, 9.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.263427734375, -0.2553062438964844, -0.24718475341796875, -0.23906326293945312, -0.2309417724609375, -0.22282028198242188, -0.21469879150390625, -0.20657730102539062, -0.198455810546875, -0.19033432006835938, -0.18221282958984375, -0.17409133911132812, -0.1659698486328125, -0.15784835815429688, -0.14972686767578125, -0.14160537719726562, -0.13348388671875, -0.12536239624023438, -0.11724090576171875, -0.10911941528320312, -0.1009979248046875, -0.09287643432617188, -0.08475494384765625, -0.07663345336914062, -0.068511962890625, -0.060390472412109375, -0.05226898193359375, -0.044147491455078125, -0.0360260009765625, -0.027904510498046875, -0.01978302001953125, -0.011661529541015625, -0.0035400390625, 0.004581451416015625, 0.01270294189453125, 0.020824432373046875, 0.0289459228515625, 0.037067413330078125, 0.04518890380859375, 0.053310394287109375, 0.061431884765625, 0.06955337524414062, 0.07767486572265625, 0.08579635620117188, 0.0939178466796875, 0.10203933715820312, 0.11016082763671875, 0.11828231811523438, 0.12640380859375, 0.13452529907226562, 0.14264678955078125, 0.15076828002929688, 0.1588897705078125, 0.16701126098632812, 0.17513275146484375, 0.18325424194335938, 0.191375732421875, 0.19949722290039062, 0.20761871337890625, 0.21574020385742188, 0.2238616943359375, 0.23198318481445312, 0.24010467529296875, 0.24822616577148438, 0.25634765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 9.0, 12.0, 26.0, 39.0, 73.0, 127.0, 263.0, 190.0, 92.0, 52.0, 37.0, 17.0, 15.0, 6.0, 5.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2278556823730469e-05, -1.1760741472244263e-05, -1.1242926120758057e-05, -1.072511076927185e-05, -1.0207295417785645e-05, -9.689480066299438e-06, -9.171664714813232e-06, -8.653849363327026e-06, -8.13603401184082e-06, -7.618218660354614e-06, -7.100403308868408e-06, -6.582587957382202e-06, -6.064772605895996e-06, -5.54695725440979e-06, -5.029141902923584e-06, -4.511326551437378e-06, -3.993511199951172e-06, -3.475695848464966e-06, -2.9578804969787598e-06, -2.4400651454925537e-06, -1.9222497940063477e-06, -1.4044344425201416e-06, -8.866190910339355e-07, -3.688037395477295e-07, 1.4901161193847656e-07, 6.668269634246826e-07, 1.1846423149108887e-06, 1.7024576663970947e-06, 2.2202730178833008e-06, 2.738088369369507e-06, 3.255903720855713e-06, 3.773719072341919e-06, 4.291534423828125e-06, 4.809349775314331e-06, 5.327165126800537e-06, 5.844980478286743e-06, 6.362795829772949e-06, 6.880611181259155e-06, 7.398426532745361e-06, 7.916241884231567e-06, 8.434057235717773e-06, 8.95187258720398e-06, 9.469687938690186e-06, 9.987503290176392e-06, 1.0505318641662598e-05, 1.1023133993148804e-05, 1.154094934463501e-05, 1.2058764696121216e-05, 1.2576580047607422e-05, 1.3094395399093628e-05, 1.3612210750579834e-05, 1.413002610206604e-05, 1.4647841453552246e-05, 1.5165656805038452e-05, 1.5683472156524658e-05, 1.6201287508010864e-05, 1.671910285949707e-05, 1.7236918210983276e-05, 1.7754733562469482e-05, 1.827254891395569e-05, 1.8790364265441895e-05, 1.93081796169281e-05, 1.9825994968414307e-05, 2.0343810319900513e-05, 2.086162567138672e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 2.0, 1.0, 4.0, 5.0, 11.0, 13.0, 11.0, 14.0, 33.0, 73.0, 155.0, 672.0, 3360.0, 53637.0, 979731.0, 8957.0, 1343.0, 303.0, 104.0, 43.0, 20.0, 10.0, 12.0, 7.0, 6.0, 5.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2467041015625, -0.2373065948486328, -0.22790908813476562, -0.21851158142089844, -0.20911407470703125, -0.19971656799316406, -0.19031906127929688, -0.1809215545654297, -0.1715240478515625, -0.1621265411376953, -0.15272903442382812, -0.14333152770996094, -0.13393402099609375, -0.12453651428222656, -0.11513900756835938, -0.10574150085449219, -0.096343994140625, -0.08694648742675781, -0.07754898071289062, -0.06815147399902344, -0.05875396728515625, -0.04935646057128906, -0.039958953857421875, -0.030561447143554688, -0.0211639404296875, -0.011766433715820312, -0.002368927001953125, 0.0070285797119140625, 0.01642608642578125, 0.025823593139648438, 0.035221099853515625, 0.04461860656738281, 0.05401611328125, 0.06341361999511719, 0.07281112670898438, 0.08220863342285156, 0.09160614013671875, 0.10100364685058594, 0.11040115356445312, 0.11979866027832031, 0.1291961669921875, 0.1385936737060547, 0.14799118041992188, 0.15738868713378906, 0.16678619384765625, 0.17618370056152344, 0.18558120727539062, 0.1949787139892578, 0.204376220703125, 0.2137737274169922, 0.22317123413085938, 0.23256874084472656, 0.24196624755859375, 0.25136375427246094, 0.2607612609863281, 0.2701587677001953, 0.2795562744140625, 0.2889537811279297, 0.2983512878417969, 0.30774879455566406, 0.31714630126953125, 0.32654380798339844, 0.3359413146972656, 0.3453388214111328, 0.354736328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 3.0, 4.0, 10.0, 20.0, 28.0, 57.0, 140.0, 292.0, 219.0, 100.0, 44.0, 26.0, 21.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.06878662109375, -0.06705808639526367, -0.06532955169677734, -0.06360101699829102, -0.06187248229980469, -0.06014394760131836, -0.05841541290283203, -0.0566868782043457, -0.054958343505859375, -0.05322980880737305, -0.05150127410888672, -0.04977273941040039, -0.04804420471191406, -0.046315670013427734, -0.044587135314941406, -0.04285860061645508, -0.04113006591796875, -0.03940153121948242, -0.037672996520996094, -0.035944461822509766, -0.03421592712402344, -0.03248739242553711, -0.03075885772705078, -0.029030323028564453, -0.027301788330078125, -0.025573253631591797, -0.02384471893310547, -0.02211618423461914, -0.020387649536132812, -0.018659114837646484, -0.016930580139160156, -0.015202045440673828, -0.0134735107421875, -0.011744976043701172, -0.010016441345214844, -0.008287906646728516, -0.0065593719482421875, -0.004830837249755859, -0.0031023025512695312, -0.0013737678527832031, 0.000354766845703125, 0.002083301544189453, 0.0038118362426757812, 0.005540370941162109, 0.0072689056396484375, 0.008997440338134766, 0.010725975036621094, 0.012454509735107422, 0.01418304443359375, 0.015911579132080078, 0.017640113830566406, 0.019368648529052734, 0.021097183227539062, 0.02282571792602539, 0.02455425262451172, 0.026282787322998047, 0.028011322021484375, 0.029739856719970703, 0.03146839141845703, 0.03319692611694336, 0.03492546081542969, 0.036653995513916016, 0.038382530212402344, 0.04011106491088867, 0.041839599609375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 31.0, 87.0, 298.0, 386.0, 158.0, 34.0, 8.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.432240009307861, -5.3282060623168945, -5.224172115325928, -5.120137691497803, -5.016103744506836, -4.912069797515869, -4.808035850524902, -4.7040019035339355, -4.599967956542969, -4.495934009552002, -4.391900062561035, -4.28786563873291, -4.183831691741943, -4.079797744750977, -3.9757637977600098, -3.871729850769043, -3.767695426940918, -3.663661479949951, -3.5596272945404053, -3.4555933475494385, -3.3515591621398926, -3.247525215148926, -3.143491268157959, -3.039457321166992, -2.9354231357574463, -2.8313891887664795, -2.7273550033569336, -2.623321056365967, -2.519287109375, -2.415252923965454, -2.3112189769744873, -2.2071847915649414, -2.1031508445739746, -1.9991167783737183, -1.895082712173462, -1.7910487651824951, -1.6870146989822388, -1.5829806327819824, -1.4789466857910156, -1.3749126195907593, -1.2708784341812134, -1.166844367980957, -1.0628104209899902, -0.9587763547897339, -0.8547422885894775, -0.7507082223892212, -0.6466742157936096, -0.542640209197998, -0.4386061429977417, -0.33457210659980774, -0.23053807020187378, -0.12650403380393982, -0.02246999740600586, 0.08156406879425049, 0.18559807538986206, 0.28963208198547363, 0.39366614818573, 0.49770018458366394, 0.6017342209815979, 0.7057682275772095, 0.8098022937774658, 0.9138363599777222, 1.0178704261779785, 1.1219043731689453, 1.2259384393692017]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 2.0, 4.0, 7.0, 9.0, 5.0, 9.0, 12.0, 9.0, 20.0, 20.0, 19.0, 14.0, 19.0, 21.0, 25.0, 37.0, 42.0, 32.0, 38.0, 41.0, 35.0, 27.0, 36.0, 36.0, 44.0, 32.0, 36.0, 26.0, 31.0, 32.0, 27.0, 18.0, 28.0, 17.0, 33.0, 30.0, 16.0, 14.0, 15.0, 13.0, 16.0, 15.0, 7.0, 10.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.837573528289795, -3.715958595275879, -3.594343662261963, -3.472728729248047, -3.351113796234131, -3.229498863220215, -3.107883930206299, -2.986268997192383, -2.864654064178467, -2.743039131164551, -2.6214241981506348, -2.4998092651367188, -2.3781943321228027, -2.2565793991088867, -2.1349644660949707, -2.0133495330810547, -1.8917347192764282, -1.7701197862625122, -1.6485048532485962, -1.5268899202346802, -1.4052749872207642, -1.2836601734161377, -1.1620452404022217, -1.0404303073883057, -0.9188153147697449, -0.7972003817558289, -0.6755854487419128, -0.5539705753326416, -0.4323556125164032, -0.31074070930480957, -0.18912577629089355, -0.06751084327697754, 0.05410408973693848, 0.1757190227508545, 0.2973339557647705, 0.41894885897636414, 0.5405638217926025, 0.6621786952018738, 0.7837936282157898, 0.9054085612297058, 1.0270235538482666, 1.1486384868621826, 1.2702534198760986, 1.3918683528900146, 1.5134832859039307, 1.6350982189178467, 1.7567131519317627, 1.8783280849456787, 1.9999428987503052, 2.1215577125549316, 2.2431726455688477, 2.3647875785827637, 2.4864025115966797, 2.6080174446105957, 2.7296323776245117, 2.8512473106384277, 2.9728622436523438, 3.0944771766662598, 3.216092109680176, 3.337707042694092, 3.459321975708008, 3.580936908721924, 3.70255184173584, 3.824166774749756, 3.945781707763672]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 6.0, 5.0, 9.0, 13.0, 10.0, 19.0, 20.0, 17.0, 13.0, 29.0, 29.0, 17.0, 24.0, 35.0, 48.0, 71.0, 111.0, 336.0, 1364.0, 11848.0, 984889.0, 3128476.0, 62996.0, 2843.0, 518.0, 149.0, 76.0, 44.0, 32.0, 36.0, 25.0, 23.0, 18.0, 17.0, 18.0, 15.0, 14.0, 15.0, 13.0, 9.0, 12.0, 4.0, 1.0, 6.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.53515625, -1.4825897216796875, -1.430023193359375, -1.3774566650390625, -1.32489013671875, -1.2723236083984375, -1.219757080078125, -1.1671905517578125, -1.1146240234375, -1.0620574951171875, -1.009490966796875, -0.9569244384765625, -0.90435791015625, -0.8517913818359375, -0.799224853515625, -0.7466583251953125, -0.694091796875, -0.6415252685546875, -0.588958740234375, -0.5363922119140625, -0.48382568359375, -0.4312591552734375, -0.378692626953125, -0.3261260986328125, -0.2735595703125, -0.2209930419921875, -0.168426513671875, -0.1158599853515625, -0.06329345703125, -0.0107269287109375, 0.041839599609375, 0.0944061279296875, 0.14697265625, 0.1995391845703125, 0.252105712890625, 0.3046722412109375, 0.35723876953125, 0.4098052978515625, 0.462371826171875, 0.5149383544921875, 0.5675048828125, 0.6200714111328125, 0.672637939453125, 0.7252044677734375, 0.77777099609375, 0.8303375244140625, 0.882904052734375, 0.9354705810546875, 0.988037109375, 1.0406036376953125, 1.093170166015625, 1.1457366943359375, 1.19830322265625, 1.2508697509765625, 1.303436279296875, 1.3560028076171875, 1.4085693359375, 1.4611358642578125, 1.513702392578125, 1.5662689208984375, 1.61883544921875, 1.6714019775390625, 1.723968505859375, 1.7765350341796875, 1.8291015625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 3.0, 14.0, 8.0, 11.0, 4.0, 16.0, 32.0, 27.0, 40.0, 33.0, 53.0, 55.0, 47.0, 66.0, 72.0, 72.0, 66.0, 62.0, 63.0, 58.0, 46.0, 39.0, 23.0, 20.0, 20.0, 12.0, 13.0, 7.0, 10.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56494140625, -0.5467681884765625, -0.528594970703125, -0.5104217529296875, -0.49224853515625, -0.4740753173828125, -0.455902099609375, -0.4377288818359375, -0.4195556640625, -0.4013824462890625, -0.383209228515625, -0.3650360107421875, -0.34686279296875, -0.3286895751953125, -0.310516357421875, -0.2923431396484375, -0.274169921875, -0.2559967041015625, -0.237823486328125, -0.2196502685546875, -0.20147705078125, -0.1833038330078125, -0.165130615234375, -0.1469573974609375, -0.1287841796875, -0.1106109619140625, -0.092437744140625, -0.0742645263671875, -0.05609130859375, -0.0379180908203125, -0.019744873046875, -0.0015716552734375, 0.0166015625, 0.0347747802734375, 0.052947998046875, 0.0711212158203125, 0.08929443359375, 0.1074676513671875, 0.125640869140625, 0.1438140869140625, 0.1619873046875, 0.1801605224609375, 0.198333740234375, 0.2165069580078125, 0.23468017578125, 0.2528533935546875, 0.271026611328125, 0.2891998291015625, 0.307373046875, 0.3255462646484375, 0.343719482421875, 0.3618927001953125, 0.38006591796875, 0.3982391357421875, 0.416412353515625, 0.4345855712890625, 0.4527587890625, 0.4709320068359375, 0.489105224609375, 0.5072784423828125, 0.52545166015625, 0.5436248779296875, 0.561798095703125, 0.5799713134765625, 0.59814453125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 7.0, 12.0, 12.0, 44.0, 65.0, 121.0, 269.0, 504.0, 4177173.0, 15201.0, 418.0, 209.0, 108.0, 69.0, 30.0, 11.0, 13.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9140625, -12.3953857421875, -11.876708984375, -11.3580322265625, -10.83935546875, -10.3206787109375, -9.802001953125, -9.2833251953125, -8.7646484375, -8.2459716796875, -7.727294921875, -7.2086181640625, -6.68994140625, -6.1712646484375, -5.652587890625, -5.1339111328125, -4.615234375, -4.0965576171875, -3.577880859375, -3.0592041015625, -2.54052734375, -2.0218505859375, -1.503173828125, -0.9844970703125, -0.4658203125, 0.0528564453125, 0.571533203125, 1.0902099609375, 1.60888671875, 2.1275634765625, 2.646240234375, 3.1649169921875, 3.68359375, 4.2022705078125, 4.720947265625, 5.2396240234375, 5.75830078125, 6.2769775390625, 6.795654296875, 7.3143310546875, 7.8330078125, 8.3516845703125, 8.870361328125, 9.3890380859375, 9.90771484375, 10.4263916015625, 10.945068359375, 11.4637451171875, 11.982421875, 12.5010986328125, 13.019775390625, 13.5384521484375, 14.05712890625, 14.5758056640625, 15.094482421875, 15.6131591796875, 16.1318359375, 16.6505126953125, 17.169189453125, 17.6878662109375, 18.20654296875, 18.7252197265625, 19.243896484375, 19.7625732421875, 20.28125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 8.0, 15.0, 15.0, 32.0, 37.0, 73.0, 110.0, 169.0, 412.0, 836.0, 956.0, 643.0, 314.0, 156.0, 104.0, 63.0, 40.0, 24.0, 20.0, 8.0, 8.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2340087890625, -0.2247753143310547, -0.21554183959960938, -0.20630836486816406, -0.19707489013671875, -0.18784141540527344, -0.17860794067382812, -0.1693744659423828, -0.1601409912109375, -0.1509075164794922, -0.14167404174804688, -0.13244056701660156, -0.12320709228515625, -0.11397361755371094, -0.10474014282226562, -0.09550666809082031, -0.086273193359375, -0.07703971862792969, -0.06780624389648438, -0.05857276916503906, -0.04933929443359375, -0.04010581970214844, -0.030872344970703125, -0.021638870239257812, -0.0124053955078125, -0.0031719207763671875, 0.006061553955078125, 0.015295028686523438, 0.02452850341796875, 0.03376197814941406, 0.042995452880859375, 0.05222892761230469, 0.06146240234375, 0.07069587707519531, 0.07992935180664062, 0.08916282653808594, 0.09839630126953125, 0.10762977600097656, 0.11686325073242188, 0.1260967254638672, 0.1353302001953125, 0.1445636749267578, 0.15379714965820312, 0.16303062438964844, 0.17226409912109375, 0.18149757385253906, 0.19073104858398438, 0.1999645233154297, 0.209197998046875, 0.2184314727783203, 0.22766494750976562, 0.23689842224121094, 0.24613189697265625, 0.25536537170410156, 0.2645988464355469, 0.2738323211669922, 0.2830657958984375, 0.2922992706298828, 0.3015327453613281, 0.31076622009277344, 0.31999969482421875, 0.32923316955566406, 0.3384666442871094, 0.3477001190185547, 0.35693359375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 7.0, 16.0, 20.0, 40.0, 35.0, 53.0, 81.0, 96.0, 114.0, 136.0, 99.0, 100.0, 63.0, 45.0, 41.0, 12.0, 18.0, 8.0, 3.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8708227276802063, -0.8479793071746826, -0.8251358270645142, -0.8022924065589905, -0.7794489860534668, -0.7566055655479431, -0.7337621450424194, -0.710918664932251, -0.6880752444267273, -0.6652318239212036, -0.6423883438110352, -0.6195449233055115, -0.5967015027999878, -0.5738580822944641, -0.5510146617889404, -0.528171181678772, -0.5053277611732483, -0.4824843406677246, -0.45964089035987854, -0.43679744005203247, -0.4139540195465088, -0.3911105990409851, -0.36826714873313904, -0.34542369842529297, -0.3225802779197693, -0.2997368574142456, -0.27689340710639954, -0.25404995679855347, -0.23120653629302979, -0.2083631008863449, -0.18551966547966003, -0.16267623007297516, -0.1398327350616455, -0.11698929965496063, -0.09414586424827576, -0.07130242884159088, -0.048458993434906006, -0.02561555802822113, -0.002772122621536255, 0.02007131278514862, 0.042914748191833496, 0.06575818359851837, 0.08860161900520325, 0.11144505441188812, 0.134288489818573, 0.15713192522525787, 0.17997536063194275, 0.20281879603862762, 0.2256622314453125, 0.24850566685199738, 0.27134910225868225, 0.2941925525665283, 0.317035973072052, 0.3398793935775757, 0.36272284388542175, 0.3855662941932678, 0.4084097146987915, 0.4312531352043152, 0.45409658551216125, 0.4769400358200073, 0.499783456325531, 0.5226268768310547, 0.5454703569412231, 0.5683137774467468, 0.5911571979522705]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 2.0, 7.0, 9.0, 4.0, 5.0, 10.0, 10.0, 17.0, 30.0, 27.0, 35.0, 39.0, 45.0, 53.0, 40.0, 53.0, 48.0, 43.0, 49.0, 40.0, 53.0, 51.0, 47.0, 44.0, 42.0, 36.0, 30.0, 29.0, 15.0, 24.0, 25.0, 11.0, 8.0, 7.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5734447240829468, -0.5570437908172607, -0.5406428575515747, -0.5242419242858887, -0.5078409910202026, -0.4914400279521942, -0.4750390648841858, -0.45863813161849976, -0.4422371983528137, -0.4258362650871277, -0.40943533182144165, -0.3930343687534332, -0.3766334354877472, -0.36023250222206116, -0.34383153915405273, -0.3274306058883667, -0.31102967262268066, -0.29462873935699463, -0.2782278060913086, -0.26182684302330017, -0.24542590975761414, -0.2290249764919281, -0.21262402832508087, -0.19622308015823364, -0.1798221468925476, -0.16342121362686157, -0.14702026546001434, -0.13061931729316711, -0.11421838402748108, -0.09781744331121445, -0.08141650259494781, -0.06501556187868118, -0.048614680767059326, -0.032213740050792694, -0.015812799334526062, 0.0005881413817405701, 0.016989082098007202, 0.033390022814273834, 0.049790963530540466, 0.0661919042468071, 0.08259284496307373, 0.09899378567934036, 0.115394726395607, 0.13179567456245422, 0.14819660782814026, 0.1645975410938263, 0.18099848926067352, 0.19739943742752075, 0.2138003706932068, 0.23020130395889282, 0.24660225212574005, 0.2630032002925873, 0.2794041335582733, 0.29580506682395935, 0.3122060298919678, 0.3286069631576538, 0.34500789642333984, 0.3614088296890259, 0.3778097629547119, 0.39421072602272034, 0.41061165928840637, 0.4270125925540924, 0.44341355562210083, 0.45981448888778687, 0.4762154221534729]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 15.0, 16.0, 23.0, 28.0, 54.0, 80.0, 92.0, 163.0, 220.0, 315.0, 501.0, 705.0, 1191.0, 2046.0, 3782.0, 8204.0, 21737.0, 79991.0, 387439.0, 413639.0, 86532.0, 23635.0, 8641.0, 3904.0, 2079.0, 1243.0, 755.0, 513.0, 304.0, 218.0, 142.0, 95.0, 53.0, 61.0, 35.0, 23.0, 18.0, 12.0, 10.0, 12.0, 4.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.14404296875, -0.13954544067382812, -0.13504791259765625, -0.13055038452148438, -0.1260528564453125, -0.12155532836914062, -0.11705780029296875, -0.11256027221679688, -0.108062744140625, -0.10356521606445312, -0.09906768798828125, -0.09457015991210938, -0.0900726318359375, -0.08557510375976562, -0.08107757568359375, -0.07658004760742188, -0.07208251953125, -0.06758499145507812, -0.06308746337890625, -0.058589935302734375, -0.0540924072265625, -0.049594879150390625, -0.04509735107421875, -0.040599822998046875, -0.036102294921875, -0.031604766845703125, -0.02710723876953125, -0.022609710693359375, -0.0181121826171875, -0.013614654541015625, -0.00911712646484375, -0.004619598388671875, -0.0001220703125, 0.004375457763671875, 0.00887298583984375, 0.013370513916015625, 0.0178680419921875, 0.022365570068359375, 0.02686309814453125, 0.031360626220703125, 0.035858154296875, 0.040355682373046875, 0.04485321044921875, 0.049350738525390625, 0.0538482666015625, 0.058345794677734375, 0.06284332275390625, 0.06734085083007812, 0.07183837890625, 0.07633590698242188, 0.08083343505859375, 0.08533096313476562, 0.0898284912109375, 0.09432601928710938, 0.09882354736328125, 0.10332107543945312, 0.107818603515625, 0.11231613159179688, 0.11681365966796875, 0.12131118774414062, 0.1258087158203125, 0.13030624389648438, 0.13480377197265625, 0.13930130004882812, 0.143798828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 3.0, 7.0, 3.0, 10.0, 11.0, 5.0, 22.0, 16.0, 31.0, 30.0, 40.0, 35.0, 43.0, 54.0, 46.0, 58.0, 43.0, 56.0, 46.0, 58.0, 55.0, 49.0, 40.0, 35.0, 34.0, 31.0, 27.0, 28.0, 18.0, 14.0, 11.0, 18.0, 6.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32763671875, -0.3175773620605469, -0.30751800537109375, -0.2974586486816406, -0.2873992919921875, -0.2773399353027344, -0.26728057861328125, -0.2572212219238281, -0.247161865234375, -0.23710250854492188, -0.22704315185546875, -0.21698379516601562, -0.2069244384765625, -0.19686508178710938, -0.18680572509765625, -0.17674636840820312, -0.16668701171875, -0.15662765502929688, -0.14656829833984375, -0.13650894165039062, -0.1264495849609375, -0.11639022827148438, -0.10633087158203125, -0.09627151489257812, -0.086212158203125, -0.07615280151367188, -0.06609344482421875, -0.056034088134765625, -0.0459747314453125, -0.035915374755859375, -0.02585601806640625, -0.015796661376953125, -0.0057373046875, 0.004322052001953125, 0.01438140869140625, 0.024440765380859375, 0.0345001220703125, 0.044559478759765625, 0.05461883544921875, 0.06467819213867188, 0.074737548828125, 0.08479690551757812, 0.09485626220703125, 0.10491561889648438, 0.1149749755859375, 0.12503433227539062, 0.13509368896484375, 0.14515304565429688, 0.15521240234375, 0.16527175903320312, 0.17533111572265625, 0.18539047241210938, 0.1954498291015625, 0.20550918579101562, 0.21556854248046875, 0.22562789916992188, 0.235687255859375, 0.24574661254882812, 0.25580596923828125, 0.2658653259277344, 0.2759246826171875, 0.2859840393066406, 0.29604339599609375, 0.3061027526855469, 0.316162109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 3.0, 5.0, 10.0, 6.0, 12.0, 15.0, 29.0, 29.0, 57.0, 73.0, 118.0, 170.0, 291.0, 435.0, 723.0, 1107.0, 1663.0, 2729.0, 4504.0, 7182.0, 12257.0, 21681.0, 39300.0, 77310.0, 156550.0, 250407.0, 219382.0, 119756.0, 58629.0, 30919.0, 17196.0, 10018.0, 6032.0, 3670.0, 2292.0, 1372.0, 925.0, 570.0, 376.0, 235.0, 171.0, 116.0, 93.0, 56.0, 34.0, 14.0, 14.0, 7.0, 5.0, 2.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.050018310546875, -0.048493385314941406, -0.04696846008300781, -0.04544353485107422, -0.043918609619140625, -0.04239368438720703, -0.04086875915527344, -0.039343833923339844, -0.03781890869140625, -0.036293983459472656, -0.03476905822753906, -0.03324413299560547, -0.031719207763671875, -0.03019428253173828, -0.028669357299804688, -0.027144432067871094, -0.0256195068359375, -0.024094581604003906, -0.022569656372070312, -0.02104473114013672, -0.019519805908203125, -0.01799488067626953, -0.016469955444335938, -0.014945030212402344, -0.01342010498046875, -0.011895179748535156, -0.010370254516601562, -0.008845329284667969, -0.007320404052734375, -0.005795478820800781, -0.0042705535888671875, -0.0027456283569335938, -0.001220703125, 0.00030422210693359375, 0.0018291473388671875, 0.0033540725708007812, 0.004878997802734375, 0.006403923034667969, 0.007928848266601562, 0.009453773498535156, 0.01097869873046875, 0.012503623962402344, 0.014028549194335938, 0.015553474426269531, 0.017078399658203125, 0.01860332489013672, 0.020128250122070312, 0.021653175354003906, 0.0231781005859375, 0.024703025817871094, 0.026227951049804688, 0.02775287628173828, 0.029277801513671875, 0.03080272674560547, 0.03232765197753906, 0.033852577209472656, 0.03537750244140625, 0.036902427673339844, 0.03842735290527344, 0.03995227813720703, 0.041477203369140625, 0.04300212860107422, 0.04452705383300781, 0.046051979064941406, 0.047576904296875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 5.0, 4.0, 12.0, 16.0, 12.0, 14.0, 28.0, 30.0, 38.0, 30.0, 38.0, 44.0, 54.0, 44.0, 63.0, 59.0, 55.0, 55.0, 53.0, 55.0, 37.0, 36.0, 27.0, 49.0, 28.0, 21.0, 17.0, 22.0, 12.0, 13.0, 5.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.59033203125, -0.5729904174804688, -0.5556488037109375, -0.5383071899414062, -0.520965576171875, -0.5036239624023438, -0.4862823486328125, -0.46894073486328125, -0.45159912109375, -0.43425750732421875, -0.4169158935546875, -0.39957427978515625, -0.382232666015625, -0.36489105224609375, -0.3475494384765625, -0.33020782470703125, -0.3128662109375, -0.29552459716796875, -0.2781829833984375, -0.26084136962890625, -0.243499755859375, -0.22615814208984375, -0.2088165283203125, -0.19147491455078125, -0.17413330078125, -0.15679168701171875, -0.1394500732421875, -0.12210845947265625, -0.104766845703125, -0.08742523193359375, -0.0700836181640625, -0.05274200439453125, -0.035400390625, -0.01805877685546875, -0.0007171630859375, 0.01662445068359375, 0.033966064453125, 0.05130767822265625, 0.0686492919921875, 0.08599090576171875, 0.10333251953125, 0.12067413330078125, 0.1380157470703125, 0.15535736083984375, 0.172698974609375, 0.19004058837890625, 0.2073822021484375, 0.22472381591796875, 0.2420654296875, 0.25940704345703125, 0.2767486572265625, 0.29409027099609375, 0.311431884765625, 0.32877349853515625, 0.3461151123046875, 0.36345672607421875, 0.38079833984375, 0.39813995361328125, 0.4154815673828125, 0.43282318115234375, 0.450164794921875, 0.46750640869140625, 0.4848480224609375, 0.5021896362304688, 0.51953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 14.0, 5.0, 17.0, 18.0, 29.0, 34.0, 60.0, 78.0, 127.0, 220.0, 296.0, 485.0, 811.0, 1467.0, 2837.0, 5765.0, 12314.0, 28837.0, 67548.0, 151404.0, 264742.0, 256617.0, 141663.0, 62967.0, 26761.0, 11698.0, 5387.0, 2777.0, 1426.0, 778.0, 464.0, 307.0, 162.0, 114.0, 83.0, 55.0, 46.0, 37.0, 24.0, 26.0, 17.0, 10.0, 9.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.004669189453125, -0.0045275092124938965, -0.004385828971862793, -0.0042441487312316895, -0.004102468490600586, -0.003960788249969482, -0.003819108009338379, -0.0036774277687072754, -0.003535747528076172, -0.0033940672874450684, -0.003252387046813965, -0.0031107068061828613, -0.002969026565551758, -0.0028273463249206543, -0.0026856660842895508, -0.0025439858436584473, -0.0024023056030273438, -0.0022606253623962402, -0.0021189451217651367, -0.001977264881134033, -0.0018355846405029297, -0.0016939043998718262, -0.0015522241592407227, -0.0014105439186096191, -0.0012688636779785156, -0.0011271834373474121, -0.0009855031967163086, -0.0008438229560852051, -0.0007021427154541016, -0.000560462474822998, -0.00041878223419189453, -0.000277101993560791, -0.0001354217529296875, 6.258487701416016e-06, 0.00014793872833251953, 0.00028961896896362305, 0.00043129920959472656, 0.0005729794502258301, 0.0007146596908569336, 0.0008563399314880371, 0.0009980201721191406, 0.0011397004127502441, 0.0012813806533813477, 0.0014230608940124512, 0.0015647411346435547, 0.0017064213752746582, 0.0018481016159057617, 0.0019897818565368652, 0.0021314620971679688, 0.0022731423377990723, 0.0024148225784301758, 0.0025565028190612793, 0.002698183059692383, 0.0028398633003234863, 0.00298154354095459, 0.0031232237815856934, 0.003264904022216797, 0.0034065842628479004, 0.003548264503479004, 0.0036899447441101074, 0.003831624984741211, 0.0039733052253723145, 0.004114985466003418, 0.0042566657066345215, 0.004398345947265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 8.0, 17.0, 24.0, 23.0, 29.0, 34.0, 57.0, 67.0, 82.0, 106.0, 107.0, 91.0, 103.0, 71.0, 59.0, 45.0, 22.0, 22.0, 12.0, 3.0, 8.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.71661376953125e-05, -1.6694888472557068e-05, -1.6223639249801636e-05, -1.5752390027046204e-05, -1.528114080429077e-05, -1.480989158153534e-05, -1.4338642358779907e-05, -1.3867393136024475e-05, -1.3396143913269043e-05, -1.292489469051361e-05, -1.2453645467758179e-05, -1.1982396245002747e-05, -1.1511147022247314e-05, -1.1039897799491882e-05, -1.056864857673645e-05, -1.0097399353981018e-05, -9.626150131225586e-06, -9.154900908470154e-06, -8.683651685714722e-06, -8.21240246295929e-06, -7.741153240203857e-06, -7.269904017448425e-06, -6.798654794692993e-06, -6.327405571937561e-06, -5.856156349182129e-06, -5.384907126426697e-06, -4.913657903671265e-06, -4.4424086809158325e-06, -3.9711594581604e-06, -3.4999102354049683e-06, -3.028661012649536e-06, -2.557411789894104e-06, -2.086162567138672e-06, -1.6149133443832397e-06, -1.1436641216278076e-06, -6.724148988723755e-07, -2.0116567611694336e-07, 2.7008354663848877e-07, 7.413327693939209e-07, 1.212581992149353e-06, 1.6838312149047852e-06, 2.1550804376602173e-06, 2.6263296604156494e-06, 3.0975788831710815e-06, 3.5688281059265137e-06, 4.040077328681946e-06, 4.511326551437378e-06, 4.98257577419281e-06, 5.453824996948242e-06, 5.925074219703674e-06, 6.3963234424591064e-06, 6.8675726652145386e-06, 7.338821887969971e-06, 7.810071110725403e-06, 8.281320333480835e-06, 8.752569556236267e-06, 9.2238187789917e-06, 9.695068001747131e-06, 1.0166317224502563e-05, 1.0637566447257996e-05, 1.1108815670013428e-05, 1.158006489276886e-05, 1.2051314115524292e-05, 1.2522563338279724e-05, 1.2993812561035156e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 8.0, 13.0, 10.0, 5.0, 17.0, 20.0, 40.0, 38.0, 61.0, 57.0, 76.0, 89.0, 148.0, 393.0, 3661.0, 153836.0, 860122.0, 27949.0, 1240.0, 232.0, 119.0, 91.0, 64.0, 53.0, 32.0, 40.0, 34.0, 26.0, 17.0, 17.0, 12.0, 7.0, 6.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016143798828125, -0.015592813491821289, -0.015041828155517578, -0.014490842819213867, -0.013939857482910156, -0.013388872146606445, -0.012837886810302734, -0.012286901473999023, -0.011735916137695312, -0.011184930801391602, -0.01063394546508789, -0.01008296012878418, -0.009531974792480469, -0.008980989456176758, -0.008430004119873047, -0.007879018783569336, -0.007328033447265625, -0.006777048110961914, -0.006226062774658203, -0.005675077438354492, -0.005124092102050781, -0.00457310676574707, -0.004022121429443359, -0.0034711360931396484, -0.0029201507568359375, -0.0023691654205322266, -0.0018181800842285156, -0.0012671947479248047, -0.0007162094116210938, -0.0001652240753173828, 0.0003857612609863281, 0.0009367465972900391, 0.00148773193359375, 0.002038717269897461, 0.002589702606201172, 0.003140687942504883, 0.0036916732788085938, 0.004242658615112305, 0.004793643951416016, 0.0053446292877197266, 0.0058956146240234375, 0.0064465999603271484, 0.006997585296630859, 0.00754857063293457, 0.008099555969238281, 0.008650541305541992, 0.009201526641845703, 0.009752511978149414, 0.010303497314453125, 0.010854482650756836, 0.011405467987060547, 0.011956453323364258, 0.012507438659667969, 0.01305842399597168, 0.01360940933227539, 0.014160394668579102, 0.014711380004882812, 0.015262365341186523, 0.015813350677490234, 0.016364336013793945, 0.016915321350097656, 0.017466306686401367, 0.018017292022705078, 0.01856827735900879, 0.0191192626953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 8.0, 6.0, 4.0, 13.0, 14.0, 12.0, 18.0, 22.0, 27.0, 28.0, 28.0, 33.0, 45.0, 55.0, 36.0, 51.0, 56.0, 47.0, 80.0, 71.0, 49.0, 52.0, 50.0, 40.0, 30.0, 13.0, 20.0, 19.0, 10.0, 19.0, 10.0, 10.0, 3.0, 7.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012884140014648438, -0.0012472718954086304, -0.001206129789352417, -0.0011649876832962036, -0.0011238455772399902, -0.0010827034711837769, -0.0010415613651275635, -0.00100041925907135, -0.0009592771530151367, -0.0009181350469589233, -0.00087699294090271, -0.0008358508348464966, -0.0007947087287902832, -0.0007535666227340698, -0.0007124245166778564, -0.0006712824106216431, -0.0006301403045654297, -0.0005889981985092163, -0.0005478560924530029, -0.0005067139863967896, -0.00046557188034057617, -0.0004244297742843628, -0.0003832876682281494, -0.00034214556217193604, -0.00030100345611572266, -0.0002598613500595093, -0.0002187192440032959, -0.00017757713794708252, -0.00013643503189086914, -9.529292583465576e-05, -5.415081977844238e-05, -1.3008713722229004e-05, 2.8133392333984375e-05, 6.927549839019775e-05, 0.00011041760444641113, 0.0001515597105026245, 0.0001927018165588379, 0.00023384392261505127, 0.00027498602867126465, 0.00031612813472747803, 0.0003572702407836914, 0.0003984123468399048, 0.00043955445289611816, 0.00048069655895233154, 0.0005218386650085449, 0.0005629807710647583, 0.0006041228771209717, 0.0006452649831771851, 0.0006864070892333984, 0.0007275491952896118, 0.0007686913013458252, 0.0008098334074020386, 0.000850975513458252, 0.0008921176195144653, 0.0009332597255706787, 0.0009744018316268921, 0.0010155439376831055, 0.0010566860437393188, 0.0010978281497955322, 0.0011389702558517456, 0.001180112361907959, 0.0012212544679641724, 0.0012623965740203857, 0.0013035386800765991, 0.0013446807861328125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 20.0, 28.0, 38.0, 44.0, 71.0, 90.0, 100.0, 129.0, 115.0, 117.0, 84.0, 42.0, 41.0, 20.0, 19.0, 10.0, 5.0, 4.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4676409959793091, -0.4544897675514221, -0.44133850932121277, -0.4281872808933258, -0.41503605246543884, -0.4018847942352295, -0.38873356580734253, -0.37558233737945557, -0.3624311089515686, -0.34927988052368164, -0.3361286222934723, -0.3229773938655853, -0.30982616543769836, -0.296674907207489, -0.28352367877960205, -0.2703724503517151, -0.25722119212150574, -0.24406994879245758, -0.23091872036457062, -0.21776747703552246, -0.2046162486076355, -0.19146500527858734, -0.17831376194953918, -0.16516253352165222, -0.15201129019260406, -0.1388600468635559, -0.12570881843566895, -0.11255757510662079, -0.09940633922815323, -0.08625510334968567, -0.07310386002063751, -0.05995262414216995, -0.046801358461380005, -0.033650122582912445, -0.020498882979154587, -0.0073476433753967285, 0.005803592503070831, 0.01895482838153839, 0.03210607171058655, 0.04525730758905411, 0.05840854346752167, 0.07155977934598923, 0.08471101522445679, 0.09786225855350494, 0.1110134944319725, 0.12416473031044006, 0.13731597363948822, 0.15046721696853638, 0.16361844539642334, 0.1767696887254715, 0.18992091715335846, 0.20307216048240662, 0.21622338891029358, 0.22937463223934174, 0.2425258755683899, 0.25567710399627686, 0.2688283324241638, 0.2819795608520508, 0.29513081908226013, 0.3082820475101471, 0.32143327593803406, 0.3345845341682434, 0.34773576259613037, 0.36088699102401733, 0.3740382492542267]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 5.0, 5.0, 6.0, 11.0, 11.0, 16.0, 20.0, 27.0, 32.0, 40.0, 49.0, 49.0, 44.0, 47.0, 58.0, 40.0, 54.0, 41.0, 53.0, 54.0, 47.0, 40.0, 51.0, 30.0, 30.0, 24.0, 23.0, 26.0, 18.0, 14.0, 6.0, 5.0, 6.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3533909320831299, -0.3437140882015228, -0.33403724431991577, -0.3243604302406311, -0.31468358635902405, -0.305006742477417, -0.2953299283981323, -0.28565308451652527, -0.2759762406349182, -0.26629939675331116, -0.2566225528717041, -0.24694573879241943, -0.23726889491081238, -0.22759205102920532, -0.21791522204875946, -0.2082383930683136, -0.19856154918670654, -0.1888847053050995, -0.17920787632465363, -0.16953104734420776, -0.1598542034626007, -0.15017735958099365, -0.1405005306005478, -0.13082370162010193, -0.12114685773849487, -0.11147002130746841, -0.10179318487644196, -0.0921163484454155, -0.08243951201438904, -0.07276267558336258, -0.06308583915233612, -0.05340900272130966, -0.043732136487960815, -0.03405530005693436, -0.024378463625907898, -0.01470162719488144, -0.0050247907638549805, 0.004652045667171478, 0.014328882098197937, 0.024005718529224396, 0.033682554960250854, 0.04335939139127731, 0.05303622782230377, 0.06271306425333023, 0.07238990068435669, 0.08206673711538315, 0.0917435735464096, 0.10142040997743607, 0.11109724640846252, 0.12077408283948898, 0.13045091927051544, 0.1401277482509613, 0.14980459213256836, 0.15948143601417542, 0.16915826499462128, 0.17883509397506714, 0.1885119378566742, 0.19818878173828125, 0.2078656107187271, 0.21754243969917297, 0.22721928358078003, 0.23689612746238708, 0.24657295644283295, 0.2562497854232788, 0.26592662930488586]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 7.0, 3.0, 3.0, 4.0, 3.0, 12.0, 16.0, 28.0, 24.0, 41.0, 70.0, 77.0, 122.0, 143.0, 253.0, 345.0, 484.0, 775.0, 1314.0, 2286.0, 4083.0, 8759.0, 21683.0, 64106.0, 229853.0, 455299.0, 174638.0, 50201.0, 17371.0, 7358.0, 3770.0, 1981.0, 1162.0, 700.0, 491.0, 341.0, 213.0, 160.0, 111.0, 76.0, 53.0, 39.0, 32.0, 24.0, 9.0, 11.0, 9.0, 8.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0853271484375, -0.0823221206665039, -0.07931709289550781, -0.07631206512451172, -0.07330703735351562, -0.07030200958251953, -0.06729698181152344, -0.06429195404052734, -0.06128692626953125, -0.058281898498535156, -0.05527687072753906, -0.05227184295654297, -0.049266815185546875, -0.04626178741455078, -0.04325675964355469, -0.040251731872558594, -0.0372467041015625, -0.034241676330566406, -0.031236648559570312, -0.02823162078857422, -0.025226593017578125, -0.02222156524658203, -0.019216537475585938, -0.016211509704589844, -0.01320648193359375, -0.010201454162597656, -0.0071964263916015625, -0.004191398620605469, -0.001186370849609375, 0.0018186569213867188, 0.0048236846923828125, 0.007828712463378906, 0.010833740234375, 0.013838768005371094, 0.016843795776367188, 0.01984882354736328, 0.022853851318359375, 0.02585887908935547, 0.028863906860351562, 0.031868934631347656, 0.03487396240234375, 0.037878990173339844, 0.04088401794433594, 0.04388904571533203, 0.046894073486328125, 0.04989910125732422, 0.05290412902832031, 0.055909156799316406, 0.0589141845703125, 0.061919212341308594, 0.06492424011230469, 0.06792926788330078, 0.07093429565429688, 0.07393932342529297, 0.07694435119628906, 0.07994937896728516, 0.08295440673828125, 0.08595943450927734, 0.08896446228027344, 0.09196949005126953, 0.09497451782226562, 0.09797954559326172, 0.10098457336425781, 0.1039896011352539, 0.10699462890625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 2.0, 3.0, 5.0, 6.0, 10.0, 8.0, 13.0, 22.0, 21.0, 33.0, 29.0, 36.0, 35.0, 48.0, 59.0, 37.0, 44.0, 39.0, 44.0, 50.0, 55.0, 46.0, 49.0, 36.0, 31.0, 36.0, 38.0, 38.0, 27.0, 19.0, 17.0, 12.0, 9.0, 15.0, 12.0, 3.0, 3.0, 7.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.1884765625, -1.1571884155273438, -1.1259002685546875, -1.0946121215820312, -1.063323974609375, -1.0320358276367188, -1.0007476806640625, -0.9694595336914062, -0.93817138671875, -0.9068832397460938, -0.8755950927734375, -0.8443069458007812, -0.813018798828125, -0.7817306518554688, -0.7504425048828125, -0.7191543579101562, -0.6878662109375, -0.6565780639648438, -0.6252899169921875, -0.5940017700195312, -0.562713623046875, -0.5314254760742188, -0.5001373291015625, -0.46884918212890625, -0.43756103515625, -0.40627288818359375, -0.3749847412109375, -0.34369659423828125, -0.312408447265625, -0.28112030029296875, -0.2498321533203125, -0.21854400634765625, -0.187255859375, -0.15596771240234375, -0.1246795654296875, -0.09339141845703125, -0.062103271484375, -0.03081512451171875, 0.0004730224609375, 0.03176116943359375, 0.06304931640625, 0.09433746337890625, 0.1256256103515625, 0.15691375732421875, 0.188201904296875, 0.21949005126953125, 0.2507781982421875, 0.28206634521484375, 0.3133544921875, 0.34464263916015625, 0.3759307861328125, 0.40721893310546875, 0.438507080078125, 0.46979522705078125, 0.5010833740234375, 0.5323715209960938, 0.56365966796875, 0.5949478149414062, 0.6262359619140625, 0.6575241088867188, 0.688812255859375, 0.7201004028320312, 0.7513885498046875, 0.7826766967773438, 0.81396484375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 4.0, 7.0, 10.0, 13.0, 12.0, 13.0, 14.0, 24.0, 18.0, 17.0, 20.0, 27.0, 25.0, 23.0, 28.0, 36.0, 37.0, 45.0, 42.0, 83.0, 73038.0, 974448.0, 142.0, 38.0, 39.0, 35.0, 35.0, 31.0, 37.0, 33.0, 28.0, 22.0, 25.0, 12.0, 19.0, 9.0, 7.0, 8.0, 10.0, 8.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3046875, -3.18682861328125, -3.0689697265625, -2.95111083984375, -2.833251953125, -2.71539306640625, -2.5975341796875, -2.47967529296875, -2.36181640625, -2.24395751953125, -2.1260986328125, -2.00823974609375, -1.890380859375, -1.77252197265625, -1.6546630859375, -1.53680419921875, -1.4189453125, -1.30108642578125, -1.1832275390625, -1.06536865234375, -0.947509765625, -0.82965087890625, -0.7117919921875, -0.59393310546875, -0.47607421875, -0.35821533203125, -0.2403564453125, -0.12249755859375, -0.004638671875, 0.11322021484375, 0.2310791015625, 0.34893798828125, 0.466796875, 0.58465576171875, 0.7025146484375, 0.82037353515625, 0.938232421875, 1.05609130859375, 1.1739501953125, 1.29180908203125, 1.40966796875, 1.52752685546875, 1.6453857421875, 1.76324462890625, 1.881103515625, 1.99896240234375, 2.1168212890625, 2.23468017578125, 2.3525390625, 2.47039794921875, 2.5882568359375, 2.70611572265625, 2.823974609375, 2.94183349609375, 3.0596923828125, 3.17755126953125, 3.29541015625, 3.41326904296875, 3.5311279296875, 3.64898681640625, 3.766845703125, 3.88470458984375, 4.0025634765625, 4.12042236328125, 4.23828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 5.0, 8.0, 14.0, 14.0, 12.0, 12.0, 22.0, 24.0, 15.0, 16.0, 25.0, 28.0, 21.0, 30.0, 33.0, 42.0, 42.0, 38.0, 33.0, 43.0, 43.0, 41.0, 42.0, 34.0, 38.0, 40.0, 25.0, 33.0, 34.0, 32.0, 27.0, 21.0, 14.0, 20.0, 8.0, 8.0, 6.0, 11.0, 7.0, 9.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.71435546875, -0.6890106201171875, -0.663665771484375, -0.6383209228515625, -0.61297607421875, -0.5876312255859375, -0.562286376953125, -0.5369415283203125, -0.5115966796875, -0.4862518310546875, -0.460906982421875, -0.4355621337890625, -0.41021728515625, -0.3848724365234375, -0.359527587890625, -0.3341827392578125, -0.308837890625, -0.2834930419921875, -0.258148193359375, -0.2328033447265625, -0.20745849609375, -0.1821136474609375, -0.156768798828125, -0.1314239501953125, -0.1060791015625, -0.0807342529296875, -0.055389404296875, -0.0300445556640625, -0.00469970703125, 0.0206451416015625, 0.045989990234375, 0.0713348388671875, 0.0966796875, 0.1220245361328125, 0.147369384765625, 0.1727142333984375, 0.19805908203125, 0.2234039306640625, 0.248748779296875, 0.2740936279296875, 0.2994384765625, 0.3247833251953125, 0.350128173828125, 0.3754730224609375, 0.40081787109375, 0.4261627197265625, 0.451507568359375, 0.4768524169921875, 0.502197265625, 0.5275421142578125, 0.552886962890625, 0.5782318115234375, 0.60357666015625, 0.6289215087890625, 0.654266357421875, 0.6796112060546875, 0.7049560546875, 0.7303009033203125, 0.755645751953125, 0.7809906005859375, 0.80633544921875, 0.8316802978515625, 0.857025146484375, 0.8823699951171875, 0.90771484375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 6.0, 2.0, 4.0, 4.0, 5.0, 11.0, 13.0, 19.0, 34.0, 45.0, 94.0, 229.0, 900.0, 8257.0, 940399.0, 94615.0, 3065.0, 512.0, 159.0, 64.0, 33.0, 24.0, 15.0, 9.0, 9.0, 11.0, 4.0, 4.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1734619140625, -0.16847801208496094, -0.16349411010742188, -0.1585102081298828, -0.15352630615234375, -0.1485424041748047, -0.14355850219726562, -0.13857460021972656, -0.1335906982421875, -0.12860679626464844, -0.12362289428710938, -0.11863899230957031, -0.11365509033203125, -0.10867118835449219, -0.10368728637695312, -0.09870338439941406, -0.093719482421875, -0.08873558044433594, -0.08375167846679688, -0.07876777648925781, -0.07378387451171875, -0.06879997253417969, -0.06381607055664062, -0.05883216857910156, -0.0538482666015625, -0.04886436462402344, -0.043880462646484375, -0.03889656066894531, -0.03391265869140625, -0.028928756713867188, -0.023944854736328125, -0.018960952758789062, -0.01397705078125, -0.008993148803710938, -0.004009246826171875, 0.0009746551513671875, 0.00595855712890625, 0.010942459106445312, 0.015926361083984375, 0.020910263061523438, 0.0258941650390625, 0.030878067016601562, 0.035861968994140625, 0.04084587097167969, 0.04582977294921875, 0.05081367492675781, 0.055797576904296875, 0.06078147888183594, 0.065765380859375, 0.07074928283691406, 0.07573318481445312, 0.08071708679199219, 0.08570098876953125, 0.09068489074707031, 0.09566879272460938, 0.10065269470214844, 0.1056365966796875, 0.11062049865722656, 0.11560440063476562, 0.12058830261230469, 0.12557220458984375, 0.1305561065673828, 0.13554000854492188, 0.14052391052246094, 0.1455078125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 6.0, 6.0, 9.0, 37.0, 48.0, 111.0, 280.0, 280.0, 105.0, 48.0, 16.0, 20.0, 18.0, 10.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1324882507324219e-05, -1.0960735380649567e-05, -1.0596588253974915e-05, -1.0232441127300262e-05, -9.86829400062561e-06, -9.504146873950958e-06, -9.139999747276306e-06, -8.775852620601654e-06, -8.411705493927002e-06, -8.04755836725235e-06, -7.683411240577698e-06, -7.319264113903046e-06, -6.9551169872283936e-06, -6.5909698605537415e-06, -6.226822733879089e-06, -5.862675607204437e-06, -5.498528480529785e-06, -5.134381353855133e-06, -4.770234227180481e-06, -4.406087100505829e-06, -4.041939973831177e-06, -3.6777928471565247e-06, -3.3136457204818726e-06, -2.9494985938072205e-06, -2.5853514671325684e-06, -2.2212043404579163e-06, -1.8570572137832642e-06, -1.492910087108612e-06, -1.12876296043396e-06, -7.646158337593079e-07, -4.0046870708465576e-07, -3.632158041000366e-08, 3.2782554626464844e-07, 6.919726729393005e-07, 1.0561197996139526e-06, 1.4202669262886047e-06, 1.7844140529632568e-06, 2.148561179637909e-06, 2.512708306312561e-06, 2.876855432987213e-06, 3.2410025596618652e-06, 3.6051496863365173e-06, 3.9692968130111694e-06, 4.3334439396858215e-06, 4.697591066360474e-06, 5.061738193035126e-06, 5.425885319709778e-06, 5.79003244638443e-06, 6.154179573059082e-06, 6.518326699733734e-06, 6.882473826408386e-06, 7.246620953083038e-06, 7.6107680797576904e-06, 7.974915206432343e-06, 8.339062333106995e-06, 8.703209459781647e-06, 9.067356586456299e-06, 9.431503713130951e-06, 9.795650839805603e-06, 1.0159797966480255e-05, 1.0523945093154907e-05, 1.088809221982956e-05, 1.1252239346504211e-05, 1.1616386473178864e-05, 1.1980533599853516e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 6.0, 12.0, 10.0, 28.0, 39.0, 85.0, 197.0, 607.0, 2291.0, 17085.0, 935156.0, 86050.0, 5233.0, 1113.0, 340.0, 133.0, 70.0, 33.0, 28.0, 9.0, 6.0, 5.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1187744140625, -0.11433219909667969, -0.10988998413085938, -0.10544776916503906, -0.10100555419921875, -0.09656333923339844, -0.09212112426757812, -0.08767890930175781, -0.0832366943359375, -0.07879447937011719, -0.07435226440429688, -0.06991004943847656, -0.06546783447265625, -0.06102561950683594, -0.056583404541015625, -0.05214118957519531, -0.047698974609375, -0.04325675964355469, -0.038814544677734375, -0.03437232971191406, -0.02993011474609375, -0.025487899780273438, -0.021045684814453125, -0.016603469848632812, -0.0121612548828125, -0.0077190399169921875, -0.003276824951171875, 0.0011653900146484375, 0.00560760498046875, 0.010049819946289062, 0.014492034912109375, 0.018934249877929688, 0.02337646484375, 0.027818679809570312, 0.032260894775390625, 0.03670310974121094, 0.04114532470703125, 0.04558753967285156, 0.050029754638671875, 0.05447196960449219, 0.0589141845703125, 0.06335639953613281, 0.06779861450195312, 0.07224082946777344, 0.07668304443359375, 0.08112525939941406, 0.08556747436523438, 0.09000968933105469, 0.094451904296875, 0.09889411926269531, 0.10333633422851562, 0.10777854919433594, 0.11222076416015625, 0.11666297912597656, 0.12110519409179688, 0.1255474090576172, 0.1299896240234375, 0.1344318389892578, 0.13887405395507812, 0.14331626892089844, 0.14775848388671875, 0.15220069885253906, 0.15664291381835938, 0.1610851287841797, 0.16552734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 5.0, 2.0, 6.0, 9.0, 6.0, 14.0, 24.0, 27.0, 43.0, 97.0, 296.0, 233.0, 92.0, 48.0, 41.0, 16.0, 20.0, 2.0, 8.0, 6.0, 3.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0322265625, -0.03102874755859375, -0.0298309326171875, -0.02863311767578125, -0.027435302734375, -0.02623748779296875, -0.0250396728515625, -0.02384185791015625, -0.02264404296875, -0.02144622802734375, -0.0202484130859375, -0.01905059814453125, -0.017852783203125, -0.01665496826171875, -0.0154571533203125, -0.01425933837890625, -0.0130615234375, -0.01186370849609375, -0.0106658935546875, -0.00946807861328125, -0.008270263671875, -0.00707244873046875, -0.0058746337890625, -0.00467681884765625, -0.00347900390625, -0.00228118896484375, -0.0010833740234375, 0.00011444091796875, 0.001312255859375, 0.00251007080078125, 0.0037078857421875, 0.00490570068359375, 0.006103515625, 0.00730133056640625, 0.0084991455078125, 0.00969696044921875, 0.010894775390625, 0.01209259033203125, 0.0132904052734375, 0.01448822021484375, 0.01568603515625, 0.01688385009765625, 0.0180816650390625, 0.01927947998046875, 0.020477294921875, 0.02167510986328125, 0.0228729248046875, 0.02407073974609375, 0.0252685546875, 0.02646636962890625, 0.0276641845703125, 0.02886199951171875, 0.030059814453125, 0.03125762939453125, 0.0324554443359375, 0.03365325927734375, 0.03485107421875, 0.03604888916015625, 0.0372467041015625, 0.03844451904296875, 0.039642333984375, 0.04084014892578125, 0.0420379638671875, 0.04323577880859375, 0.04443359375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 10.0, 20.0, 55.0, 79.0, 150.0, 206.0, 220.0, 132.0, 65.0, 36.0, 17.0, 10.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.3014256954193115, -2.2552154064178467, -2.209005117416382, -2.162795066833496, -2.1165847778320312, -2.0703744888305664, -2.0241641998291016, -1.9779539108276367, -1.9317437410354614, -1.8855334520339966, -1.8393232822418213, -1.7931129932403564, -1.7469027042388916, -1.7006925344467163, -1.6544822454452515, -1.6082720756530762, -1.5620617866516113, -1.5158514976501465, -1.4696413278579712, -1.4234310388565063, -1.377220869064331, -1.3310105800628662, -1.2848002910614014, -1.2385900020599365, -1.1923798322677612, -1.1461695432662964, -1.099959373474121, -1.0537490844726562, -1.0075387954711914, -0.9613286256790161, -0.9151183366775513, -0.8689081072807312, -0.8226979374885559, -0.7764877080917358, -0.730277419090271, -0.6840671896934509, -0.6378569602966309, -0.5916467308998108, -0.5454365015029907, -0.4992262125015259, -0.4530159831047058, -0.40680575370788574, -0.3605954945087433, -0.31438523530960083, -0.26817500591278076, -0.2219647616147995, -0.17575451731681824, -0.12954425811767578, -0.08333402872085571, -0.03712378442287445, 0.009086459875106812, 0.055296704173088074, 0.10150694847106934, 0.1477171927690506, 0.19392743706703186, 0.24013769626617432, 0.2863479256629944, 0.33255815505981445, 0.3787684142589569, 0.42497867345809937, 0.47118890285491943, 0.5173991322517395, 0.5636093616485596, 0.6098196506500244, 0.6560298800468445]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 2.0, 6.0, 4.0, 11.0, 8.0, 16.0, 13.0, 20.0, 23.0, 34.0, 31.0, 26.0, 32.0, 40.0, 41.0, 43.0, 37.0, 59.0, 53.0, 46.0, 49.0, 47.0, 42.0, 37.0, 47.0, 33.0, 40.0, 33.0, 24.0, 20.0, 17.0, 20.0, 5.0, 10.0, 6.0, 3.0, 6.0, 9.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5256943702697754, -1.479115605354309, -1.4325368404388428, -1.3859580755233765, -1.3393793106079102, -1.2928004264831543, -1.246221661567688, -1.1996428966522217, -1.1530641317367554, -1.106485366821289, -1.0599066019058228, -1.0133278369903564, -0.9667490124702454, -0.920170247554779, -0.873591423034668, -0.8270126581192017, -0.7804338932037354, -0.733855128288269, -0.6872763633728027, -0.6406975388526917, -0.5941187739372253, -0.547540009021759, -0.500961184501648, -0.45438241958618164, -0.40780365467071533, -0.361224889755249, -0.3146460950374603, -0.26806730031967163, -0.22148853540420532, -0.17490975558757782, -0.12833097577095032, -0.08175218105316162, -0.03517341613769531, 0.01140536367893219, 0.05798414349555969, 0.1045629233121872, 0.1511417031288147, 0.1977204829454422, 0.2442992627620697, 0.2908780574798584, 0.3374568223953247, 0.384035587310791, 0.4306143820285797, 0.4771931767463684, 0.5237719416618347, 0.570350706577301, 0.6169295310974121, 0.6635082960128784, 0.7100870609283447, 0.756665825843811, 0.8032445907592773, 0.8498234152793884, 0.8964021801948547, 0.942980945110321, 0.9895597696304321, 1.0361385345458984, 1.0827172994613647, 1.129296064376831, 1.1758748292922974, 1.2224535942077637, 1.2690324783325195, 1.3156112432479858, 1.3621900081634521, 1.4087687730789185, 1.4553475379943848]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 9.0, 3.0, 10.0, 12.0, 11.0, 20.0, 14.0, 26.0, 27.0, 54.0, 42.0, 92.0, 177.0, 421.0, 1095.0, 3776.0, 22823.0, 899605.0, 3160717.0, 94092.0, 8172.0, 1846.0, 606.0, 217.0, 124.0, 74.0, 43.0, 22.0, 26.0, 21.0, 15.0, 12.0, 10.0, 11.0, 13.0, 3.0, 7.0, 7.0, 5.0, 1.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0556640625, -1.0207366943359375, -0.985809326171875, -0.9508819580078125, -0.91595458984375, -0.8810272216796875, -0.846099853515625, -0.8111724853515625, -0.7762451171875, -0.7413177490234375, -0.706390380859375, -0.6714630126953125, -0.63653564453125, -0.6016082763671875, -0.566680908203125, -0.5317535400390625, -0.496826171875, -0.4618988037109375, -0.426971435546875, -0.3920440673828125, -0.35711669921875, -0.3221893310546875, -0.287261962890625, -0.2523345947265625, -0.2174072265625, -0.1824798583984375, -0.147552490234375, -0.1126251220703125, -0.07769775390625, -0.0427703857421875, -0.007843017578125, 0.0270843505859375, 0.06201171875, 0.0969390869140625, 0.131866455078125, 0.1667938232421875, 0.20172119140625, 0.2366485595703125, 0.271575927734375, 0.3065032958984375, 0.3414306640625, 0.3763580322265625, 0.411285400390625, 0.4462127685546875, 0.48114013671875, 0.5160675048828125, 0.550994873046875, 0.5859222412109375, 0.620849609375, 0.6557769775390625, 0.690704345703125, 0.7256317138671875, 0.76055908203125, 0.7954864501953125, 0.830413818359375, 0.8653411865234375, 0.9002685546875, 0.9351959228515625, 0.970123291015625, 1.0050506591796875, 1.03997802734375, 1.0749053955078125, 1.109832763671875, 1.1447601318359375, 1.1796875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 8.0, 3.0, 10.0, 9.0, 8.0, 12.0, 21.0, 23.0, 27.0, 39.0, 33.0, 47.0, 45.0, 50.0, 49.0, 57.0, 60.0, 64.0, 60.0, 50.0, 63.0, 48.0, 47.0, 40.0, 22.0, 22.0, 24.0, 16.0, 9.0, 5.0, 12.0, 5.0, 2.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.413818359375, -0.4015007019042969, -0.38918304443359375, -0.3768653869628906, -0.3645477294921875, -0.3522300720214844, -0.33991241455078125, -0.3275947570800781, -0.315277099609375, -0.3029594421386719, -0.29064178466796875, -0.2783241271972656, -0.2660064697265625, -0.2536888122558594, -0.24137115478515625, -0.22905349731445312, -0.21673583984375, -0.20441818237304688, -0.19210052490234375, -0.17978286743164062, -0.1674652099609375, -0.15514755249023438, -0.14282989501953125, -0.13051223754882812, -0.118194580078125, -0.10587692260742188, -0.09355926513671875, -0.08124160766601562, -0.0689239501953125, -0.056606292724609375, -0.04428863525390625, -0.031970977783203125, -0.0196533203125, -0.007335662841796875, 0.00498199462890625, 0.017299652099609375, 0.0296173095703125, 0.041934967041015625, 0.05425262451171875, 0.06657028198242188, 0.078887939453125, 0.09120559692382812, 0.10352325439453125, 0.11584091186523438, 0.1281585693359375, 0.14047622680664062, 0.15279388427734375, 0.16511154174804688, 0.17742919921875, 0.18974685668945312, 0.20206451416015625, 0.21438217163085938, 0.2266998291015625, 0.23901748657226562, 0.25133514404296875, 0.2636528015136719, 0.275970458984375, 0.2882881164550781, 0.30060577392578125, 0.3129234313964844, 0.3252410888671875, 0.3375587463378906, 0.34987640380859375, 0.3621940612792969, 0.37451171875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 3.0, 6.0, 4.0, 9.0, 12.0, 10.0, 25.0, 42.0, 70.0, 132.0, 349.0, 969.0, 10796.0, 3957913.0, 219043.0, 3673.0, 712.0, 234.0, 116.0, 69.0, 39.0, 14.0, 11.0, 7.0, 8.0, 1.0, 4.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.48046875, -1.415557861328125, -1.35064697265625, -1.285736083984375, -1.2208251953125, -1.155914306640625, -1.09100341796875, -1.026092529296875, -0.961181640625, -0.896270751953125, -0.83135986328125, -0.766448974609375, -0.7015380859375, -0.636627197265625, -0.57171630859375, -0.506805419921875, -0.44189453125, -0.376983642578125, -0.31207275390625, -0.247161865234375, -0.1822509765625, -0.117340087890625, -0.05242919921875, 0.012481689453125, 0.077392578125, 0.142303466796875, 0.20721435546875, 0.272125244140625, 0.3370361328125, 0.401947021484375, 0.46685791015625, 0.531768798828125, 0.5966796875, 0.661590576171875, 0.72650146484375, 0.791412353515625, 0.8563232421875, 0.921234130859375, 0.98614501953125, 1.051055908203125, 1.115966796875, 1.180877685546875, 1.24578857421875, 1.310699462890625, 1.3756103515625, 1.440521240234375, 1.50543212890625, 1.570343017578125, 1.63525390625, 1.700164794921875, 1.76507568359375, 1.829986572265625, 1.8948974609375, 1.959808349609375, 2.02471923828125, 2.089630126953125, 2.154541015625, 2.219451904296875, 2.28436279296875, 2.349273681640625, 2.4141845703125, 2.479095458984375, 2.54400634765625, 2.608917236328125, 2.673828125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 7.0, 1.0, 13.0, 23.0, 27.0, 41.0, 49.0, 102.0, 240.0, 568.0, 1152.0, 917.0, 457.0, 205.0, 105.0, 53.0, 41.0, 27.0, 13.0, 11.0, 11.0, 6.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35693359375, -0.34798431396484375, -0.3390350341796875, -0.33008575439453125, -0.321136474609375, -0.31218719482421875, -0.3032379150390625, -0.29428863525390625, -0.28533935546875, -0.27639007568359375, -0.2674407958984375, -0.25849151611328125, -0.249542236328125, -0.24059295654296875, -0.2316436767578125, -0.22269439697265625, -0.2137451171875, -0.20479583740234375, -0.1958465576171875, -0.18689727783203125, -0.177947998046875, -0.16899871826171875, -0.1600494384765625, -0.15110015869140625, -0.14215087890625, -0.13320159912109375, -0.1242523193359375, -0.11530303955078125, -0.106353759765625, -0.09740447998046875, -0.0884552001953125, -0.07950592041015625, -0.070556640625, -0.06160736083984375, -0.0526580810546875, -0.04370880126953125, -0.034759521484375, -0.02581024169921875, -0.0168609619140625, -0.00791168212890625, 0.00103759765625, 0.00998687744140625, 0.0189361572265625, 0.02788543701171875, 0.036834716796875, 0.04578399658203125, 0.0547332763671875, 0.06368255615234375, 0.0726318359375, 0.08158111572265625, 0.0905303955078125, 0.09947967529296875, 0.108428955078125, 0.11737823486328125, 0.1263275146484375, 0.13527679443359375, 0.14422607421875, 0.15317535400390625, 0.1621246337890625, 0.17107391357421875, 0.180023193359375, 0.18897247314453125, 0.1979217529296875, 0.20687103271484375, 0.2158203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 2.0, 12.0, 10.0, 16.0, 16.0, 25.0, 32.0, 45.0, 59.0, 73.0, 81.0, 90.0, 87.0, 79.0, 85.0, 70.0, 63.0, 39.0, 26.0, 33.0, 14.0, 9.0, 8.0, 6.0, 8.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5367403030395508, -0.5201295614242554, -0.50351881980896, -0.48690807819366455, -0.47029733657836914, -0.45368659496307373, -0.43707582354545593, -0.4204650819301605, -0.4038543403148651, -0.3872435986995697, -0.3706328570842743, -0.3540221154689789, -0.3374113440513611, -0.3208006024360657, -0.30418986082077026, -0.28757911920547485, -0.27096837759017944, -0.25435763597488403, -0.23774689435958862, -0.22113613784313202, -0.2045253962278366, -0.1879146546125412, -0.1713038980960846, -0.15469315648078918, -0.13808241486549377, -0.12147167325019836, -0.10486092418432236, -0.08825017511844635, -0.07163943350315094, -0.05502869188785553, -0.03841794282197952, -0.021807193756103516, -0.0051964521408081055, 0.011414293199777603, 0.028025038540363312, 0.04463578388094902, 0.06124652922153473, 0.07785727083683014, 0.09446801990270615, 0.11107876896858215, 0.12768951058387756, 0.14430025219917297, 0.16091099381446838, 0.177521750330925, 0.1941324919462204, 0.2107432335615158, 0.2273539900779724, 0.24396473169326782, 0.26057547330856323, 0.27718621492385864, 0.29379695653915405, 0.31040769815444946, 0.3270184397697449, 0.3436291813850403, 0.3602399528026581, 0.3768506944179535, 0.3934614360332489, 0.4100721776485443, 0.4266829192638397, 0.44329366087913513, 0.45990443229675293, 0.47651517391204834, 0.49312591552734375, 0.5097366571426392, 0.5263473987579346]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 6.0, 7.0, 7.0, 11.0, 13.0, 16.0, 11.0, 22.0, 23.0, 30.0, 42.0, 46.0, 40.0, 51.0, 43.0, 40.0, 52.0, 53.0, 48.0, 57.0, 48.0, 44.0, 38.0, 39.0, 39.0, 34.0, 22.0, 26.0, 18.0, 15.0, 12.0, 12.0, 7.0, 9.0, 11.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3666754961013794, -0.35368362069129944, -0.3406917452812195, -0.32769984006881714, -0.3147079646587372, -0.3017160892486572, -0.2887241840362549, -0.2757323086261749, -0.26274043321609497, -0.24974855780601501, -0.23675666749477386, -0.22376477718353271, -0.21077290177345276, -0.1977810263633728, -0.18478913605213165, -0.1717972457408905, -0.15880537033081055, -0.1458134949207306, -0.13282160460948944, -0.11982972174882889, -0.10683783888816833, -0.09384595602750778, -0.08085407316684723, -0.06786219030618668, -0.05487030744552612, -0.04187842458486557, -0.028886541724205017, -0.015894658863544464, -0.002902776002883911, 0.010089106857776642, 0.023080989718437195, 0.03607287257909775, 0.04906478524208069, 0.06205666810274124, 0.0750485509634018, 0.08804043382406235, 0.1010323166847229, 0.11402419954538345, 0.127016082406044, 0.14000797271728516, 0.1529998481273651, 0.16599172353744507, 0.17898361384868622, 0.19197550415992737, 0.20496737957000732, 0.21795925498008728, 0.23095114529132843, 0.24394303560256958, 0.25693491101264954, 0.2699267864227295, 0.28291869163513184, 0.2959105670452118, 0.30890244245529175, 0.3218943178653717, 0.33488619327545166, 0.347878098487854, 0.36086997389793396, 0.3738618493080139, 0.38685375452041626, 0.3998456299304962, 0.41283750534057617, 0.42582938075065613, 0.4388212561607361, 0.4518131613731384, 0.4648050367832184]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 10.0, 14.0, 11.0, 14.0, 27.0, 46.0, 84.0, 142.0, 211.0, 408.0, 815.0, 1815.0, 4676.0, 15441.0, 74121.0, 552990.0, 336112.0, 44689.0, 10596.0, 3372.0, 1434.0, 708.0, 363.0, 181.0, 75.0, 59.0, 42.0, 24.0, 18.0, 18.0, 14.0, 7.0, 2.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1256103515625, -0.12075233459472656, -0.11589431762695312, -0.11103630065917969, -0.10617828369140625, -0.10132026672363281, -0.09646224975585938, -0.09160423278808594, -0.0867462158203125, -0.08188819885253906, -0.07703018188476562, -0.07217216491699219, -0.06731414794921875, -0.06245613098144531, -0.057598114013671875, -0.05274009704589844, -0.047882080078125, -0.04302406311035156, -0.038166046142578125, -0.03330802917480469, -0.02845001220703125, -0.023591995239257812, -0.018733978271484375, -0.013875961303710938, -0.0090179443359375, -0.0041599273681640625, 0.000698089599609375, 0.0055561065673828125, 0.01041412353515625, 0.015272140502929688, 0.020130157470703125, 0.024988174438476562, 0.02984619140625, 0.03470420837402344, 0.039562225341796875, 0.04442024230957031, 0.04927825927734375, 0.05413627624511719, 0.058994293212890625, 0.06385231018066406, 0.0687103271484375, 0.07356834411621094, 0.07842636108398438, 0.08328437805175781, 0.08814239501953125, 0.09300041198730469, 0.09785842895507812, 0.10271644592285156, 0.107574462890625, 0.11243247985839844, 0.11729049682617188, 0.12214851379394531, 0.12700653076171875, 0.1318645477294922, 0.13672256469726562, 0.14158058166503906, 0.1464385986328125, 0.15129661560058594, 0.15615463256835938, 0.1610126495361328, 0.16587066650390625, 0.1707286834716797, 0.17558670043945312, 0.18044471740722656, 0.185302734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 11.0, 5.0, 5.0, 14.0, 14.0, 21.0, 22.0, 29.0, 45.0, 41.0, 57.0, 60.0, 57.0, 55.0, 74.0, 69.0, 57.0, 71.0, 59.0, 44.0, 51.0, 25.0, 23.0, 18.0, 26.0, 13.0, 12.0, 10.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2196044921875, -0.20995521545410156, -0.20030593872070312, -0.1906566619873047, -0.18100738525390625, -0.1713581085205078, -0.16170883178710938, -0.15205955505371094, -0.1424102783203125, -0.13276100158691406, -0.12311172485351562, -0.11346244812011719, -0.10381317138671875, -0.09416389465332031, -0.08451461791992188, -0.07486534118652344, -0.065216064453125, -0.05556678771972656, -0.045917510986328125, -0.03626823425292969, -0.02661895751953125, -0.016969680786132812, -0.007320404052734375, 0.0023288726806640625, 0.0119781494140625, 0.021627426147460938, 0.031276702880859375, 0.04092597961425781, 0.05057525634765625, 0.06022453308105469, 0.06987380981445312, 0.07952308654785156, 0.08917236328125, 0.09882164001464844, 0.10847091674804688, 0.11812019348144531, 0.12776947021484375, 0.1374187469482422, 0.14706802368164062, 0.15671730041503906, 0.1663665771484375, 0.17601585388183594, 0.18566513061523438, 0.1953144073486328, 0.20496368408203125, 0.2146129608154297, 0.22426223754882812, 0.23391151428222656, 0.243560791015625, 0.25321006774902344, 0.2628593444824219, 0.2725086212158203, 0.28215789794921875, 0.2918071746826172, 0.3014564514160156, 0.31110572814941406, 0.3207550048828125, 0.33040428161621094, 0.3400535583496094, 0.3497028350830078, 0.35935211181640625, 0.3690013885498047, 0.3786506652832031, 0.38829994201660156, 0.39794921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 6.0, 6.0, 9.0, 12.0, 25.0, 30.0, 47.0, 57.0, 83.0, 127.0, 201.0, 312.0, 473.0, 763.0, 1123.0, 1772.0, 2914.0, 4581.0, 7648.0, 12821.0, 22268.0, 40861.0, 79225.0, 159420.0, 254367.0, 214767.0, 114234.0, 57450.0, 30244.0, 16974.0, 9845.0, 5910.0, 3595.0, 2293.0, 1447.0, 899.0, 597.0, 372.0, 267.0, 177.0, 118.0, 75.0, 41.0, 29.0, 17.0, 19.0, 10.0, 11.0, 5.0, 5.0, 6.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.041961669921875, -0.04071855545043945, -0.039475440979003906, -0.03823232650756836, -0.03698921203613281, -0.035746097564697266, -0.03450298309326172, -0.03325986862182617, -0.032016754150390625, -0.030773639678955078, -0.02953052520751953, -0.028287410736083984, -0.027044296264648438, -0.02580118179321289, -0.024558067321777344, -0.023314952850341797, -0.02207183837890625, -0.020828723907470703, -0.019585609436035156, -0.01834249496459961, -0.017099380493164062, -0.015856266021728516, -0.014613151550292969, -0.013370037078857422, -0.012126922607421875, -0.010883808135986328, -0.009640693664550781, -0.008397579193115234, -0.0071544647216796875, -0.005911350250244141, -0.004668235778808594, -0.003425121307373047, -0.0021820068359375, -0.0009388923645019531, 0.00030422210693359375, 0.0015473365783691406, 0.0027904510498046875, 0.004033565521240234, 0.005276679992675781, 0.006519794464111328, 0.007762908935546875, 0.009006023406982422, 0.010249137878417969, 0.011492252349853516, 0.012735366821289062, 0.01397848129272461, 0.015221595764160156, 0.016464710235595703, 0.01770782470703125, 0.018950939178466797, 0.020194053649902344, 0.02143716812133789, 0.022680282592773438, 0.023923397064208984, 0.02516651153564453, 0.026409626007080078, 0.027652740478515625, 0.028895854949951172, 0.03013896942138672, 0.031382083892822266, 0.03262519836425781, 0.03386831283569336, 0.035111427307128906, 0.03635454177856445, 0.03759765625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 6.0, 6.0, 11.0, 9.0, 12.0, 7.0, 11.0, 18.0, 33.0, 32.0, 36.0, 42.0, 43.0, 48.0, 49.0, 57.0, 53.0, 55.0, 44.0, 55.0, 53.0, 41.0, 40.0, 36.0, 34.0, 28.0, 28.0, 24.0, 11.0, 22.0, 10.0, 8.0, 6.0, 9.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389404296875, -0.3758087158203125, -0.362213134765625, -0.3486175537109375, -0.33502197265625, -0.3214263916015625, -0.307830810546875, -0.2942352294921875, -0.2806396484375, -0.2670440673828125, -0.253448486328125, -0.2398529052734375, -0.22625732421875, -0.2126617431640625, -0.199066162109375, -0.1854705810546875, -0.171875, -0.1582794189453125, -0.144683837890625, -0.1310882568359375, -0.11749267578125, -0.1038970947265625, -0.090301513671875, -0.0767059326171875, -0.0631103515625, -0.0495147705078125, -0.035919189453125, -0.0223236083984375, -0.00872802734375, 0.0048675537109375, 0.018463134765625, 0.0320587158203125, 0.045654296875, 0.0592498779296875, 0.072845458984375, 0.0864410400390625, 0.10003662109375, 0.1136322021484375, 0.127227783203125, 0.1408233642578125, 0.1544189453125, 0.1680145263671875, 0.181610107421875, 0.1952056884765625, 0.20880126953125, 0.2223968505859375, 0.235992431640625, 0.2495880126953125, 0.26318359375, 0.2767791748046875, 0.290374755859375, 0.3039703369140625, 0.31756591796875, 0.3311614990234375, 0.344757080078125, 0.3583526611328125, 0.3719482421875, 0.3855438232421875, 0.399139404296875, 0.4127349853515625, 0.42633056640625, 0.4399261474609375, 0.453521728515625, 0.4671173095703125, 0.480712890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 6.0, 6.0, 7.0, 11.0, 14.0, 18.0, 23.0, 22.0, 27.0, 54.0, 60.0, 95.0, 144.0, 192.0, 297.0, 466.0, 658.0, 1188.0, 2063.0, 3440.0, 6536.0, 13515.0, 29026.0, 63332.0, 134245.0, 248343.0, 261685.0, 148253.0, 70537.0, 32314.0, 15062.0, 7298.0, 3878.0, 2140.0, 1257.0, 739.0, 512.0, 331.0, 229.0, 155.0, 113.0, 68.0, 49.0, 39.0, 26.0, 24.0, 17.0, 13.0, 12.0, 5.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034732818603515625, -0.003353804349899292, -0.0032343268394470215, -0.003114849328994751, -0.0029953718185424805, -0.00287589430809021, -0.0027564167976379395, -0.002636939287185669, -0.0025174617767333984, -0.002397984266281128, -0.0022785067558288574, -0.002159029245376587, -0.0020395517349243164, -0.001920074224472046, -0.0018005967140197754, -0.0016811192035675049, -0.0015616416931152344, -0.0014421641826629639, -0.0013226866722106934, -0.0012032091617584229, -0.0010837316513061523, -0.0009642541408538818, -0.0008447766304016113, -0.0007252991199493408, -0.0006058216094970703, -0.0004863440990447998, -0.0003668665885925293, -0.0002473890781402588, -0.00012791156768798828, -8.434057235717773e-06, 0.00011104345321655273, 0.00023052096366882324, 0.00034999847412109375, 0.00046947598457336426, 0.0005889534950256348, 0.0007084310054779053, 0.0008279085159301758, 0.0009473860263824463, 0.0010668635368347168, 0.0011863410472869873, 0.0013058185577392578, 0.0014252960681915283, 0.0015447735786437988, 0.0016642510890960693, 0.0017837285995483398, 0.0019032061100006104, 0.002022683620452881, 0.0021421611309051514, 0.002261638641357422, 0.0023811161518096924, 0.002500593662261963, 0.0026200711727142334, 0.002739548683166504, 0.0028590261936187744, 0.002978503704071045, 0.0030979812145233154, 0.003217458724975586, 0.0033369362354278564, 0.003456413745880127, 0.0035758912563323975, 0.003695368766784668, 0.0038148462772369385, 0.003934323787689209, 0.0040538012981414795, 0.00417327880859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 8.0, 5.0, 4.0, 11.0, 8.0, 14.0, 14.0, 22.0, 37.0, 28.0, 32.0, 56.0, 76.0, 68.0, 84.0, 84.0, 74.0, 75.0, 76.0, 46.0, 33.0, 36.0, 19.0, 19.0, 18.0, 11.0, 8.0, 6.0, 5.0, 8.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1146068572998047e-05, -1.0829418897628784e-05, -1.0512769222259521e-05, -1.0196119546890259e-05, -9.879469871520996e-06, -9.562820196151733e-06, -9.24617052078247e-06, -8.929520845413208e-06, -8.612871170043945e-06, -8.296221494674683e-06, -7.97957181930542e-06, -7.662922143936157e-06, -7.3462724685668945e-06, -7.029622793197632e-06, -6.712973117828369e-06, -6.3963234424591064e-06, -6.079673767089844e-06, -5.763024091720581e-06, -5.446374416351318e-06, -5.129724740982056e-06, -4.813075065612793e-06, -4.49642539024353e-06, -4.179775714874268e-06, -3.863126039505005e-06, -3.546476364135742e-06, -3.2298266887664795e-06, -2.913177013397217e-06, -2.596527338027954e-06, -2.2798776626586914e-06, -1.9632279872894287e-06, -1.646578311920166e-06, -1.3299286365509033e-06, -1.0132789611816406e-06, -6.966292858123779e-07, -3.7997961044311523e-07, -6.332993507385254e-08, 2.5331974029541016e-07, 5.699694156646729e-07, 8.866190910339355e-07, 1.2032687664031982e-06, 1.519918441772461e-06, 1.8365681171417236e-06, 2.1532177925109863e-06, 2.469867467880249e-06, 2.7865171432495117e-06, 3.1031668186187744e-06, 3.419816493988037e-06, 3.7364661693573e-06, 4.0531158447265625e-06, 4.369765520095825e-06, 4.686415195465088e-06, 5.003064870834351e-06, 5.319714546203613e-06, 5.636364221572876e-06, 5.953013896942139e-06, 6.269663572311401e-06, 6.586313247680664e-06, 6.902962923049927e-06, 7.2196125984191895e-06, 7.536262273788452e-06, 7.852911949157715e-06, 8.169561624526978e-06, 8.48621129989624e-06, 8.802860975265503e-06, 9.119510650634766e-06]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 5.0, 3.0, 8.0, 14.0, 8.0, 13.0, 24.0, 21.0, 35.0, 54.0, 87.0, 159.0, 435.0, 1959.0, 19139.0, 337253.0, 638715.0, 45811.0, 3639.0, 611.0, 238.0, 108.0, 66.0, 38.0, 24.0, 25.0, 27.0, 11.0, 8.0, 6.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00959014892578125, -0.009208917617797852, -0.008827686309814453, -0.008446455001831055, -0.008065223693847656, -0.007683992385864258, -0.007302761077880859, -0.006921529769897461, -0.0065402984619140625, -0.006159067153930664, -0.005777835845947266, -0.005396604537963867, -0.005015373229980469, -0.00463414192199707, -0.004252910614013672, -0.0038716793060302734, -0.003490447998046875, -0.0031092166900634766, -0.002727985382080078, -0.0023467540740966797, -0.0019655227661132812, -0.0015842914581298828, -0.0012030601501464844, -0.0008218288421630859, -0.0004405975341796875, -5.936622619628906e-05, 0.0003218650817871094, 0.0007030963897705078, 0.0010843276977539062, 0.0014655590057373047, 0.0018467903137207031, 0.0022280216217041016, 0.0026092529296875, 0.0029904842376708984, 0.003371715545654297, 0.0037529468536376953, 0.004134178161621094, 0.004515409469604492, 0.004896640777587891, 0.005277872085571289, 0.0056591033935546875, 0.006040334701538086, 0.006421566009521484, 0.006802797317504883, 0.007184028625488281, 0.00756525993347168, 0.007946491241455078, 0.008327722549438477, 0.008708953857421875, 0.009090185165405273, 0.009471416473388672, 0.00985264778137207, 0.010233879089355469, 0.010615110397338867, 0.010996341705322266, 0.011377573013305664, 0.011758804321289062, 0.012140035629272461, 0.01252126693725586, 0.012902498245239258, 0.013283729553222656, 0.013664960861206055, 0.014046192169189453, 0.014427423477172852, 0.01480865478515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 9.0, 6.0, 4.0, 16.0, 16.0, 23.0, 26.0, 23.0, 32.0, 41.0, 35.0, 64.0, 67.0, 74.0, 96.0, 67.0, 71.0, 70.0, 45.0, 54.0, 44.0, 30.0, 26.0, 15.0, 17.0, 9.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010442733764648438, -0.0009997189044952393, -0.0009551644325256348, -0.0009106099605560303, -0.0008660554885864258, -0.0008215010166168213, -0.0007769465446472168, -0.0007323920726776123, -0.0006878376007080078, -0.0006432831287384033, -0.0005987286567687988, -0.0005541741847991943, -0.0005096197128295898, -0.00046506524085998535, -0.00042051076889038086, -0.00037595629692077637, -0.0003314018249511719, -0.0002868473529815674, -0.0002422928810119629, -0.0001977384090423584, -0.0001531839370727539, -0.00010862946510314941, -6.407499313354492e-05, -1.952052116394043e-05, 2.5033950805664062e-05, 6.958842277526855e-05, 0.00011414289474487305, 0.00015869736671447754, 0.00020325183868408203, 0.0002478063106536865, 0.000292360782623291, 0.0003369152545928955, 0.0003814697265625, 0.0004260241985321045, 0.000470578670501709, 0.0005151331424713135, 0.000559687614440918, 0.0006042420864105225, 0.000648796558380127, 0.0006933510303497314, 0.0007379055023193359, 0.0007824599742889404, 0.0008270144462585449, 0.0008715689182281494, 0.0009161233901977539, 0.0009606778621673584, 0.0010052323341369629, 0.0010497868061065674, 0.0010943412780761719, 0.0011388957500457764, 0.0011834502220153809, 0.0012280046939849854, 0.0012725591659545898, 0.0013171136379241943, 0.0013616681098937988, 0.0014062225818634033, 0.0014507770538330078, 0.0014953315258026123, 0.0015398859977722168, 0.0015844404697418213, 0.0016289949417114258, 0.0016735494136810303, 0.0017181038856506348, 0.0017626583576202393, 0.0018072128295898438]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 6.0, 13.0, 13.0, 24.0, 27.0, 49.0, 70.0, 93.0, 93.0, 94.0, 98.0, 92.0, 84.0, 68.0, 59.0, 29.0, 25.0, 18.0, 8.0, 11.0, 7.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31510552763938904, -0.30460652709007263, -0.2941075563430786, -0.2836085557937622, -0.2731095552444458, -0.2626105546951294, -0.2521115839481354, -0.24161258339881897, -0.23111359775066376, -0.22061461210250854, -0.21011561155319214, -0.19961662590503693, -0.1891176402568817, -0.1786186397075653, -0.1681196540594101, -0.15762066841125488, -0.14712166786193848, -0.13662268221378326, -0.12612368166446686, -0.11562469601631165, -0.10512570291757584, -0.09462670981884003, -0.08412772417068481, -0.073628731071949, -0.0631297379732132, -0.052630744874477386, -0.042131755501031876, -0.031632766127586365, -0.021133773028850555, -0.010634779930114746, -0.0001357942819595337, 0.010363198816776276, 0.020862221717834473, 0.03136121481657028, 0.04186020419001579, 0.052359193563461304, 0.06285818666219711, 0.07335717976093292, 0.08385616540908813, 0.09435515850782394, 0.10485415160655975, 0.11535314470529556, 0.12585213780403137, 0.13635112345218658, 0.1468501091003418, 0.1573491096496582, 0.16784809529781342, 0.17834708094596863, 0.18884608149528503, 0.19934506714344025, 0.20984406769275665, 0.22034305334091187, 0.23084205389022827, 0.24134103953838348, 0.2518400251865387, 0.2623390257358551, 0.2728379964828491, 0.2833369970321655, 0.29383596777915955, 0.30433496832847595, 0.31483396887779236, 0.3253329396247864, 0.3358319401741028, 0.3463309407234192, 0.3568299412727356]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 3.0, 4.0, 2.0, 6.0, 8.0, 6.0, 16.0, 14.0, 11.0, 21.0, 24.0, 30.0, 29.0, 53.0, 43.0, 52.0, 47.0, 35.0, 56.0, 57.0, 56.0, 48.0, 52.0, 48.0, 40.0, 45.0, 32.0, 31.0, 24.0, 25.0, 22.0, 9.0, 12.0, 12.0, 7.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.22186490893363953, -0.21434876322746277, -0.206832617521286, -0.19931647181510925, -0.1918003112077713, -0.18428416550159454, -0.17676801979541779, -0.16925187408924103, -0.16173572838306427, -0.1542195826768875, -0.14670343697071075, -0.1391872763633728, -0.13167113065719604, -0.12415498495101929, -0.11663883924484253, -0.10912269353866577, -0.10160654038190842, -0.09409039467573166, -0.0865742415189743, -0.07905809581279755, -0.07154195010662079, -0.06402580440044403, -0.056509651243686676, -0.04899350553750992, -0.04147735610604286, -0.033961206674575806, -0.026445060968399048, -0.01892891153693199, -0.011412763968110085, -0.0038966163992881775, 0.003619533032178879, 0.011135678738355637, 0.018651828169822693, 0.0261679757386446, 0.03368412330746651, 0.04120027273893356, 0.04871641844511032, 0.05623256787657738, 0.06374871730804443, 0.07126486301422119, 0.07878100872039795, 0.08629715442657471, 0.09381330758333206, 0.10132945328950882, 0.10884559899568558, 0.11636175215244293, 0.12387789785861969, 0.13139404356479645, 0.1389102041721344, 0.14642634987831116, 0.15394249558448792, 0.16145864129066467, 0.16897480189800262, 0.17649094760417938, 0.18400709331035614, 0.1915232390165329, 0.19903938472270966, 0.2065555304288864, 0.21407167613506317, 0.22158783674240112, 0.22910398244857788, 0.23662012815475464, 0.2441362738609314, 0.25165241956710815, 0.2591685652732849]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 6.0, 16.0, 11.0, 33.0, 38.0, 45.0, 67.0, 99.0, 149.0, 222.0, 365.0, 475.0, 756.0, 1324.0, 2093.0, 3642.0, 6903.0, 13984.0, 34216.0, 120040.0, 488144.0, 270546.0, 61814.0, 21402.0, 9813.0, 5025.0, 2815.0, 1609.0, 1007.0, 637.0, 416.0, 262.0, 163.0, 124.0, 99.0, 58.0, 35.0, 38.0, 19.0, 13.0, 9.0, 5.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.1541748046875, -0.14916229248046875, -0.1441497802734375, -0.13913726806640625, -0.134124755859375, -0.12911224365234375, -0.1240997314453125, -0.11908721923828125, -0.11407470703125, -0.10906219482421875, -0.1040496826171875, -0.09903717041015625, -0.094024658203125, -0.08901214599609375, -0.0839996337890625, -0.07898712158203125, -0.073974609375, -0.06896209716796875, -0.0639495849609375, -0.05893707275390625, -0.053924560546875, -0.04891204833984375, -0.0438995361328125, -0.03888702392578125, -0.03387451171875, -0.02886199951171875, -0.0238494873046875, -0.01883697509765625, -0.013824462890625, -0.00881195068359375, -0.0037994384765625, 0.00121307373046875, 0.0062255859375, 0.01123809814453125, 0.0162506103515625, 0.02126312255859375, 0.026275634765625, 0.03128814697265625, 0.0363006591796875, 0.04131317138671875, 0.04632568359375, 0.05133819580078125, 0.0563507080078125, 0.06136322021484375, 0.066375732421875, 0.07138824462890625, 0.0764007568359375, 0.08141326904296875, 0.08642578125, 0.09143829345703125, 0.0964508056640625, 0.10146331787109375, 0.106475830078125, 0.11148834228515625, 0.1165008544921875, 0.12151336669921875, 0.12652587890625, 0.13153839111328125, 0.1365509033203125, 0.14156341552734375, 0.146575927734375, 0.15158843994140625, 0.1566009521484375, 0.16161346435546875, 0.1666259765625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 7.0, 4.0, 10.0, 3.0, 11.0, 17.0, 26.0, 35.0, 30.0, 39.0, 57.0, 65.0, 51.0, 54.0, 52.0, 65.0, 58.0, 56.0, 68.0, 44.0, 51.0, 43.0, 23.0, 27.0, 21.0, 20.0, 15.0, 13.0, 5.0, 7.0, 5.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6181640625, -0.5990219116210938, -0.5798797607421875, -0.5607376098632812, -0.541595458984375, -0.5224533081054688, -0.5033111572265625, -0.48416900634765625, -0.46502685546875, -0.44588470458984375, -0.4267425537109375, -0.40760040283203125, -0.388458251953125, -0.36931610107421875, -0.3501739501953125, -0.33103179931640625, -0.3118896484375, -0.29274749755859375, -0.2736053466796875, -0.25446319580078125, -0.235321044921875, -0.21617889404296875, -0.1970367431640625, -0.17789459228515625, -0.15875244140625, -0.13961029052734375, -0.1204681396484375, -0.10132598876953125, -0.082183837890625, -0.06304168701171875, -0.0438995361328125, -0.02475738525390625, -0.005615234375, 0.01352691650390625, 0.0326690673828125, 0.05181121826171875, 0.070953369140625, 0.09009552001953125, 0.1092376708984375, 0.12837982177734375, 0.14752197265625, 0.16666412353515625, 0.1858062744140625, 0.20494842529296875, 0.224090576171875, 0.24323272705078125, 0.2623748779296875, 0.28151702880859375, 0.3006591796875, 0.31980133056640625, 0.3389434814453125, 0.35808563232421875, 0.377227783203125, 0.39636993408203125, 0.4155120849609375, 0.43465423583984375, 0.45379638671875, 0.47293853759765625, 0.4920806884765625, 0.5112228393554688, 0.530364990234375, 0.5495071411132812, 0.5686492919921875, 0.5877914428710938, 0.60693359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 9.0, 6.0, 8.0, 9.0, 17.0, 21.0, 22.0, 20.0, 30.0, 24.0, 27.0, 34.0, 38.0, 56.0, 70.0, 98.0, 203.0, 1959.0, 993751.0, 50936.0, 608.0, 155.0, 91.0, 43.0, 57.0, 31.0, 35.0, 37.0, 28.0, 21.0, 19.0, 13.0, 21.0, 11.0, 4.0, 13.0, 3.0, 7.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.62890625, -1.57769775390625, -1.5264892578125, -1.47528076171875, -1.424072265625, -1.37286376953125, -1.3216552734375, -1.27044677734375, -1.21923828125, -1.16802978515625, -1.1168212890625, -1.06561279296875, -1.014404296875, -0.96319580078125, -0.9119873046875, -0.86077880859375, -0.8095703125, -0.75836181640625, -0.7071533203125, -0.65594482421875, -0.604736328125, -0.55352783203125, -0.5023193359375, -0.45111083984375, -0.39990234375, -0.34869384765625, -0.2974853515625, -0.24627685546875, -0.195068359375, -0.14385986328125, -0.0926513671875, -0.04144287109375, 0.009765625, 0.06097412109375, 0.1121826171875, 0.16339111328125, 0.214599609375, 0.26580810546875, 0.3170166015625, 0.36822509765625, 0.41943359375, 0.47064208984375, 0.5218505859375, 0.57305908203125, 0.624267578125, 0.67547607421875, 0.7266845703125, 0.77789306640625, 0.8291015625, 0.88031005859375, 0.9315185546875, 0.98272705078125, 1.033935546875, 1.08514404296875, 1.1363525390625, 1.18756103515625, 1.23876953125, 1.28997802734375, 1.3411865234375, 1.39239501953125, 1.443603515625, 1.49481201171875, 1.5460205078125, 1.59722900390625, 1.6484375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 7.0, 5.0, 8.0, 13.0, 14.0, 18.0, 31.0, 30.0, 28.0, 31.0, 25.0, 33.0, 36.0, 42.0, 54.0, 34.0, 42.0, 54.0, 48.0, 64.0, 34.0, 40.0, 45.0, 36.0, 36.0, 36.0, 25.0, 29.0, 14.0, 19.0, 16.0, 9.0, 11.0, 9.0, 4.0, 3.0, 3.0, 7.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.451904296875, -0.4355659484863281, -0.41922760009765625, -0.4028892517089844, -0.3865509033203125, -0.3702125549316406, -0.35387420654296875, -0.3375358581542969, -0.321197509765625, -0.3048591613769531, -0.28852081298828125, -0.2721824645996094, -0.2558441162109375, -0.23950576782226562, -0.22316741943359375, -0.20682907104492188, -0.19049072265625, -0.17415237426757812, -0.15781402587890625, -0.14147567749023438, -0.1251373291015625, -0.10879898071289062, -0.09246063232421875, -0.07612228393554688, -0.059783935546875, -0.043445587158203125, -0.02710723876953125, -0.010768890380859375, 0.0055694580078125, 0.021907806396484375, 0.03824615478515625, 0.054584503173828125, 0.0709228515625, 0.08726119995117188, 0.10359954833984375, 0.11993789672851562, 0.1362762451171875, 0.15261459350585938, 0.16895294189453125, 0.18529129028320312, 0.201629638671875, 0.21796798706054688, 0.23430633544921875, 0.2506446838378906, 0.2669830322265625, 0.2833213806152344, 0.29965972900390625, 0.3159980773925781, 0.33233642578125, 0.3486747741699219, 0.36501312255859375, 0.3813514709472656, 0.3976898193359375, 0.4140281677246094, 0.43036651611328125, 0.4467048645019531, 0.463043212890625, 0.4793815612792969, 0.49571990966796875, 0.5120582580566406, 0.5283966064453125, 0.5447349548339844, 0.5610733032226562, 0.5774116516113281, 0.59375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 8.0, 3.0, 5.0, 7.0, 8.0, 7.0, 14.0, 10.0, 8.0, 21.0, 27.0, 31.0, 39.0, 63.0, 88.0, 145.0, 249.0, 730.0, 2478.0, 10518.0, 74672.0, 816663.0, 123111.0, 14688.0, 3223.0, 863.0, 365.0, 171.0, 90.0, 61.0, 52.0, 34.0, 26.0, 17.0, 16.0, 15.0, 9.0, 5.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07269287109375, -0.07005882263183594, -0.06742477416992188, -0.06479072570800781, -0.06215667724609375, -0.05952262878417969, -0.056888580322265625, -0.05425453186035156, -0.0516204833984375, -0.04898643493652344, -0.046352386474609375, -0.04371833801269531, -0.04108428955078125, -0.03845024108886719, -0.035816192626953125, -0.03318214416503906, -0.030548095703125, -0.027914047241210938, -0.025279998779296875, -0.022645950317382812, -0.02001190185546875, -0.017377853393554688, -0.014743804931640625, -0.012109756469726562, -0.0094757080078125, -0.0068416595458984375, -0.004207611083984375, -0.0015735626220703125, 0.00106048583984375, 0.0036945343017578125, 0.006328582763671875, 0.008962631225585938, 0.0115966796875, 0.014230728149414062, 0.016864776611328125, 0.019498825073242188, 0.02213287353515625, 0.024766921997070312, 0.027400970458984375, 0.030035018920898438, 0.0326690673828125, 0.03530311584472656, 0.037937164306640625, 0.04057121276855469, 0.04320526123046875, 0.04583930969238281, 0.048473358154296875, 0.05110740661621094, 0.053741455078125, 0.05637550354003906, 0.059009552001953125, 0.06164360046386719, 0.06427764892578125, 0.06691169738769531, 0.06954574584960938, 0.07217979431152344, 0.0748138427734375, 0.07744789123535156, 0.08008193969726562, 0.08271598815917969, 0.08535003662109375, 0.08798408508300781, 0.09061813354492188, 0.09325218200683594, 0.09588623046875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 7.0, 9.0, 10.0, 8.0, 14.0, 17.0, 28.0, 31.0, 44.0, 101.0, 103.0, 105.0, 110.0, 120.0, 77.0, 64.0, 37.0, 16.0, 18.0, 9.0, 16.0, 17.0, 2.0, 4.0, 5.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.715557098388672e-06, -9.46037471294403e-06, -9.20519232749939e-06, -8.950009942054749e-06, -8.694827556610107e-06, -8.439645171165466e-06, -8.184462785720825e-06, -7.929280400276184e-06, -7.674098014831543e-06, -7.418915629386902e-06, -7.163733243942261e-06, -6.90855085849762e-06, -6.6533684730529785e-06, -6.398186087608337e-06, -6.143003702163696e-06, -5.887821316719055e-06, -5.632638931274414e-06, -5.377456545829773e-06, -5.122274160385132e-06, -4.867091774940491e-06, -4.61190938949585e-06, -4.3567270040512085e-06, -4.101544618606567e-06, -3.846362233161926e-06, -3.591179847717285e-06, -3.335997462272644e-06, -3.080815076828003e-06, -2.825632691383362e-06, -2.5704503059387207e-06, -2.3152679204940796e-06, -2.0600855350494385e-06, -1.8049031496047974e-06, -1.5497207641601562e-06, -1.2945383787155151e-06, -1.039355993270874e-06, -7.841736078262329e-07, -5.289912223815918e-07, -2.738088369369507e-07, -1.862645149230957e-08, 2.3655593395233154e-07, 4.917383193969727e-07, 7.469207048416138e-07, 1.0021030902862549e-06, 1.257285475730896e-06, 1.5124678611755371e-06, 1.7676502466201782e-06, 2.0228326320648193e-06, 2.2780150175094604e-06, 2.5331974029541016e-06, 2.7883797883987427e-06, 3.043562173843384e-06, 3.298744559288025e-06, 3.553926944732666e-06, 3.809109330177307e-06, 4.064291715621948e-06, 4.319474101066589e-06, 4.5746564865112305e-06, 4.829838871955872e-06, 5.085021257400513e-06, 5.340203642845154e-06, 5.595386028289795e-06, 5.850568413734436e-06, 6.105750799179077e-06, 6.360933184623718e-06, 6.616115570068359e-06]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 7.0, 10.0, 12.0, 21.0, 18.0, 33.0, 44.0, 81.0, 136.0, 442.0, 1548.0, 8301.0, 87036.0, 889305.0, 53258.0, 6300.0, 1295.0, 372.0, 136.0, 59.0, 36.0, 24.0, 17.0, 11.0, 12.0, 5.0, 9.0, 4.0, 5.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10205078125, -0.09803581237792969, -0.09402084350585938, -0.09000587463378906, -0.08599090576171875, -0.08197593688964844, -0.07796096801757812, -0.07394599914550781, -0.0699310302734375, -0.06591606140136719, -0.061901092529296875, -0.05788612365722656, -0.05387115478515625, -0.04985618591308594, -0.045841217041015625, -0.04182624816894531, -0.037811279296875, -0.03379631042480469, -0.029781341552734375, -0.025766372680664062, -0.02175140380859375, -0.017736434936523438, -0.013721466064453125, -0.009706497192382812, -0.0056915283203125, -0.0016765594482421875, 0.002338409423828125, 0.0063533782958984375, 0.01036834716796875, 0.014383316040039062, 0.018398284912109375, 0.022413253784179688, 0.02642822265625, 0.030443191528320312, 0.034458160400390625, 0.03847312927246094, 0.04248809814453125, 0.04650306701660156, 0.050518035888671875, 0.05453300476074219, 0.0585479736328125, 0.06256294250488281, 0.06657791137695312, 0.07059288024902344, 0.07460784912109375, 0.07862281799316406, 0.08263778686523438, 0.08665275573730469, 0.090667724609375, 0.09468269348144531, 0.09869766235351562, 0.10271263122558594, 0.10672760009765625, 0.11074256896972656, 0.11475753784179688, 0.11877250671386719, 0.1227874755859375, 0.1268024444580078, 0.13081741333007812, 0.13483238220214844, 0.13884735107421875, 0.14286231994628906, 0.14687728881835938, 0.1508922576904297, 0.1549072265625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 2.0, 4.0, 7.0, 9.0, 15.0, 17.0, 33.0, 25.0, 34.0, 48.0, 62.0, 81.0, 159.0, 144.0, 94.0, 61.0, 48.0, 41.0, 21.0, 13.0, 10.0, 14.0, 9.0, 8.0, 3.0, 7.0, 2.0, 4.0, 7.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023193359375, -0.022421598434448242, -0.021649837493896484, -0.020878076553344727, -0.02010631561279297, -0.01933455467224121, -0.018562793731689453, -0.017791032791137695, -0.017019271850585938, -0.01624751091003418, -0.015475749969482422, -0.014703989028930664, -0.013932228088378906, -0.013160467147827148, -0.01238870620727539, -0.011616945266723633, -0.010845184326171875, -0.010073423385620117, -0.00930166244506836, -0.008529901504516602, -0.007758140563964844, -0.006986379623413086, -0.006214618682861328, -0.00544285774230957, -0.0046710968017578125, -0.0038993358612060547, -0.003127574920654297, -0.002355813980102539, -0.0015840530395507812, -0.0008122920989990234, -4.0531158447265625e-05, 0.0007312297821044922, 0.00150299072265625, 0.002274751663208008, 0.0030465126037597656, 0.0038182735443115234, 0.004590034484863281, 0.005361795425415039, 0.006133556365966797, 0.006905317306518555, 0.0076770782470703125, 0.00844883918762207, 0.009220600128173828, 0.009992361068725586, 0.010764122009277344, 0.011535882949829102, 0.01230764389038086, 0.013079404830932617, 0.013851165771484375, 0.014622926712036133, 0.01539468765258789, 0.01616644859313965, 0.016938209533691406, 0.017709970474243164, 0.018481731414794922, 0.01925349235534668, 0.020025253295898438, 0.020797014236450195, 0.021568775177001953, 0.02234053611755371, 0.02311229705810547, 0.023884057998657227, 0.024655818939208984, 0.025427579879760742, 0.0261993408203125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 20.0, 25.0, 77.0, 156.0, 222.0, 212.0, 158.0, 76.0, 35.0, 15.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5838356018066406, -0.535101592540741, -0.4863676130771637, -0.43763360381126404, -0.38889962434768677, -0.3401656150817871, -0.29143160581588745, -0.24269762635231018, -0.19396361708641052, -0.14522962272167206, -0.096495620906353, -0.047761619091033936, 0.0009723752737045288, 0.04970636963844299, 0.09844037890434265, 0.14717435836791992, 0.19590836763381958, 0.24464236199855804, 0.2933763563632965, 0.34211036562919617, 0.39084434509277344, 0.4395783543586731, 0.48831236362457275, 0.5370463132858276, 0.5857803821563721, 0.6345143914222717, 0.6832484006881714, 0.7319823503494263, 0.7807163596153259, 0.8294503688812256, 0.8781843781471252, 0.9269183874130249, 0.9756523370742798, 1.0243862867355347, 1.073120355606079, 1.121854305267334, 1.1705883741378784, 1.2193223237991333, 1.2680563926696777, 1.3167903423309326, 1.3655242919921875, 1.4142582416534424, 1.4629923105239868, 1.5117262601852417, 1.5604603290557861, 1.609194278717041, 1.657928228378296, 1.7066622972488403, 1.7553963661193848, 1.8041303157806396, 1.852864384651184, 1.901598334312439, 1.9503324031829834, 1.9990663528442383, 2.047800302505493, 2.096534252166748, 2.145268201828003, 2.194002151489258, 2.2427361011505127, 2.2914702892303467, 2.3402042388916016, 2.3889381885528564, 2.4376721382141113, 2.486406087875366, 2.5351402759552]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 8.0, 11.0, 12.0, 7.0, 10.0, 14.0, 21.0, 17.0, 20.0, 26.0, 26.0, 31.0, 24.0, 35.0, 26.0, 32.0, 41.0, 35.0, 36.0, 48.0, 38.0, 40.0, 46.0, 40.0, 35.0, 36.0, 35.0, 27.0, 30.0, 25.0, 34.0, 24.0, 11.0, 23.0, 16.0, 9.0, 15.0, 8.0, 5.0, 4.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.8181977272033691, -0.7946558594703674, -0.771113932132721, -0.7475720643997192, -0.7240301966667175, -0.7004883289337158, -0.6769464015960693, -0.6534045338630676, -0.6298626661300659, -0.6063207983970642, -0.5827788710594177, -0.559237003326416, -0.5356951355934143, -0.5121532678604126, -0.4886113405227661, -0.4650694727897644, -0.4415275752544403, -0.4179856777191162, -0.3944438099861145, -0.3709019124507904, -0.3473600447177887, -0.3238181471824646, -0.3002762794494629, -0.2767343819141388, -0.2531924843788147, -0.2296506017446518, -0.2061087191104889, -0.1825668215751648, -0.15902495384216309, -0.135483056306839, -0.11194117367267609, -0.08839929103851318, -0.06485742330551147, -0.04131554067134857, -0.01777365431189537, 0.005768232047557831, 0.029310114681720734, 0.052851997315883636, 0.07639388740062714, 0.09993577003479004, 0.12347765266895294, 0.14701953530311584, 0.17056141793727875, 0.19410330057144165, 0.21764519810676575, 0.24118706583976746, 0.26472896337509155, 0.28827083110809326, 0.31181272864341736, 0.33535462617874146, 0.35889649391174316, 0.38243839144706726, 0.40598025918006897, 0.42952215671539307, 0.4530640244483948, 0.47660592198371887, 0.500147819519043, 0.5236896872520447, 0.5472316145896912, 0.5707734823226929, 0.5943153500556946, 0.6178572177886963, 0.6413991451263428, 0.6649410128593445, 0.6884828805923462]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 7.0, 6.0, 11.0, 7.0, 8.0, 7.0, 10.0, 15.0, 29.0, 29.0, 41.0, 47.0, 97.0, 113.0, 192.0, 266.0, 370.0, 647.0, 993.0, 1746.0, 2967.0, 5119.0, 11316.0, 29459.0, 124072.0, 683035.0, 2013408.0, 1032873.0, 209563.0, 48131.0, 14844.0, 6535.0, 3291.0, 1923.0, 1137.0, 689.0, 431.0, 305.0, 165.0, 129.0, 81.0, 41.0, 36.0, 31.0, 22.0, 13.0, 15.0, 5.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.409423828125, -0.39725494384765625, -0.3850860595703125, -0.37291717529296875, -0.360748291015625, -0.34857940673828125, -0.3364105224609375, -0.32424163818359375, -0.31207275390625, -0.29990386962890625, -0.2877349853515625, -0.27556610107421875, -0.263397216796875, -0.25122833251953125, -0.2390594482421875, -0.22689056396484375, -0.2147216796875, -0.20255279541015625, -0.1903839111328125, -0.17821502685546875, -0.166046142578125, -0.15387725830078125, -0.1417083740234375, -0.12953948974609375, -0.11737060546875, -0.10520172119140625, -0.0930328369140625, -0.08086395263671875, -0.068695068359375, -0.05652618408203125, -0.0443572998046875, -0.03218841552734375, -0.02001953125, -0.00785064697265625, 0.0043182373046875, 0.01648712158203125, 0.028656005859375, 0.04082489013671875, 0.0529937744140625, 0.06516265869140625, 0.07733154296875, 0.08950042724609375, 0.1016693115234375, 0.11383819580078125, 0.126007080078125, 0.13817596435546875, 0.1503448486328125, 0.16251373291015625, 0.1746826171875, 0.18685150146484375, 0.1990203857421875, 0.21118927001953125, 0.223358154296875, 0.23552703857421875, 0.2476959228515625, 0.25986480712890625, 0.27203369140625, 0.28420257568359375, 0.2963714599609375, 0.30854034423828125, 0.320709228515625, 0.33287811279296875, 0.3450469970703125, 0.35721588134765625, 0.369384765625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 2.0, 14.0, 8.0, 10.0, 6.0, 13.0, 13.0, 14.0, 23.0, 31.0, 33.0, 42.0, 43.0, 36.0, 42.0, 46.0, 37.0, 60.0, 52.0, 58.0, 48.0, 42.0, 47.0, 42.0, 30.0, 32.0, 29.0, 23.0, 16.0, 23.0, 19.0, 12.0, 17.0, 8.0, 10.0, 4.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2783203125, -0.268463134765625, -0.25860595703125, -0.248748779296875, -0.2388916015625, -0.229034423828125, -0.21917724609375, -0.209320068359375, -0.199462890625, -0.189605712890625, -0.17974853515625, -0.169891357421875, -0.1600341796875, -0.150177001953125, -0.14031982421875, -0.130462646484375, -0.12060546875, -0.110748291015625, -0.10089111328125, -0.091033935546875, -0.0811767578125, -0.071319580078125, -0.06146240234375, -0.051605224609375, -0.041748046875, -0.031890869140625, -0.02203369140625, -0.012176513671875, -0.0023193359375, 0.007537841796875, 0.01739501953125, 0.027252197265625, 0.037109375, 0.046966552734375, 0.05682373046875, 0.066680908203125, 0.0765380859375, 0.086395263671875, 0.09625244140625, 0.106109619140625, 0.115966796875, 0.125823974609375, 0.13568115234375, 0.145538330078125, 0.1553955078125, 0.165252685546875, 0.17510986328125, 0.184967041015625, 0.19482421875, 0.204681396484375, 0.21453857421875, 0.224395751953125, 0.2342529296875, 0.244110107421875, 0.25396728515625, 0.263824462890625, 0.273681640625, 0.283538818359375, 0.29339599609375, 0.303253173828125, 0.3131103515625, 0.322967529296875, 0.33282470703125, 0.342681884765625, 0.3525390625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 13.0, 13.0, 9.0, 23.0, 25.0, 26.0, 69.0, 89.0, 203.0, 592.0, 9119.0, 4152627.0, 29976.0, 933.0, 248.0, 117.0, 66.0, 51.0, 35.0, 15.0, 14.0, 9.0, 3.0, 3.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.697265625, -1.6107177734375, -1.524169921875, -1.4376220703125, -1.35107421875, -1.2645263671875, -1.177978515625, -1.0914306640625, -1.0048828125, -0.9183349609375, -0.831787109375, -0.7452392578125, -0.65869140625, -0.5721435546875, -0.485595703125, -0.3990478515625, -0.3125, -0.2259521484375, -0.139404296875, -0.0528564453125, 0.03369140625, 0.1202392578125, 0.206787109375, 0.2933349609375, 0.3798828125, 0.4664306640625, 0.552978515625, 0.6395263671875, 0.72607421875, 0.8126220703125, 0.899169921875, 0.9857177734375, 1.072265625, 1.1588134765625, 1.245361328125, 1.3319091796875, 1.41845703125, 1.5050048828125, 1.591552734375, 1.6781005859375, 1.7646484375, 1.8511962890625, 1.937744140625, 2.0242919921875, 2.11083984375, 2.1973876953125, 2.283935546875, 2.3704833984375, 2.45703125, 2.5435791015625, 2.630126953125, 2.7166748046875, 2.80322265625, 2.8897705078125, 2.976318359375, 3.0628662109375, 3.1494140625, 3.2359619140625, 3.322509765625, 3.4090576171875, 3.49560546875, 3.5821533203125, 3.668701171875, 3.7552490234375, 3.841796875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 5.0, 2.0, 5.0, 11.0, 11.0, 12.0, 31.0, 35.0, 42.0, 77.0, 94.0, 203.0, 338.0, 601.0, 892.0, 720.0, 376.0, 223.0, 113.0, 89.0, 63.0, 36.0, 28.0, 20.0, 21.0, 11.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.26220703125, -0.2560558319091797, -0.24990463256835938, -0.24375343322753906, -0.23760223388671875, -0.23145103454589844, -0.22529983520507812, -0.2191486358642578, -0.2129974365234375, -0.2068462371826172, -0.20069503784179688, -0.19454383850097656, -0.18839263916015625, -0.18224143981933594, -0.17609024047851562, -0.1699390411376953, -0.163787841796875, -0.1576366424560547, -0.15148544311523438, -0.14533424377441406, -0.13918304443359375, -0.13303184509277344, -0.12688064575195312, -0.12072944641113281, -0.1145782470703125, -0.10842704772949219, -0.10227584838867188, -0.09612464904785156, -0.08997344970703125, -0.08382225036621094, -0.07767105102539062, -0.07151985168457031, -0.06536865234375, -0.05921745300292969, -0.053066253662109375, -0.04691505432128906, -0.04076385498046875, -0.03461265563964844, -0.028461456298828125, -0.022310256958007812, -0.0161590576171875, -0.010007858276367188, -0.003856658935546875, 0.0022945404052734375, 0.00844573974609375, 0.014596939086914062, 0.020748138427734375, 0.026899337768554688, 0.033050537109375, 0.03920173645019531, 0.045352935791015625, 0.05150413513183594, 0.05765533447265625, 0.06380653381347656, 0.06995773315429688, 0.07610893249511719, 0.0822601318359375, 0.08841133117675781, 0.09456253051757812, 0.10071372985839844, 0.10686492919921875, 0.11301612854003906, 0.11916732788085938, 0.1253185272216797, 0.1314697265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 1.0, 1.0, 3.0, 4.0, 12.0, 14.0, 15.0, 29.0, 39.0, 44.0, 61.0, 106.0, 121.0, 134.0, 113.0, 98.0, 64.0, 53.0, 32.0, 21.0, 17.0, 11.0, 8.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5870668292045593, -0.5669479966163635, -0.5468291640281677, -0.5267103314399719, -0.5065914392471313, -0.48647263646125793, -0.46635377407073975, -0.44623494148254395, -0.42611610889434814, -0.40599727630615234, -0.38587844371795654, -0.36575958132743835, -0.34564074873924255, -0.32552191615104675, -0.30540305376052856, -0.28528422117233276, -0.26516538858413696, -0.24504655599594116, -0.22492770850658417, -0.20480886101722717, -0.18469002842903137, -0.16457119584083557, -0.14445234835147858, -0.12433350086212158, -0.10421466827392578, -0.08409582823514938, -0.06397698819637299, -0.04385814815759659, -0.02373930811882019, -0.0036204680800437927, 0.016498371958732605, 0.0366172194480896, 0.0567360520362854, 0.0768548920750618, 0.0969737321138382, 0.1170925721526146, 0.137211412191391, 0.1573302447795868, 0.1774490922689438, 0.19756793975830078, 0.21768677234649658, 0.23780560493469238, 0.2579244375228882, 0.27804329991340637, 0.2981621325016022, 0.318280965089798, 0.33839982748031616, 0.35851866006851196, 0.37863749265670776, 0.39875632524490356, 0.41887515783309937, 0.43899402022361755, 0.45911285281181335, 0.47923168540000916, 0.49935054779052734, 0.5194693803787231, 0.539588212966919, 0.5597070455551147, 0.5798258781433105, 0.5999447107315063, 0.6200635433197021, 0.6401824355125427, 0.6603012681007385, 0.6804201006889343, 0.7005389332771301]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 3.0, 8.0, 15.0, 17.0, 12.0, 13.0, 20.0, 31.0, 28.0, 32.0, 29.0, 34.0, 31.0, 40.0, 36.0, 41.0, 49.0, 51.0, 57.0, 59.0, 51.0, 39.0, 31.0, 43.0, 31.0, 37.0, 32.0, 22.0, 21.0, 17.0, 13.0, 12.0, 11.0, 8.0, 5.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.3655202388763428, -0.35440778732299805, -0.3432953357696533, -0.3321828842163086, -0.32107046246528625, -0.30995801091194153, -0.2988455593585968, -0.2877331078052521, -0.27662065625190735, -0.2655082046985626, -0.2543957531452179, -0.24328331649303436, -0.23217086493968964, -0.2210584282875061, -0.20994597673416138, -0.19883352518081665, -0.18772108852863312, -0.1766086369752884, -0.16549620032310486, -0.15438374876976013, -0.1432712972164154, -0.13215884566307068, -0.12104640901088715, -0.10993395745754242, -0.09882151335477829, -0.08770906925201416, -0.07659661769866943, -0.0654841735959053, -0.054371725767850876, -0.04325927793979645, -0.03214683383703232, -0.02103438228368759, -0.009921938180923462, 0.0011905087158083916, 0.012302955612540245, 0.023415401577949524, 0.03452784940600395, 0.04564029723405838, 0.05675274133682251, 0.06786519289016724, 0.07897763699293137, 0.0900900810956955, 0.10120253264904022, 0.11231497675180435, 0.12342742085456848, 0.1345398724079132, 0.14565232396125793, 0.15676477551460266, 0.1678772121667862, 0.17898966372013092, 0.19010210037231445, 0.20121455192565918, 0.2123270034790039, 0.22343945503234863, 0.23455189168453217, 0.2456643432378769, 0.2567767798900604, 0.26788923144340515, 0.2790016829967499, 0.2901141047477722, 0.30122655630111694, 0.31233900785446167, 0.3234514594078064, 0.3345639109611511, 0.34567636251449585]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 7.0, 4.0, 5.0, 12.0, 20.0, 31.0, 42.0, 52.0, 85.0, 148.0, 237.0, 383.0, 692.0, 1469.0, 3351.0, 8545.0, 26195.0, 99214.0, 451564.0, 349855.0, 73390.0, 20550.0, 7124.0, 2788.0, 1243.0, 634.0, 340.0, 214.0, 120.0, 77.0, 59.0, 36.0, 24.0, 16.0, 10.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10406494140625, -0.10080242156982422, -0.09753990173339844, -0.09427738189697266, -0.09101486206054688, -0.0877523422241211, -0.08448982238769531, -0.08122730255126953, -0.07796478271484375, -0.07470226287841797, -0.07143974304199219, -0.0681772232055664, -0.06491470336914062, -0.061652183532714844, -0.05838966369628906, -0.05512714385986328, -0.0518646240234375, -0.04860210418701172, -0.04533958435058594, -0.042077064514160156, -0.038814544677734375, -0.035552024841308594, -0.03228950500488281, -0.02902698516845703, -0.02576446533203125, -0.02250194549560547, -0.019239425659179688, -0.015976905822753906, -0.012714385986328125, -0.009451866149902344, -0.0061893463134765625, -0.0029268264770507812, 0.000335693359375, 0.0035982131958007812, 0.0068607330322265625, 0.010123252868652344, 0.013385772705078125, 0.016648292541503906, 0.019910812377929688, 0.02317333221435547, 0.02643585205078125, 0.02969837188720703, 0.03296089172363281, 0.036223411560058594, 0.039485931396484375, 0.042748451232910156, 0.04601097106933594, 0.04927349090576172, 0.0525360107421875, 0.05579853057861328, 0.05906105041503906, 0.062323570251464844, 0.06558609008789062, 0.0688486099243164, 0.07211112976074219, 0.07537364959716797, 0.07863616943359375, 0.08189868927001953, 0.08516120910644531, 0.0884237289428711, 0.09168624877929688, 0.09494876861572266, 0.09821128845214844, 0.10147380828857422, 0.104736328125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 12.0, 12.0, 12.0, 26.0, 25.0, 27.0, 50.0, 44.0, 43.0, 73.0, 56.0, 74.0, 75.0, 101.0, 58.0, 56.0, 46.0, 54.0, 45.0, 25.0, 18.0, 23.0, 14.0, 9.0, 3.0, 2.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.321044921875, -0.31110382080078125, -0.3011627197265625, -0.29122161865234375, -0.281280517578125, -0.27133941650390625, -0.2613983154296875, -0.25145721435546875, -0.24151611328125, -0.23157501220703125, -0.2216339111328125, -0.21169281005859375, -0.201751708984375, -0.19181060791015625, -0.1818695068359375, -0.17192840576171875, -0.1619873046875, -0.15204620361328125, -0.1421051025390625, -0.13216400146484375, -0.122222900390625, -0.11228179931640625, -0.1023406982421875, -0.09239959716796875, -0.08245849609375, -0.07251739501953125, -0.0625762939453125, -0.05263519287109375, -0.042694091796875, -0.03275299072265625, -0.0228118896484375, -0.01287078857421875, -0.0029296875, 0.00701141357421875, 0.0169525146484375, 0.02689361572265625, 0.036834716796875, 0.04677581787109375, 0.0567169189453125, 0.06665802001953125, 0.07659912109375, 0.08654022216796875, 0.0964813232421875, 0.10642242431640625, 0.116363525390625, 0.12630462646484375, 0.1362457275390625, 0.14618682861328125, 0.1561279296875, 0.16606903076171875, 0.1760101318359375, 0.18595123291015625, 0.195892333984375, 0.20583343505859375, 0.2157745361328125, 0.22571563720703125, 0.23565673828125, 0.24559783935546875, 0.2555389404296875, 0.26548004150390625, 0.275421142578125, 0.28536224365234375, 0.2953033447265625, 0.30524444580078125, 0.315185546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 12.0, 14.0, 21.0, 30.0, 39.0, 71.0, 100.0, 161.0, 223.0, 351.0, 509.0, 873.0, 1247.0, 1904.0, 2950.0, 4643.0, 7092.0, 11329.0, 18049.0, 29351.0, 50678.0, 90538.0, 158164.0, 217140.0, 184871.0, 111864.0, 62316.0, 35481.0, 21353.0, 13298.0, 8414.0, 5404.0, 3478.0, 2254.0, 1545.0, 912.0, 667.0, 408.0, 298.0, 198.0, 109.0, 78.0, 42.0, 25.0, 18.0, 17.0, 10.0, 3.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0364990234375, -0.0354151725769043, -0.034331321716308594, -0.03324747085571289, -0.03216361999511719, -0.031079769134521484, -0.02999591827392578, -0.028912067413330078, -0.027828216552734375, -0.026744365692138672, -0.02566051483154297, -0.024576663970947266, -0.023492813110351562, -0.02240896224975586, -0.021325111389160156, -0.020241260528564453, -0.01915740966796875, -0.018073558807373047, -0.016989707946777344, -0.01590585708618164, -0.014822006225585938, -0.013738155364990234, -0.012654304504394531, -0.011570453643798828, -0.010486602783203125, -0.009402751922607422, -0.008318901062011719, -0.007235050201416016, -0.0061511993408203125, -0.005067348480224609, -0.003983497619628906, -0.002899646759033203, -0.0018157958984375, -0.0007319450378417969, 0.00035190582275390625, 0.0014357566833496094, 0.0025196075439453125, 0.0036034584045410156, 0.004687309265136719, 0.005771160125732422, 0.006855010986328125, 0.007938861846923828, 0.009022712707519531, 0.010106563568115234, 0.011190414428710938, 0.01227426528930664, 0.013358116149902344, 0.014441967010498047, 0.01552581787109375, 0.016609668731689453, 0.017693519592285156, 0.01877737045288086, 0.019861221313476562, 0.020945072174072266, 0.02202892303466797, 0.023112773895263672, 0.024196624755859375, 0.025280475616455078, 0.02636432647705078, 0.027448177337646484, 0.028532028198242188, 0.02961587905883789, 0.030699729919433594, 0.0317835807800293, 0.032867431640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 6.0, 4.0, 9.0, 8.0, 16.0, 11.0, 10.0, 15.0, 14.0, 21.0, 20.0, 28.0, 28.0, 18.0, 33.0, 35.0, 34.0, 51.0, 41.0, 39.0, 48.0, 41.0, 42.0, 41.0, 48.0, 37.0, 31.0, 40.0, 27.0, 16.0, 21.0, 23.0, 26.0, 23.0, 23.0, 11.0, 13.0, 11.0, 7.0, 8.0, 7.0, 8.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33984375, -0.32840728759765625, -0.3169708251953125, -0.30553436279296875, -0.294097900390625, -0.28266143798828125, -0.2712249755859375, -0.25978851318359375, -0.24835205078125, -0.23691558837890625, -0.2254791259765625, -0.21404266357421875, -0.202606201171875, -0.19116973876953125, -0.1797332763671875, -0.16829681396484375, -0.1568603515625, -0.14542388916015625, -0.1339874267578125, -0.12255096435546875, -0.111114501953125, -0.09967803955078125, -0.0882415771484375, -0.07680511474609375, -0.06536865234375, -0.05393218994140625, -0.0424957275390625, -0.03105926513671875, -0.019622802734375, -0.00818634033203125, 0.0032501220703125, 0.01468658447265625, 0.026123046875, 0.03755950927734375, 0.0489959716796875, 0.06043243408203125, 0.071868896484375, 0.08330535888671875, 0.0947418212890625, 0.10617828369140625, 0.11761474609375, 0.12905120849609375, 0.1404876708984375, 0.15192413330078125, 0.163360595703125, 0.17479705810546875, 0.1862335205078125, 0.19766998291015625, 0.2091064453125, 0.22054290771484375, 0.2319793701171875, 0.24341583251953125, 0.254852294921875, 0.26628875732421875, 0.2777252197265625, 0.28916168212890625, 0.30059814453125, 0.31203460693359375, 0.3234710693359375, 0.33490753173828125, 0.346343994140625, 0.35778045654296875, 0.3692169189453125, 0.38065338134765625, 0.39208984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 9.0, 11.0, 22.0, 20.0, 29.0, 43.0, 74.0, 91.0, 121.0, 191.0, 301.0, 402.0, 622.0, 953.0, 1521.0, 2420.0, 4338.0, 8533.0, 18083.0, 41661.0, 101020.0, 227740.0, 307445.0, 187948.0, 80210.0, 33543.0, 14505.0, 6982.0, 3697.0, 2158.0, 1255.0, 825.0, 570.0, 357.0, 245.0, 183.0, 119.0, 89.0, 64.0, 43.0, 34.0, 24.0, 17.0, 6.0, 9.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.00487518310546875, -0.00473332405090332, -0.004591464996337891, -0.004449605941772461, -0.004307746887207031, -0.0041658878326416016, -0.004024028778076172, -0.003882169723510742, -0.0037403106689453125, -0.003598451614379883, -0.003456592559814453, -0.0033147335052490234, -0.0031728744506835938, -0.003031015396118164, -0.0028891563415527344, -0.0027472972869873047, -0.002605438232421875, -0.0024635791778564453, -0.0023217201232910156, -0.002179861068725586, -0.0020380020141601562, -0.0018961429595947266, -0.0017542839050292969, -0.0016124248504638672, -0.0014705657958984375, -0.0013287067413330078, -0.0011868476867675781, -0.0010449886322021484, -0.0009031295776367188, -0.0007612705230712891, -0.0006194114685058594, -0.0004775524139404297, -0.000335693359375, -0.0001938343048095703, -5.1975250244140625e-05, 8.988380432128906e-05, 0.00023174285888671875, 0.00037360191345214844, 0.0005154609680175781, 0.0006573200225830078, 0.0007991790771484375, 0.0009410381317138672, 0.0010828971862792969, 0.0012247562408447266, 0.0013666152954101562, 0.001508474349975586, 0.0016503334045410156, 0.0017921924591064453, 0.001934051513671875, 0.0020759105682373047, 0.0022177696228027344, 0.002359628677368164, 0.0025014877319335938, 0.0026433467864990234, 0.002785205841064453, 0.002927064895629883, 0.0030689239501953125, 0.003210783004760742, 0.003352642059326172, 0.0034945011138916016, 0.0036363601684570312, 0.003778219223022461, 0.003920078277587891, 0.00406193733215332, 0.00420379638671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 7.0, 6.0, 6.0, 17.0, 17.0, 17.0, 32.0, 40.0, 39.0, 54.0, 53.0, 88.0, 98.0, 77.0, 92.0, 83.0, 53.0, 45.0, 33.0, 35.0, 29.0, 24.0, 13.0, 5.0, 11.0, 9.0, 3.0, 3.0, 5.0, 5.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3909759521484375e-06, -7.0445239543914795e-06, -6.6980719566345215e-06, -6.3516199588775635e-06, -6.0051679611206055e-06, -5.6587159633636475e-06, -5.3122639656066895e-06, -4.9658119678497314e-06, -4.6193599700927734e-06, -4.2729079723358154e-06, -3.926455974578857e-06, -3.5800039768218994e-06, -3.2335519790649414e-06, -2.8870999813079834e-06, -2.5406479835510254e-06, -2.1941959857940674e-06, -1.8477439880371094e-06, -1.5012919902801514e-06, -1.1548399925231934e-06, -8.083879947662354e-07, -4.6193599700927734e-07, -1.1548399925231934e-07, 2.3096799850463867e-07, 5.774199962615967e-07, 9.238719940185547e-07, 1.2703239917755127e-06, 1.6167759895324707e-06, 1.9632279872894287e-06, 2.3096799850463867e-06, 2.6561319828033447e-06, 3.0025839805603027e-06, 3.3490359783172607e-06, 3.6954879760742188e-06, 4.041939973831177e-06, 4.388391971588135e-06, 4.734843969345093e-06, 5.081295967102051e-06, 5.427747964859009e-06, 5.774199962615967e-06, 6.120651960372925e-06, 6.467103958129883e-06, 6.813555955886841e-06, 7.160007953643799e-06, 7.506459951400757e-06, 7.852911949157715e-06, 8.199363946914673e-06, 8.545815944671631e-06, 8.892267942428589e-06, 9.238719940185547e-06, 9.585171937942505e-06, 9.931623935699463e-06, 1.0278075933456421e-05, 1.0624527931213379e-05, 1.0970979928970337e-05, 1.1317431926727295e-05, 1.1663883924484253e-05, 1.2010335922241211e-05, 1.2356787919998169e-05, 1.2703239917755127e-05, 1.3049691915512085e-05, 1.3396143913269043e-05, 1.3742595911026001e-05, 1.4089047908782959e-05, 1.4435499906539917e-05, 1.4781951904296875e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 3.0, 13.0, 9.0, 8.0, 14.0, 26.0, 37.0, 58.0, 127.0, 230.0, 803.0, 4769.0, 79809.0, 854162.0, 101417.0, 5606.0, 902.0, 266.0, 112.0, 46.0, 46.0, 25.0, 24.0, 21.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0201263427734375, -0.019629836082458496, -0.019133329391479492, -0.01863682270050049, -0.018140316009521484, -0.01764380931854248, -0.017147302627563477, -0.016650795936584473, -0.01615428924560547, -0.015657782554626465, -0.015161275863647461, -0.014664769172668457, -0.014168262481689453, -0.01367175579071045, -0.013175249099731445, -0.012678742408752441, -0.012182235717773438, -0.011685729026794434, -0.01118922233581543, -0.010692715644836426, -0.010196208953857422, -0.009699702262878418, -0.009203195571899414, -0.00870668888092041, -0.008210182189941406, -0.007713675498962402, -0.0072171688079833984, -0.0067206621170043945, -0.006224155426025391, -0.005727648735046387, -0.005231142044067383, -0.004734635353088379, -0.004238128662109375, -0.003741621971130371, -0.003245115280151367, -0.0027486085891723633, -0.0022521018981933594, -0.0017555952072143555, -0.0012590885162353516, -0.0007625818252563477, -0.00026607513427734375, 0.00023043155670166016, 0.0007269382476806641, 0.001223444938659668, 0.0017199516296386719, 0.0022164583206176758, 0.0027129650115966797, 0.0032094717025756836, 0.0037059783935546875, 0.004202485084533691, 0.004698991775512695, 0.005195498466491699, 0.005692005157470703, 0.006188511848449707, 0.006685018539428711, 0.007181525230407715, 0.007678031921386719, 0.008174538612365723, 0.008671045303344727, 0.00916755199432373, 0.009664058685302734, 0.010160565376281738, 0.010657072067260742, 0.011153578758239746, 0.01165008544921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 7.0, 6.0, 10.0, 7.0, 16.0, 32.0, 31.0, 43.0, 56.0, 54.0, 78.0, 118.0, 96.0, 85.0, 82.0, 73.0, 51.0, 35.0, 32.0, 29.0, 19.0, 12.0, 10.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0023403167724609375, -0.0022810548543930054, -0.0022217929363250732, -0.002162531018257141, -0.002103269100189209, -0.002044007182121277, -0.0019847452640533447, -0.0019254833459854126, -0.0018662214279174805, -0.0018069595098495483, -0.0017476975917816162, -0.001688435673713684, -0.001629173755645752, -0.0015699118375778198, -0.0015106499195098877, -0.0014513880014419556, -0.0013921260833740234, -0.0013328641653060913, -0.0012736022472381592, -0.001214340329170227, -0.001155078411102295, -0.0010958164930343628, -0.0010365545749664307, -0.0009772926568984985, -0.0009180307388305664, -0.0008587688207626343, -0.0007995069026947021, -0.00074024498462677, -0.0006809830665588379, -0.0006217211484909058, -0.0005624592304229736, -0.0005031973123550415, -0.0004439353942871094, -0.00038467347621917725, -0.0003254115581512451, -0.000266149640083313, -0.00020688772201538086, -0.00014762580394744873, -8.83638858795166e-05, -2.9101967811584473e-05, 3.0159950256347656e-05, 8.942186832427979e-05, 0.00014868378639221191, 0.00020794570446014404, 0.00026720762252807617, 0.0003264695405960083, 0.00038573145866394043, 0.00044499337673187256, 0.0005042552947998047, 0.0005635172128677368, 0.0006227791309356689, 0.0006820410490036011, 0.0007413029670715332, 0.0008005648851394653, 0.0008598268032073975, 0.0009190887212753296, 0.0009783506393432617, 0.0010376125574111938, 0.001096874475479126, 0.001156136393547058, 0.0012153983116149902, 0.0012746602296829224, 0.0013339221477508545, 0.0013931840658187866, 0.0014524459838867188]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 0.0, 2.0, 1.0, 9.0, 16.0, 18.0, 29.0, 47.0, 55.0, 92.0, 143.0, 160.0, 124.0, 108.0, 72.0, 39.0, 33.0, 20.0, 16.0, 10.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3354811668395996, -0.3222896456718445, -0.30909812450408936, -0.29590660333633423, -0.2827151119709015, -0.26952359080314636, -0.25633206963539124, -0.2431405484676361, -0.22994902729988098, -0.21675750613212585, -0.20356599986553192, -0.1903744786977768, -0.17718295753002167, -0.16399145126342773, -0.1507999300956726, -0.13760840892791748, -0.12441690266132355, -0.11122538894414902, -0.09803386777639389, -0.08484235405921936, -0.07165083289146423, -0.0584593191742897, -0.04526780545711517, -0.032076284289360046, -0.018884770572185516, -0.0056932540610432625, 0.007498262450098991, 0.02068977802991867, 0.0338812954723835, 0.04707281291484833, 0.06026432663202286, 0.07345584779977798, 0.08664736151695251, 0.09983887523412704, 0.11303039640188217, 0.1262219101190567, 0.13941343128681183, 0.15260493755340576, 0.1657964587211609, 0.17898797988891602, 0.19217950105667114, 0.20537102222442627, 0.2185625284910202, 0.23175404965877533, 0.24494557082653046, 0.2581370770931244, 0.2713285982608795, 0.28452011942863464, 0.2977116107940674, 0.3109031319618225, 0.32409465312957764, 0.33728617429733276, 0.3504776656627655, 0.36366918683052063, 0.37686070799827576, 0.3900522291660309, 0.403243750333786, 0.41643527150154114, 0.42962679266929626, 0.442818284034729, 0.45600980520248413, 0.46920132637023926, 0.4823928475379944, 0.4955843687057495, 0.5087758898735046]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 12.0, 8.0, 13.0, 12.0, 21.0, 20.0, 37.0, 23.0, 44.0, 43.0, 47.0, 46.0, 50.0, 57.0, 68.0, 81.0, 67.0, 48.0, 56.0, 43.0, 46.0, 34.0, 32.0, 26.0, 19.0, 14.0, 6.0, 12.0, 7.0, 2.0, 2.0, 6.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.29134315252304077, -0.2829345166683197, -0.27452588081359863, -0.2661172151565552, -0.2577085793018341, -0.24929994344711304, -0.24089130759239197, -0.2324826568365097, -0.22407400608062744, -0.21566537022590637, -0.2072567194700241, -0.19884808361530304, -0.19043943285942078, -0.1820307970046997, -0.17362216114997864, -0.16521351039409637, -0.1568048745393753, -0.14839623868465424, -0.13998758792877197, -0.1315789520740509, -0.12317030131816864, -0.11476166546344757, -0.1063530221581459, -0.09794437885284424, -0.08953573554754257, -0.0811270922422409, -0.07271844893693924, -0.06430980563163757, -0.055901166051626205, -0.04749252274632454, -0.03908388316631317, -0.030675239861011505, -0.022266611456871033, -0.013857969082891941, -0.005449326708912849, 0.0029593147337436676, 0.011367958039045334, 0.019776601344347, 0.028185240924358368, 0.036593884229660034, 0.0450025275349617, 0.05341117084026337, 0.06181981414556503, 0.0702284574508667, 0.07863709330558777, 0.08704574406147003, 0.0954543799161911, 0.10386302322149277, 0.11227166652679443, 0.1206803098320961, 0.12908895313739777, 0.13749758899211884, 0.1459062397480011, 0.15431487560272217, 0.16272351145744324, 0.1711321622133255, 0.17954081296920776, 0.18794944882392883, 0.1963580995798111, 0.20476673543453217, 0.21317538619041443, 0.2215840220451355, 0.22999265789985657, 0.23840130865573883, 0.2468099445104599]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 7.0, 5.0, 7.0, 7.0, 10.0, 17.0, 27.0, 53.0, 91.0, 321.0, 1170.0, 6078.0, 52803.0, 753766.0, 215472.0, 15297.0, 2466.0, 594.0, 210.0, 71.0, 38.0, 19.0, 10.0, 8.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.301025390625, -0.28932952880859375, -0.2776336669921875, -0.26593780517578125, -0.254241943359375, -0.24254608154296875, -0.2308502197265625, -0.21915435791015625, -0.20745849609375, -0.19576263427734375, -0.1840667724609375, -0.17237091064453125, -0.160675048828125, -0.14897918701171875, -0.1372833251953125, -0.12558746337890625, -0.1138916015625, -0.10219573974609375, -0.0904998779296875, -0.07880401611328125, -0.067108154296875, -0.05541229248046875, -0.0437164306640625, -0.03202056884765625, -0.02032470703125, -0.00862884521484375, 0.0030670166015625, 0.01476287841796875, 0.026458740234375, 0.03815460205078125, 0.0498504638671875, 0.06154632568359375, 0.0732421875, 0.08493804931640625, 0.0966339111328125, 0.10832977294921875, 0.120025634765625, 0.13172149658203125, 0.1434173583984375, 0.15511322021484375, 0.16680908203125, 0.17850494384765625, 0.1902008056640625, 0.20189666748046875, 0.213592529296875, 0.22528839111328125, 0.2369842529296875, 0.24868011474609375, 0.2603759765625, 0.27207183837890625, 0.2837677001953125, 0.29546356201171875, 0.307159423828125, 0.31885528564453125, 0.3305511474609375, 0.34224700927734375, 0.35394287109375, 0.36563873291015625, 0.3773345947265625, 0.38903045654296875, 0.400726318359375, 0.41242218017578125, 0.4241180419921875, 0.43581390380859375, 0.447509765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 7.0, 10.0, 21.0, 12.0, 46.0, 39.0, 52.0, 64.0, 70.0, 84.0, 85.0, 88.0, 88.0, 69.0, 63.0, 61.0, 53.0, 20.0, 32.0, 19.0, 8.0, 8.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58544921875, -0.5610122680664062, -0.5365753173828125, -0.5121383666992188, -0.487701416015625, -0.46326446533203125, -0.4388275146484375, -0.41439056396484375, -0.38995361328125, -0.36551666259765625, -0.3410797119140625, -0.31664276123046875, -0.292205810546875, -0.26776885986328125, -0.2433319091796875, -0.21889495849609375, -0.1944580078125, -0.17002105712890625, -0.1455841064453125, -0.12114715576171875, -0.096710205078125, -0.07227325439453125, -0.0478363037109375, -0.02339935302734375, 0.00103759765625, 0.02547454833984375, 0.0499114990234375, 0.07434844970703125, 0.098785400390625, 0.12322235107421875, 0.1476593017578125, 0.17209625244140625, 0.196533203125, 0.22097015380859375, 0.2454071044921875, 0.26984405517578125, 0.294281005859375, 0.31871795654296875, 0.3431549072265625, 0.36759185791015625, 0.39202880859375, 0.41646575927734375, 0.4409027099609375, 0.46533966064453125, 0.489776611328125, 0.5142135620117188, 0.5386505126953125, 0.5630874633789062, 0.5875244140625, 0.6119613647460938, 0.6363983154296875, 0.6608352661132812, 0.685272216796875, 0.7097091674804688, 0.7341461181640625, 0.7585830688476562, 0.78302001953125, 0.8074569702148438, 0.8318939208984375, 0.8563308715820312, 0.880767822265625, 0.9052047729492188, 0.9296417236328125, 0.9540786743164062, 0.978515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 5.0, 9.0, 14.0, 7.0, 16.0, 24.0, 38.0, 40.0, 47.0, 48.0, 63.0, 86.0, 107.0, 104.0, 158.0, 218.0, 359.0, 1230.0, 13975.0, 839952.0, 185668.0, 4472.0, 723.0, 288.0, 187.0, 136.0, 94.0, 94.0, 73.0, 67.0, 51.0, 44.0, 40.0, 38.0, 19.0, 16.0, 10.0, 6.0, 7.0, 3.0, 3.0, 5.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52734375, -0.5090408325195312, -0.4907379150390625, -0.47243499755859375, -0.454132080078125, -0.43582916259765625, -0.4175262451171875, -0.39922332763671875, -0.38092041015625, -0.36261749267578125, -0.3443145751953125, -0.32601165771484375, -0.307708740234375, -0.28940582275390625, -0.2711029052734375, -0.25279998779296875, -0.2344970703125, -0.21619415283203125, -0.1978912353515625, -0.17958831787109375, -0.161285400390625, -0.14298248291015625, -0.1246795654296875, -0.10637664794921875, -0.08807373046875, -0.06977081298828125, -0.0514678955078125, -0.03316497802734375, -0.014862060546875, 0.00344085693359375, 0.0217437744140625, 0.04004669189453125, 0.058349609375, 0.07665252685546875, 0.0949554443359375, 0.11325836181640625, 0.131561279296875, 0.14986419677734375, 0.1681671142578125, 0.18647003173828125, 0.20477294921875, 0.22307586669921875, 0.2413787841796875, 0.25968170166015625, 0.277984619140625, 0.29628753662109375, 0.3145904541015625, 0.33289337158203125, 0.3511962890625, 0.36949920654296875, 0.3878021240234375, 0.40610504150390625, 0.424407958984375, 0.44271087646484375, 0.4610137939453125, 0.47931671142578125, 0.49761962890625, 0.5159225463867188, 0.5342254638671875, 0.5525283813476562, 0.570831298828125, 0.5891342163085938, 0.6074371337890625, 0.6257400512695312, 0.64404296875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 2.0, 6.0, 4.0, 15.0, 23.0, 14.0, 19.0, 22.0, 42.0, 32.0, 31.0, 42.0, 31.0, 45.0, 51.0, 57.0, 37.0, 41.0, 48.0, 44.0, 46.0, 48.0, 42.0, 31.0, 33.0, 35.0, 34.0, 29.0, 20.0, 15.0, 13.0, 15.0, 9.0, 9.0, 5.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.412109375, -0.3974761962890625, -0.382843017578125, -0.3682098388671875, -0.35357666015625, -0.3389434814453125, -0.324310302734375, -0.3096771240234375, -0.2950439453125, -0.2804107666015625, -0.265777587890625, -0.2511444091796875, -0.23651123046875, -0.2218780517578125, -0.207244873046875, -0.1926116943359375, -0.177978515625, -0.1633453369140625, -0.148712158203125, -0.1340789794921875, -0.11944580078125, -0.1048126220703125, -0.090179443359375, -0.0755462646484375, -0.0609130859375, -0.0462799072265625, -0.031646728515625, -0.0170135498046875, -0.00238037109375, 0.0122528076171875, 0.026885986328125, 0.0415191650390625, 0.05615234375, 0.0707855224609375, 0.085418701171875, 0.1000518798828125, 0.11468505859375, 0.1293182373046875, 0.143951416015625, 0.1585845947265625, 0.1732177734375, 0.1878509521484375, 0.202484130859375, 0.2171173095703125, 0.23175048828125, 0.2463836669921875, 0.261016845703125, 0.2756500244140625, 0.290283203125, 0.3049163818359375, 0.319549560546875, 0.3341827392578125, 0.34881591796875, 0.3634490966796875, 0.378082275390625, 0.3927154541015625, 0.4073486328125, 0.4219818115234375, 0.436614990234375, 0.4512481689453125, 0.46588134765625, 0.4805145263671875, 0.495147705078125, 0.5097808837890625, 0.5244140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 6.0, 7.0, 10.0, 8.0, 16.0, 15.0, 31.0, 43.0, 68.0, 91.0, 298.0, 1041.0, 6013.0, 99939.0, 915062.0, 22575.0, 2371.0, 518.0, 168.0, 80.0, 60.0, 29.0, 22.0, 23.0, 6.0, 13.0, 4.0, 9.0, 6.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193359375, -0.18697166442871094, -0.18058395385742188, -0.1741962432861328, -0.16780853271484375, -0.1614208221435547, -0.15503311157226562, -0.14864540100097656, -0.1422576904296875, -0.13586997985839844, -0.12948226928710938, -0.12309455871582031, -0.11670684814453125, -0.11031913757324219, -0.10393142700195312, -0.09754371643066406, -0.091156005859375, -0.08476829528808594, -0.07838058471679688, -0.07199287414550781, -0.06560516357421875, -0.05921745300292969, -0.052829742431640625, -0.04644203186035156, -0.0400543212890625, -0.03366661071777344, -0.027278900146484375, -0.020891189575195312, -0.01450347900390625, -0.008115768432617188, -0.001728057861328125, 0.0046596527099609375, 0.01104736328125, 0.017435073852539062, 0.023822784423828125, 0.030210494995117188, 0.03659820556640625, 0.04298591613769531, 0.049373626708984375, 0.05576133728027344, 0.0621490478515625, 0.06853675842285156, 0.07492446899414062, 0.08131217956542969, 0.08769989013671875, 0.09408760070800781, 0.10047531127929688, 0.10686302185058594, 0.113250732421875, 0.11963844299316406, 0.12602615356445312, 0.1324138641357422, 0.13880157470703125, 0.1451892852783203, 0.15157699584960938, 0.15796470642089844, 0.1643524169921875, 0.17074012756347656, 0.17712783813476562, 0.1835155487060547, 0.18990325927734375, 0.1962909698486328, 0.20267868041992188, 0.20906639099121094, 0.2154541015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 4.0, 12.0, 8.0, 7.0, 16.0, 8.0, 22.0, 28.0, 45.0, 79.0, 119.0, 195.0, 156.0, 117.0, 45.0, 35.0, 27.0, 11.0, 11.0, 12.0, 12.0, 2.0, 2.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3768672943115234e-05, -1.3319775462150574e-05, -1.2870877981185913e-05, -1.2421980500221252e-05, -1.1973083019256592e-05, -1.1524185538291931e-05, -1.107528805732727e-05, -1.062639057636261e-05, -1.017749309539795e-05, -9.728595614433289e-06, -9.279698133468628e-06, -8.830800652503967e-06, -8.381903171539307e-06, -7.933005690574646e-06, -7.484108209609985e-06, -7.035210728645325e-06, -6.586313247680664e-06, -6.137415766716003e-06, -5.688518285751343e-06, -5.239620804786682e-06, -4.7907233238220215e-06, -4.341825842857361e-06, -3.8929283618927e-06, -3.4440308809280396e-06, -2.995133399963379e-06, -2.5462359189987183e-06, -2.0973384380340576e-06, -1.648440957069397e-06, -1.1995434761047363e-06, -7.506459951400757e-07, -3.0174851417541504e-07, 1.471489667892456e-07, 5.960464477539062e-07, 1.044943928718567e-06, 1.4938414096832275e-06, 1.942738890647888e-06, 2.391636371612549e-06, 2.8405338525772095e-06, 3.28943133354187e-06, 3.7383288145065308e-06, 4.187226295471191e-06, 4.636123776435852e-06, 5.085021257400513e-06, 5.533918738365173e-06, 5.982816219329834e-06, 6.431713700294495e-06, 6.880611181259155e-06, 7.329508662223816e-06, 7.778406143188477e-06, 8.227303624153137e-06, 8.676201105117798e-06, 9.125098586082458e-06, 9.573996067047119e-06, 1.002289354801178e-05, 1.047179102897644e-05, 1.0920688509941101e-05, 1.1369585990905762e-05, 1.1818483471870422e-05, 1.2267380952835083e-05, 1.2716278433799744e-05, 1.3165175914764404e-05, 1.3614073395729065e-05, 1.4062970876693726e-05, 1.4511868357658386e-05, 1.4960765838623047e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 4.0, 7.0, 12.0, 12.0, 16.0, 38.0, 50.0, 82.0, 159.0, 366.0, 1070.0, 5053.0, 59917.0, 949820.0, 27222.0, 3289.0, 777.0, 302.0, 151.0, 65.0, 41.0, 23.0, 10.0, 10.0, 15.0, 5.0, 6.0, 6.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.269775390625, -0.2616920471191406, -0.25360870361328125, -0.24552536010742188, -0.2374420166015625, -0.22935867309570312, -0.22127532958984375, -0.21319198608398438, -0.205108642578125, -0.19702529907226562, -0.18894195556640625, -0.18085861206054688, -0.1727752685546875, -0.16469192504882812, -0.15660858154296875, -0.14852523803710938, -0.14044189453125, -0.13235855102539062, -0.12427520751953125, -0.11619186401367188, -0.1081085205078125, -0.10002517700195312, -0.09194183349609375, -0.08385848999023438, -0.075775146484375, -0.06769180297851562, -0.05960845947265625, -0.051525115966796875, -0.0434417724609375, -0.035358428955078125, -0.02727508544921875, -0.019191741943359375, -0.0111083984375, -0.003025054931640625, 0.00505828857421875, 0.013141632080078125, 0.0212249755859375, 0.029308319091796875, 0.03739166259765625, 0.045475006103515625, 0.053558349609375, 0.061641693115234375, 0.06972503662109375, 0.07780838012695312, 0.0858917236328125, 0.09397506713867188, 0.10205841064453125, 0.11014175415039062, 0.11822509765625, 0.12630844116210938, 0.13439178466796875, 0.14247512817382812, 0.1505584716796875, 0.15864181518554688, 0.16672515869140625, 0.17480850219726562, 0.182891845703125, 0.19097518920898438, 0.19905853271484375, 0.20714187622070312, 0.2152252197265625, 0.22330856323242188, 0.23139190673828125, 0.23947525024414062, 0.24755859375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 7.0, 5.0, 14.0, 17.0, 25.0, 32.0, 22.0, 54.0, 80.0, 159.0, 204.0, 149.0, 76.0, 40.0, 33.0, 17.0, 15.0, 8.0, 6.0, 5.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05029296875, -0.04857444763183594, -0.046855926513671875, -0.04513740539550781, -0.04341888427734375, -0.04170036315917969, -0.039981842041015625, -0.03826332092285156, -0.0365447998046875, -0.03482627868652344, -0.033107757568359375, -0.03138923645019531, -0.02967071533203125, -0.027952194213867188, -0.026233673095703125, -0.024515151977539062, -0.022796630859375, -0.021078109741210938, -0.019359588623046875, -0.017641067504882812, -0.01592254638671875, -0.014204025268554688, -0.012485504150390625, -0.010766983032226562, -0.0090484619140625, -0.0073299407958984375, -0.005611419677734375, -0.0038928985595703125, -0.00217437744140625, -0.0004558563232421875, 0.001262664794921875, 0.0029811859130859375, 0.00469970703125, 0.0064182281494140625, 0.008136749267578125, 0.009855270385742188, 0.01157379150390625, 0.013292312622070312, 0.015010833740234375, 0.016729354858398438, 0.0184478759765625, 0.020166397094726562, 0.021884918212890625, 0.023603439331054688, 0.02532196044921875, 0.027040481567382812, 0.028759002685546875, 0.030477523803710938, 0.032196044921875, 0.03391456604003906, 0.035633087158203125, 0.03735160827636719, 0.03907012939453125, 0.04078865051269531, 0.042507171630859375, 0.04422569274902344, 0.0459442138671875, 0.04766273498535156, 0.049381256103515625, 0.05109977722167969, 0.05281829833984375, 0.05453681945800781, 0.056255340576171875, 0.05797386169433594, 0.0596923828125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 8.0, 7.0, 14.0, 33.0, 48.0, 76.0, 146.0, 183.0, 178.0, 121.0, 81.0, 50.0, 25.0, 18.0, 9.0, 8.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4034570455551147, -1.369112253189087, -1.334767460823059, -1.3004226684570312, -1.2660778760910034, -1.2317330837249756, -1.1973882913589478, -1.16304349899292, -1.128698706626892, -1.0943539142608643, -1.0600091218948364, -1.0256643295288086, -0.9913195371627808, -0.9569747447967529, -0.9226299524307251, -0.8882851600646973, -0.8539403676986694, -0.8195955753326416, -0.7852507829666138, -0.7509059906005859, -0.7165611982345581, -0.6822164058685303, -0.6478716135025024, -0.6135268211364746, -0.5791820287704468, -0.544837236404419, -0.5104924440383911, -0.4761476516723633, -0.44180285930633545, -0.4074580669403076, -0.3731132745742798, -0.33876848220825195, -0.30442357063293457, -0.27007877826690674, -0.2357339859008789, -0.20138919353485107, -0.16704440116882324, -0.1326996088027954, -0.09835481643676758, -0.06401002407073975, -0.029665231704711914, 0.004679560661315918, 0.03902435302734375, 0.07336914539337158, 0.10771393775939941, 0.14205873012542725, 0.17640352249145508, 0.2107483148574829, 0.24509310722351074, 0.2794378995895386, 0.3137826919555664, 0.34812748432159424, 0.38247227668762207, 0.4168170690536499, 0.45116186141967773, 0.48550665378570557, 0.5198514461517334, 0.5541962385177612, 0.5885410308837891, 0.6228858232498169, 0.6572306156158447, 0.6915754079818726, 0.7259202003479004, 0.7602649927139282, 0.794609785079956]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 11.0, 15.0, 6.0, 9.0, 19.0, 14.0, 27.0, 29.0, 24.0, 30.0, 27.0, 36.0, 37.0, 57.0, 38.0, 51.0, 46.0, 50.0, 46.0, 41.0, 38.0, 47.0, 39.0, 42.0, 30.0, 24.0, 22.0, 32.0, 19.0, 24.0, 20.0, 15.0, 5.0, 7.0, 7.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.768673837184906, -0.7442319989204407, -0.7197902202606201, -0.6953483819961548, -0.6709065437316895, -0.6464647650718689, -0.6220229268074036, -0.597581148147583, -0.5731393098831177, -0.5486974716186523, -0.5242556929588318, -0.49981385469436646, -0.4753720462322235, -0.45093023777008057, -0.42648839950561523, -0.4020465910434723, -0.37760478258132935, -0.3531629741191864, -0.32872116565704346, -0.3042793273925781, -0.2798375189304352, -0.25539571046829224, -0.2309538871049881, -0.20651206374168396, -0.18207025527954102, -0.15762844681739807, -0.13318662345409393, -0.10874480754137039, -0.08430299162864685, -0.05986117571592331, -0.03541935980319977, -0.01097753643989563, 0.01346433162689209, 0.03790614753961563, 0.06234796345233917, 0.08678977936506271, 0.11123159527778625, 0.1356734037399292, 0.16011522710323334, 0.18455705046653748, 0.20899885892868042, 0.23344066739082336, 0.2578824758529663, 0.28232431411743164, 0.3067661225795746, 0.33120793104171753, 0.35564976930618286, 0.3800915777683258, 0.40453338623046875, 0.4289751946926117, 0.45341700315475464, 0.47785884141921997, 0.5023006200790405, 0.5267424583435059, 0.5511842966079712, 0.5756261348724365, 0.6000679135322571, 0.6245097517967224, 0.648951530456543, 0.6733933687210083, 0.6978352069854736, 0.7222769856452942, 0.7467188239097595, 0.7711606025695801, 0.7956024408340454]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 6.0, 6.0, 17.0, 18.0, 36.0, 34.0, 56.0, 100.0, 132.0, 247.0, 411.0, 813.0, 1611.0, 3838.0, 11252.0, 63542.0, 947314.0, 2787360.0, 336323.0, 29014.0, 7048.0, 2541.0, 1145.0, 570.0, 302.0, 200.0, 118.0, 69.0, 44.0, 30.0, 28.0, 19.0, 15.0, 7.0, 6.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5068359375, -0.48827362060546875, -0.4697113037109375, -0.45114898681640625, -0.432586669921875, -0.41402435302734375, -0.3954620361328125, -0.37689971923828125, -0.35833740234375, -0.33977508544921875, -0.3212127685546875, -0.30265045166015625, -0.284088134765625, -0.26552581787109375, -0.2469635009765625, -0.22840118408203125, -0.2098388671875, -0.19127655029296875, -0.1727142333984375, -0.15415191650390625, -0.135589599609375, -0.11702728271484375, -0.0984649658203125, -0.07990264892578125, -0.06134033203125, -0.04277801513671875, -0.0242156982421875, -0.00565338134765625, 0.012908935546875, 0.03147125244140625, 0.0500335693359375, 0.06859588623046875, 0.087158203125, 0.10572052001953125, 0.1242828369140625, 0.14284515380859375, 0.161407470703125, 0.17996978759765625, 0.1985321044921875, 0.21709442138671875, 0.23565673828125, 0.25421905517578125, 0.2727813720703125, 0.29134368896484375, 0.309906005859375, 0.32846832275390625, 0.3470306396484375, 0.36559295654296875, 0.3841552734375, 0.40271759033203125, 0.4212799072265625, 0.43984222412109375, 0.458404541015625, 0.47696685791015625, 0.4955291748046875, 0.5140914916992188, 0.53265380859375, 0.5512161254882812, 0.5697784423828125, 0.5883407592773438, 0.606903076171875, 0.6254653930664062, 0.6440277099609375, 0.6625900268554688, 0.68115234375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 3.0, 8.0, 7.0, 15.0, 15.0, 7.0, 15.0, 19.0, 30.0, 30.0, 35.0, 48.0, 35.0, 40.0, 46.0, 54.0, 51.0, 57.0, 50.0, 49.0, 52.0, 48.0, 44.0, 28.0, 45.0, 30.0, 30.0, 22.0, 19.0, 15.0, 8.0, 10.0, 4.0, 12.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0], "bins": [-0.3369140625, -0.32721710205078125, -0.3175201416015625, -0.30782318115234375, -0.298126220703125, -0.28842926025390625, -0.2787322998046875, -0.26903533935546875, -0.25933837890625, -0.24964141845703125, -0.2399444580078125, -0.23024749755859375, -0.220550537109375, -0.21085357666015625, -0.2011566162109375, -0.19145965576171875, -0.1817626953125, -0.17206573486328125, -0.1623687744140625, -0.15267181396484375, -0.142974853515625, -0.13327789306640625, -0.1235809326171875, -0.11388397216796875, -0.10418701171875, -0.09449005126953125, -0.0847930908203125, -0.07509613037109375, -0.065399169921875, -0.05570220947265625, -0.0460052490234375, -0.03630828857421875, -0.026611328125, -0.01691436767578125, -0.0072174072265625, 0.00247955322265625, 0.012176513671875, 0.02187347412109375, 0.0315704345703125, 0.04126739501953125, 0.05096435546875, 0.06066131591796875, 0.0703582763671875, 0.08005523681640625, 0.089752197265625, 0.09944915771484375, 0.1091461181640625, 0.11884307861328125, 0.1285400390625, 0.13823699951171875, 0.1479339599609375, 0.15763092041015625, 0.167327880859375, 0.17702484130859375, 0.1867218017578125, 0.19641876220703125, 0.20611572265625, 0.21581268310546875, 0.2255096435546875, 0.23520660400390625, 0.244903564453125, 0.25460052490234375, 0.2642974853515625, 0.27399444580078125, 0.28369140625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 15.0, 32.0, 49.0, 139.0, 259.0, 630.0, 2992.0, 3780664.0, 406268.0, 2195.0, 564.0, 239.0, 102.0, 72.0, 30.0, 16.0, 8.0, 3.0, 5.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.720703125, -1.638458251953125, -1.55621337890625, -1.473968505859375, -1.3917236328125, -1.309478759765625, -1.22723388671875, -1.144989013671875, -1.062744140625, -0.980499267578125, -0.89825439453125, -0.816009521484375, -0.7337646484375, -0.651519775390625, -0.56927490234375, -0.487030029296875, -0.40478515625, -0.322540283203125, -0.24029541015625, -0.158050537109375, -0.0758056640625, 0.006439208984375, 0.08868408203125, 0.170928955078125, 0.253173828125, 0.335418701171875, 0.41766357421875, 0.499908447265625, 0.5821533203125, 0.664398193359375, 0.74664306640625, 0.828887939453125, 0.9111328125, 0.993377685546875, 1.07562255859375, 1.157867431640625, 1.2401123046875, 1.322357177734375, 1.40460205078125, 1.486846923828125, 1.569091796875, 1.651336669921875, 1.73358154296875, 1.815826416015625, 1.8980712890625, 1.980316162109375, 2.06256103515625, 2.144805908203125, 2.22705078125, 2.309295654296875, 2.39154052734375, 2.473785400390625, 2.5560302734375, 2.638275146484375, 2.72052001953125, 2.802764892578125, 2.885009765625, 2.967254638671875, 3.04949951171875, 3.131744384765625, 3.2139892578125, 3.296234130859375, 3.37847900390625, 3.460723876953125, 3.54296875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 8.0, 18.0, 24.0, 45.0, 65.0, 152.0, 417.0, 1401.0, 1289.0, 386.0, 123.0, 61.0, 38.0, 28.0, 10.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.435302734375, -0.42492103576660156, -0.4145393371582031, -0.4041576385498047, -0.39377593994140625, -0.3833942413330078, -0.3730125427246094, -0.36263084411621094, -0.3522491455078125, -0.34186744689941406, -0.3314857482910156, -0.3211040496826172, -0.31072235107421875, -0.3003406524658203, -0.2899589538574219, -0.27957725524902344, -0.269195556640625, -0.25881385803222656, -0.24843215942382812, -0.2380504608154297, -0.22766876220703125, -0.2172870635986328, -0.20690536499023438, -0.19652366638183594, -0.1861419677734375, -0.17576026916503906, -0.16537857055664062, -0.1549968719482422, -0.14461517333984375, -0.1342334747314453, -0.12385177612304688, -0.11347007751464844, -0.10308837890625, -0.09270668029785156, -0.08232498168945312, -0.07194328308105469, -0.06156158447265625, -0.05117988586425781, -0.040798187255859375, -0.030416488647460938, -0.0200347900390625, -0.009653091430664062, 0.000728607177734375, 0.011110305786132812, 0.02149200439453125, 0.03187370300292969, 0.042255401611328125, 0.05263710021972656, 0.063018798828125, 0.07340049743652344, 0.08378219604492188, 0.09416389465332031, 0.10454559326171875, 0.11492729187011719, 0.12530899047851562, 0.13569068908691406, 0.1460723876953125, 0.15645408630371094, 0.16683578491210938, 0.1772174835205078, 0.18759918212890625, 0.1979808807373047, 0.20836257934570312, 0.21874427795410156, 0.2291259765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 13.0, 5.0, 14.0, 11.0, 27.0, 35.0, 50.0, 67.0, 65.0, 106.0, 112.0, 107.0, 100.0, 70.0, 49.0, 54.0, 28.0, 30.0, 13.0, 15.0, 9.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.455891489982605, -0.4389473795890808, -0.42200329899787903, -0.40505921840667725, -0.3881151080131531, -0.3711709976196289, -0.3542269170284271, -0.33728283643722534, -0.32033872604370117, -0.303394615650177, -0.2864505350589752, -0.26950645446777344, -0.25256234407424927, -0.2356182485818863, -0.21867415308952332, -0.20173005759716034, -0.18478596210479736, -0.1678418666124344, -0.1508977711200714, -0.13395367562770844, -0.11700958013534546, -0.10006548464298248, -0.0831213891506195, -0.06617729365825653, -0.049233198165893555, -0.03228910267353058, -0.015345007181167603, 0.0015990883111953735, 0.01854318380355835, 0.035487279295921326, 0.0524313747882843, 0.06937547028064728, 0.08631950616836548, 0.10326360166072845, 0.12020769715309143, 0.1371517926454544, 0.15409588813781738, 0.17103998363018036, 0.18798407912254333, 0.2049281746149063, 0.2218722701072693, 0.23881636559963226, 0.25576046109199524, 0.272704541683197, 0.2896486520767212, 0.30659276247024536, 0.32353684306144714, 0.3404809236526489, 0.3574250340461731, 0.37436914443969727, 0.39131322503089905, 0.40825730562210083, 0.425201416015625, 0.44214552640914917, 0.45908960700035095, 0.47603368759155273, 0.4929777979850769, 0.5099219083786011, 0.5268659591674805, 0.5438100695610046, 0.5607541799545288, 0.577698290348053, 0.5946424007415771, 0.6115864515304565, 0.6285305619239807]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 5.0, 3.0, 12.0, 12.0, 13.0, 15.0, 20.0, 38.0, 39.0, 41.0, 56.0, 44.0, 50.0, 44.0, 38.0, 47.0, 46.0, 46.0, 54.0, 64.0, 50.0, 41.0, 34.0, 28.0, 33.0, 24.0, 19.0, 18.0, 19.0, 14.0, 8.0, 10.0, 7.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26405179500579834, -0.2526823878288269, -0.24131295084953308, -0.22994352877140045, -0.21857410669326782, -0.2072046846151352, -0.19583526253700256, -0.18446584045886993, -0.1730964183807373, -0.16172699630260468, -0.15035757422447205, -0.13898815214633942, -0.1276187300682068, -0.11624930799007416, -0.10487988591194153, -0.0935104638338089, -0.08214104175567627, -0.07077161967754364, -0.05940219759941101, -0.04803277552127838, -0.03666335344314575, -0.025293931365013123, -0.013924509286880493, -0.0025550872087478638, 0.008814334869384766, 0.020183756947517395, 0.031553179025650024, 0.042922601103782654, 0.05429202318191528, 0.06566144526004791, 0.07703086733818054, 0.08840028941631317, 0.09976968169212341, 0.11113910377025604, 0.12250852584838867, 0.1338779479265213, 0.14524737000465393, 0.15661679208278656, 0.1679862141609192, 0.17935563623905182, 0.19072505831718445, 0.20209448039531708, 0.2134639024734497, 0.22483332455158234, 0.23620274662971497, 0.2475721687078476, 0.2589415907859802, 0.27031099796295166, 0.2816804349422455, 0.2930498719215393, 0.30441927909851074, 0.3157886862754822, 0.327158123254776, 0.3385275602340698, 0.34989696741104126, 0.3612663745880127, 0.3726358115673065, 0.38400524854660034, 0.3953746557235718, 0.4067440629005432, 0.41811349987983704, 0.42948293685913086, 0.4408523440361023, 0.45222175121307373, 0.46359118819236755]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 1.0, 5.0, 7.0, 10.0, 12.0, 23.0, 34.0, 42.0, 53.0, 79.0, 134.0, 204.0, 328.0, 577.0, 1169.0, 2380.0, 5115.0, 11869.0, 30339.0, 84611.0, 267401.0, 407193.0, 152197.0, 50669.0, 19036.0, 7879.0, 3464.0, 1640.0, 854.0, 455.0, 259.0, 149.0, 110.0, 71.0, 53.0, 35.0, 23.0, 23.0, 11.0, 12.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0821533203125, -0.0794382095336914, -0.07672309875488281, -0.07400798797607422, -0.07129287719726562, -0.06857776641845703, -0.06586265563964844, -0.06314754486083984, -0.06043243408203125, -0.057717323303222656, -0.05500221252441406, -0.05228710174560547, -0.049571990966796875, -0.04685688018798828, -0.04414176940917969, -0.041426658630371094, -0.0387115478515625, -0.035996437072753906, -0.03328132629394531, -0.03056621551513672, -0.027851104736328125, -0.02513599395751953, -0.022420883178710938, -0.019705772399902344, -0.01699066162109375, -0.014275550842285156, -0.011560440063476562, -0.008845329284667969, -0.006130218505859375, -0.0034151077270507812, -0.0006999969482421875, 0.0020151138305664062, 0.004730224609375, 0.007445335388183594, 0.010160446166992188, 0.012875556945800781, 0.015590667724609375, 0.01830577850341797, 0.021020889282226562, 0.023736000061035156, 0.02645111083984375, 0.029166221618652344, 0.03188133239746094, 0.03459644317626953, 0.037311553955078125, 0.04002666473388672, 0.04274177551269531, 0.045456886291503906, 0.0481719970703125, 0.050887107849121094, 0.05360221862792969, 0.05631732940673828, 0.059032440185546875, 0.06174755096435547, 0.06446266174316406, 0.06717777252197266, 0.06989288330078125, 0.07260799407958984, 0.07532310485839844, 0.07803821563720703, 0.08075332641601562, 0.08346843719482422, 0.08618354797363281, 0.0888986587524414, 0.09161376953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 10.0, 8.0, 8.0, 12.0, 20.0, 25.0, 44.0, 42.0, 50.0, 67.0, 60.0, 60.0, 61.0, 59.0, 74.0, 69.0, 70.0, 64.0, 42.0, 34.0, 27.0, 35.0, 16.0, 18.0, 11.0, 6.0, 4.0, 6.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.230224609375, -0.2204132080078125, -0.210601806640625, -0.2007904052734375, -0.19097900390625, -0.1811676025390625, -0.171356201171875, -0.1615447998046875, -0.1517333984375, -0.1419219970703125, -0.132110595703125, -0.1222991943359375, -0.11248779296875, -0.1026763916015625, -0.092864990234375, -0.0830535888671875, -0.0732421875, -0.0634307861328125, -0.053619384765625, -0.0438079833984375, -0.03399658203125, -0.0241851806640625, -0.014373779296875, -0.0045623779296875, 0.0052490234375, 0.0150604248046875, 0.024871826171875, 0.0346832275390625, 0.04449462890625, 0.0543060302734375, 0.064117431640625, 0.0739288330078125, 0.083740234375, 0.0935516357421875, 0.103363037109375, 0.1131744384765625, 0.12298583984375, 0.1327972412109375, 0.142608642578125, 0.1524200439453125, 0.1622314453125, 0.1720428466796875, 0.181854248046875, 0.1916656494140625, 0.20147705078125, 0.2112884521484375, 0.221099853515625, 0.2309112548828125, 0.24072265625, 0.2505340576171875, 0.260345458984375, 0.2701568603515625, 0.27996826171875, 0.2897796630859375, 0.299591064453125, 0.3094024658203125, 0.3192138671875, 0.3290252685546875, 0.338836669921875, 0.3486480712890625, 0.35845947265625, 0.3682708740234375, 0.378082275390625, 0.3878936767578125, 0.397705078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 6.0, 9.0, 13.0, 19.0, 19.0, 16.0, 36.0, 44.0, 82.0, 98.0, 153.0, 229.0, 423.0, 831.0, 1524.0, 2940.0, 6399.0, 14356.0, 36169.0, 104116.0, 321670.0, 362967.0, 124242.0, 41934.0, 16535.0, 6914.0, 3236.0, 1600.0, 823.0, 473.0, 257.0, 143.0, 88.0, 51.0, 29.0, 31.0, 23.0, 17.0, 8.0, 8.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07470703125, -0.07237815856933594, -0.07004928588867188, -0.06772041320800781, -0.06539154052734375, -0.06306266784667969, -0.060733795166015625, -0.05840492248535156, -0.0560760498046875, -0.05374717712402344, -0.051418304443359375, -0.04908943176269531, -0.04676055908203125, -0.04443168640136719, -0.042102813720703125, -0.03977394104003906, -0.037445068359375, -0.03511619567871094, -0.032787322998046875, -0.030458450317382812, -0.02812957763671875, -0.025800704956054688, -0.023471832275390625, -0.021142959594726562, -0.0188140869140625, -0.016485214233398438, -0.014156341552734375, -0.011827468872070312, -0.00949859619140625, -0.0071697235107421875, -0.004840850830078125, -0.0025119781494140625, -0.00018310546875, 0.0021457672119140625, 0.004474639892578125, 0.0068035125732421875, 0.00913238525390625, 0.011461257934570312, 0.013790130615234375, 0.016119003295898438, 0.0184478759765625, 0.020776748657226562, 0.023105621337890625, 0.025434494018554688, 0.02776336669921875, 0.030092239379882812, 0.032421112060546875, 0.03474998474121094, 0.037078857421875, 0.03940773010253906, 0.041736602783203125, 0.04406547546386719, 0.04639434814453125, 0.04872322082519531, 0.051052093505859375, 0.05338096618652344, 0.0557098388671875, 0.05803871154785156, 0.060367584228515625, 0.06269645690917969, 0.06502532958984375, 0.06735420227050781, 0.06968307495117188, 0.07201194763183594, 0.0743408203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 7.0, 5.0, 4.0, 10.0, 10.0, 16.0, 11.0, 22.0, 33.0, 32.0, 36.0, 54.0, 49.0, 72.0, 67.0, 67.0, 73.0, 68.0, 74.0, 55.0, 42.0, 44.0, 27.0, 32.0, 17.0, 22.0, 15.0, 16.0, 9.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.376953125, -0.35794830322265625, -0.3389434814453125, -0.31993865966796875, -0.300933837890625, -0.28192901611328125, -0.2629241943359375, -0.24391937255859375, -0.22491455078125, -0.20590972900390625, -0.1869049072265625, -0.16790008544921875, -0.148895263671875, -0.12989044189453125, -0.1108856201171875, -0.09188079833984375, -0.0728759765625, -0.05387115478515625, -0.0348663330078125, -0.01586151123046875, 0.003143310546875, 0.02214813232421875, 0.0411529541015625, 0.06015777587890625, 0.07916259765625, 0.09816741943359375, 0.1171722412109375, 0.13617706298828125, 0.155181884765625, 0.17418670654296875, 0.1931915283203125, 0.21219635009765625, 0.231201171875, 0.25020599365234375, 0.2692108154296875, 0.28821563720703125, 0.307220458984375, 0.32622528076171875, 0.3452301025390625, 0.36423492431640625, 0.38323974609375, 0.40224456787109375, 0.4212493896484375, 0.44025421142578125, 0.459259033203125, 0.47826385498046875, 0.4972686767578125, 0.5162734985351562, 0.5352783203125, 0.5542831420898438, 0.5732879638671875, 0.5922927856445312, 0.611297607421875, 0.6303024291992188, 0.6493072509765625, 0.6683120727539062, 0.68731689453125, 0.7063217163085938, 0.7253265380859375, 0.7443313598632812, 0.763336181640625, 0.7823410034179688, 0.8013458251953125, 0.8203506469726562, 0.83935546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 10.0, 9.0, 12.0, 16.0, 21.0, 26.0, 30.0, 66.0, 67.0, 85.0, 114.0, 182.0, 236.0, 324.0, 487.0, 742.0, 1077.0, 1665.0, 2677.0, 4824.0, 8465.0, 15789.0, 31643.0, 65743.0, 140065.0, 267619.0, 253459.0, 128495.0, 60642.0, 29113.0, 14869.0, 7946.0, 4407.0, 2636.0, 1592.0, 1096.0, 670.0, 482.0, 333.0, 214.0, 170.0, 113.0, 84.0, 61.0, 51.0, 36.0, 26.0, 21.0, 10.0, 12.0, 5.0, 6.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.00435638427734375, -0.0042108893394470215, -0.004065394401550293, -0.0039198994636535645, -0.003774404525756836, -0.0036289095878601074, -0.003483414649963379, -0.0033379197120666504, -0.003192424774169922, -0.0030469298362731934, -0.002901434898376465, -0.0027559399604797363, -0.002610445022583008, -0.0024649500846862793, -0.0023194551467895508, -0.0021739602088928223, -0.0020284652709960938, -0.0018829703330993652, -0.0017374753952026367, -0.0015919804573059082, -0.0014464855194091797, -0.0013009905815124512, -0.0011554956436157227, -0.0010100007057189941, -0.0008645057678222656, -0.0007190108299255371, -0.0005735158920288086, -0.0004280209541320801, -0.00028252601623535156, -0.00013703107833862305, 8.463859558105469e-06, 0.00015395879745483398, 0.0002994537353515625, 0.000444948673248291, 0.0005904436111450195, 0.000735938549041748, 0.0008814334869384766, 0.001026928424835205, 0.0011724233627319336, 0.0013179183006286621, 0.0014634132385253906, 0.0016089081764221191, 0.0017544031143188477, 0.0018998980522155762, 0.0020453929901123047, 0.002190887928009033, 0.0023363828659057617, 0.0024818778038024902, 0.0026273727416992188, 0.0027728676795959473, 0.0029183626174926758, 0.0030638575553894043, 0.003209352493286133, 0.0033548474311828613, 0.00350034236907959, 0.0036458373069763184, 0.003791332244873047, 0.003936827182769775, 0.004082322120666504, 0.004227817058563232, 0.004373311996459961, 0.0045188069343566895, 0.004664301872253418, 0.0048097968101501465, 0.004955291748046875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 6.0, 9.0, 18.0, 18.0, 31.0, 33.0, 37.0, 70.0, 57.0, 81.0, 96.0, 97.0, 92.0, 75.0, 45.0, 46.0, 54.0, 36.0, 20.0, 13.0, 16.0, 11.0, 9.0, 6.0, 0.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-05, -1.1525116860866547e-05, -1.1129304766654968e-05, -1.073349267244339e-05, -1.0337680578231812e-05, -9.941868484020233e-06, -9.546056389808655e-06, -9.150244295597076e-06, -8.754432201385498e-06, -8.35862010717392e-06, -7.962808012962341e-06, -7.566995918750763e-06, -7.1711838245391846e-06, -6.775371730327606e-06, -6.379559636116028e-06, -5.9837475419044495e-06, -5.587935447692871e-06, -5.192123353481293e-06, -4.796311259269714e-06, -4.400499165058136e-06, -4.004687070846558e-06, -3.6088749766349792e-06, -3.213062882423401e-06, -2.8172507882118225e-06, -2.421438694000244e-06, -2.0256265997886658e-06, -1.6298145055770874e-06, -1.234002411365509e-06, -8.381903171539307e-07, -4.423782229423523e-07, -4.6566128730773926e-08, 3.4924596548080444e-07, 7.450580596923828e-07, 1.1408701539039612e-06, 1.5366822481155396e-06, 1.932494342327118e-06, 2.3283064365386963e-06, 2.7241185307502747e-06, 3.119930624961853e-06, 3.5157427191734314e-06, 3.91155481338501e-06, 4.307366907596588e-06, 4.7031790018081665e-06, 5.098991096019745e-06, 5.494803190231323e-06, 5.890615284442902e-06, 6.28642737865448e-06, 6.682239472866058e-06, 7.078051567077637e-06, 7.473863661289215e-06, 7.869675755500793e-06, 8.265487849712372e-06, 8.66129994392395e-06, 9.057112038135529e-06, 9.452924132347107e-06, 9.848736226558685e-06, 1.0244548320770264e-05, 1.0640360414981842e-05, 1.103617250919342e-05, 1.1431984603404999e-05, 1.1827796697616577e-05, 1.2223608791828156e-05, 1.2619420886039734e-05, 1.3015232980251312e-05, 1.341104507446289e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 6.0, 9.0, 8.0, 12.0, 17.0, 17.0, 14.0, 34.0, 49.0, 66.0, 138.0, 225.0, 678.0, 2964.0, 19954.0, 208256.0, 705737.0, 97253.0, 10299.0, 1798.0, 487.0, 171.0, 110.0, 55.0, 50.0, 34.0, 24.0, 25.0, 16.0, 7.0, 12.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01308441162109375, -0.01267993450164795, -0.012275457382202148, -0.011870980262756348, -0.011466503143310547, -0.011062026023864746, -0.010657548904418945, -0.010253071784973145, -0.009848594665527344, -0.009444117546081543, -0.009039640426635742, -0.008635163307189941, -0.00823068618774414, -0.00782620906829834, -0.007421731948852539, -0.007017254829406738, -0.0066127777099609375, -0.006208300590515137, -0.005803823471069336, -0.005399346351623535, -0.004994869232177734, -0.004590392112731934, -0.004185914993286133, -0.003781437873840332, -0.0033769607543945312, -0.0029724836349487305, -0.0025680065155029297, -0.002163529396057129, -0.0017590522766113281, -0.0013545751571655273, -0.0009500980377197266, -0.0005456209182739258, -0.000141143798828125, 0.0002633333206176758, 0.0006678104400634766, 0.0010722875595092773, 0.0014767646789550781, 0.001881241798400879, 0.0022857189178466797, 0.0026901960372924805, 0.0030946731567382812, 0.003499150276184082, 0.003903627395629883, 0.004308104515075684, 0.004712581634521484, 0.005117058753967285, 0.005521535873413086, 0.005926012992858887, 0.0063304901123046875, 0.006734967231750488, 0.007139444351196289, 0.00754392147064209, 0.00794839859008789, 0.008352875709533691, 0.008757352828979492, 0.009161829948425293, 0.009566307067871094, 0.009970784187316895, 0.010375261306762695, 0.010779738426208496, 0.011184215545654297, 0.011588692665100098, 0.011993169784545898, 0.0123976469039917, 0.0128021240234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 9.0, 4.0, 8.0, 6.0, 7.0, 8.0, 13.0, 17.0, 17.0, 26.0, 35.0, 54.0, 53.0, 56.0, 68.0, 91.0, 74.0, 74.0, 97.0, 66.0, 36.0, 36.0, 35.0, 35.0, 15.0, 23.0, 5.0, 6.0, 8.0, 7.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0019483566284179688, -0.0018882006406784058, -0.0018280446529388428, -0.0017678886651992798, -0.0017077326774597168, -0.0016475766897201538, -0.0015874207019805908, -0.0015272647142410278, -0.0014671087265014648, -0.0014069527387619019, -0.0013467967510223389, -0.0012866407632827759, -0.0012264847755432129, -0.00116632878780365, -0.001106172800064087, -0.001046016812324524, -0.000985860824584961, -0.000925704836845398, -0.000865548849105835, -0.000805392861366272, -0.000745236873626709, -0.000685080885887146, -0.000624924898147583, -0.00056476891040802, -0.000504612922668457, -0.00044445693492889404, -0.00038430094718933105, -0.00032414495944976807, -0.0002639889717102051, -0.0002038329839706421, -0.0001436769962310791, -8.352100849151611e-05, -2.3365020751953125e-05, 3.679096698760986e-05, 9.694695472717285e-05, 0.00015710294246673584, 0.00021725893020629883, 0.0002774149179458618, 0.0003375709056854248, 0.0003977268934249878, 0.0004578828811645508, 0.0005180388689041138, 0.0005781948566436768, 0.0006383508443832397, 0.0006985068321228027, 0.0007586628198623657, 0.0008188188076019287, 0.0008789747953414917, 0.0009391307830810547, 0.0009992867708206177, 0.0010594427585601807, 0.0011195987462997437, 0.0011797547340393066, 0.0012399107217788696, 0.0013000667095184326, 0.0013602226972579956, 0.0014203786849975586, 0.0014805346727371216, 0.0015406906604766846, 0.0016008466482162476, 0.0016610026359558105, 0.0017211586236953735, 0.0017813146114349365, 0.0018414705991744995, 0.0019016265869140625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 17.0, 15.0, 25.0, 45.0, 80.0, 107.0, 136.0, 126.0, 123.0, 112.0, 58.0, 49.0, 31.0, 27.0, 16.0, 9.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35137131810188293, -0.33860769867897034, -0.32584407925605774, -0.31308045983314514, -0.30031681060791016, -0.28755319118499756, -0.27478957176208496, -0.26202595233917236, -0.24926233291625977, -0.23649871349334717, -0.22373509407043457, -0.21097145974636078, -0.19820784032344818, -0.18544422090053558, -0.1726805865764618, -0.1599169671535492, -0.1471533477306366, -0.134389728307724, -0.1216261014342308, -0.10886247456073761, -0.09609885513782501, -0.08333523571491241, -0.07057160884141922, -0.057807981967926025, -0.04504436254501343, -0.03228073939681053, -0.019517116248607635, -0.006753493100404739, 0.006010130047798157, 0.018773749470710754, 0.03153737634420395, 0.044301003217697144, 0.05706465244293213, 0.06982827186584473, 0.08259189873933792, 0.09535552561283112, 0.10811914503574371, 0.12088276445865631, 0.1336463987827301, 0.1464100182056427, 0.1591736376285553, 0.1719372570514679, 0.1847008764743805, 0.19746451079845428, 0.21022813022136688, 0.22299174964427948, 0.23575538396835327, 0.24851900339126587, 0.26128262281417847, 0.27404624223709106, 0.28680986166000366, 0.29957348108291626, 0.31233710050582886, 0.32510071992874146, 0.33786436915397644, 0.35062798857688904, 0.36339160799980164, 0.37615522742271423, 0.38891884684562683, 0.40168246626853943, 0.4144461154937744, 0.427209734916687, 0.4399733543395996, 0.4527369737625122, 0.4655005931854248]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 9.0, 14.0, 15.0, 20.0, 24.0, 43.0, 49.0, 59.0, 61.0, 58.0, 58.0, 50.0, 51.0, 65.0, 76.0, 64.0, 60.0, 41.0, 36.0, 32.0, 31.0, 23.0, 20.0, 11.0, 10.0, 7.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20771726965904236, -0.19885408878326416, -0.18999090790748596, -0.18112772703170776, -0.17226453125476837, -0.16340135037899017, -0.15453816950321198, -0.14567498862743378, -0.13681179285049438, -0.1279486119747162, -0.11908542364835739, -0.1102222427725792, -0.1013590544462204, -0.0924958735704422, -0.083632692694664, -0.0747695118188858, -0.0659063309431076, -0.05704314634203911, -0.04817996174097061, -0.03931678086519241, -0.030453596264123917, -0.02159041166305542, -0.012727230787277222, -0.003864046186208725, 0.004999138414859772, 0.013862322084605694, 0.022725505754351616, 0.03158868849277496, 0.04045187309384346, 0.04931505769491196, 0.058178238570690155, 0.06704142689704895, 0.07590460777282715, 0.08476778864860535, 0.09363097697496414, 0.10249415785074234, 0.11135734617710114, 0.12022052705287933, 0.12908370792865753, 0.13794688880443573, 0.14681008458137512, 0.15567326545715332, 0.16453644633293152, 0.17339962720870972, 0.1822628229856491, 0.1911260038614273, 0.1999891847372055, 0.2088523656129837, 0.2177155464887619, 0.2265787273645401, 0.2354419082403183, 0.2443051040172577, 0.2531682848930359, 0.2620314657688141, 0.2708946466445923, 0.2797578275203705, 0.2886210083961487, 0.2974841892719269, 0.3063473701477051, 0.3152105510234833, 0.3240737318992615, 0.33293694257736206, 0.34180009365081787, 0.35066330432891846, 0.35952648520469666]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 3.0, 9.0, 12.0, 19.0, 44.0, 95.0, 209.0, 450.0, 1127.0, 2834.0, 9716.0, 59412.0, 684030.0, 258071.0, 23865.0, 5376.0, 1886.0, 777.0, 308.0, 146.0, 65.0, 48.0, 17.0, 11.0, 5.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2130126953125, -0.2065143585205078, -0.20001602172851562, -0.19351768493652344, -0.18701934814453125, -0.18052101135253906, -0.17402267456054688, -0.1675243377685547, -0.1610260009765625, -0.1545276641845703, -0.14802932739257812, -0.14153099060058594, -0.13503265380859375, -0.12853431701660156, -0.12203598022460938, -0.11553764343261719, -0.109039306640625, -0.10254096984863281, -0.09604263305664062, -0.08954429626464844, -0.08304595947265625, -0.07654762268066406, -0.07004928588867188, -0.06355094909667969, -0.0570526123046875, -0.05055427551269531, -0.044055938720703125, -0.03755760192871094, -0.03105926513671875, -0.024560928344726562, -0.018062591552734375, -0.011564254760742188, -0.00506591796875, 0.0014324188232421875, 0.007930755615234375, 0.014429092407226562, 0.02092742919921875, 0.027425765991210938, 0.033924102783203125, 0.04042243957519531, 0.0469207763671875, 0.05341911315917969, 0.059917449951171875, 0.06641578674316406, 0.07291412353515625, 0.07941246032714844, 0.08591079711914062, 0.09240913391113281, 0.098907470703125, 0.10540580749511719, 0.11190414428710938, 0.11840248107910156, 0.12490081787109375, 0.13139915466308594, 0.13789749145507812, 0.1443958282470703, 0.1508941650390625, 0.1573925018310547, 0.16389083862304688, 0.17038917541503906, 0.17688751220703125, 0.18338584899902344, 0.18988418579101562, 0.1963825225830078, 0.202880859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 9.0, 4.0, 11.0, 17.0, 12.0, 13.0, 25.0, 37.0, 41.0, 46.0, 48.0, 62.0, 53.0, 41.0, 48.0, 66.0, 64.0, 64.0, 54.0, 50.0, 46.0, 34.0, 34.0, 31.0, 19.0, 27.0, 21.0, 9.0, 9.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.437744140625, -0.4211540222167969, -0.40456390380859375, -0.3879737854003906, -0.3713836669921875, -0.3547935485839844, -0.33820343017578125, -0.3216133117675781, -0.305023193359375, -0.2884330749511719, -0.27184295654296875, -0.2552528381347656, -0.2386627197265625, -0.22207260131835938, -0.20548248291015625, -0.18889236450195312, -0.17230224609375, -0.15571212768554688, -0.13912200927734375, -0.12253189086914062, -0.1059417724609375, -0.08935165405273438, -0.07276153564453125, -0.056171417236328125, -0.039581298828125, -0.022991180419921875, -0.00640106201171875, 0.010189056396484375, 0.0267791748046875, 0.043369293212890625, 0.05995941162109375, 0.07654953002929688, 0.0931396484375, 0.10972976684570312, 0.12631988525390625, 0.14291000366210938, 0.1595001220703125, 0.17609024047851562, 0.19268035888671875, 0.20927047729492188, 0.225860595703125, 0.24245071411132812, 0.25904083251953125, 0.2756309509277344, 0.2922210693359375, 0.3088111877441406, 0.32540130615234375, 0.3419914245605469, 0.35858154296875, 0.3751716613769531, 0.39176177978515625, 0.4083518981933594, 0.4249420166015625, 0.4415321350097656, 0.45812225341796875, 0.4747123718261719, 0.491302490234375, 0.5078926086425781, 0.5244827270507812, 0.5410728454589844, 0.5576629638671875, 0.5742530822753906, 0.5908432006835938, 0.6074333190917969, 0.6240234375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 0.0, 2.0, 10.0, 4.0, 9.0, 8.0, 9.0, 9.0, 9.0, 19.0, 14.0, 26.0, 32.0, 28.0, 38.0, 59.0, 74.0, 84.0, 148.0, 332.0, 1373.0, 18422.0, 982651.0, 41971.0, 2163.0, 416.0, 187.0, 78.0, 63.0, 53.0, 48.0, 41.0, 36.0, 19.0, 20.0, 24.0, 12.0, 6.0, 11.0, 10.0, 7.0, 9.0, 10.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.525390625, -0.5087661743164062, -0.4921417236328125, -0.47551727294921875, -0.458892822265625, -0.44226837158203125, -0.4256439208984375, -0.40901947021484375, -0.39239501953125, -0.37577056884765625, -0.3591461181640625, -0.34252166748046875, -0.325897216796875, -0.30927276611328125, -0.2926483154296875, -0.27602386474609375, -0.2593994140625, -0.24277496337890625, -0.2261505126953125, -0.20952606201171875, -0.192901611328125, -0.17627716064453125, -0.1596527099609375, -0.14302825927734375, -0.12640380859375, -0.10977935791015625, -0.0931549072265625, -0.07653045654296875, -0.059906005859375, -0.04328155517578125, -0.0266571044921875, -0.01003265380859375, 0.006591796875, 0.02321624755859375, 0.0398406982421875, 0.05646514892578125, 0.073089599609375, 0.08971405029296875, 0.1063385009765625, 0.12296295166015625, 0.13958740234375, 0.15621185302734375, 0.1728363037109375, 0.18946075439453125, 0.206085205078125, 0.22270965576171875, 0.2393341064453125, 0.25595855712890625, 0.2725830078125, 0.28920745849609375, 0.3058319091796875, 0.32245635986328125, 0.339080810546875, 0.35570526123046875, 0.3723297119140625, 0.38895416259765625, 0.40557861328125, 0.42220306396484375, 0.4388275146484375, 0.45545196533203125, 0.472076416015625, 0.48870086669921875, 0.5053253173828125, 0.5219497680664062, 0.53857421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 8.0, 5.0, 8.0, 8.0, 5.0, 8.0, 11.0, 12.0, 18.0, 15.0, 23.0, 35.0, 30.0, 41.0, 42.0, 31.0, 44.0, 49.0, 59.0, 45.0, 49.0, 57.0, 53.0, 45.0, 40.0, 45.0, 29.0, 33.0, 31.0, 21.0, 21.0, 17.0, 16.0, 8.0, 13.0, 7.0, 8.0, 4.0, 6.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.499267578125, -0.4827003479003906, -0.46613311767578125, -0.4495658874511719, -0.4329986572265625, -0.4164314270019531, -0.39986419677734375, -0.3832969665527344, -0.366729736328125, -0.3501625061035156, -0.33359527587890625, -0.3170280456542969, -0.3004608154296875, -0.2838935852050781, -0.26732635498046875, -0.2507591247558594, -0.23419189453125, -0.21762466430664062, -0.20105743408203125, -0.18449020385742188, -0.1679229736328125, -0.15135574340820312, -0.13478851318359375, -0.11822128295898438, -0.101654052734375, -0.08508682250976562, -0.06851959228515625, -0.051952362060546875, -0.0353851318359375, -0.018817901611328125, -0.00225067138671875, 0.014316558837890625, 0.0308837890625, 0.047451019287109375, 0.06401824951171875, 0.08058547973632812, 0.0971527099609375, 0.11371994018554688, 0.13028717041015625, 0.14685440063476562, 0.163421630859375, 0.17998886108398438, 0.19655609130859375, 0.21312332153320312, 0.2296905517578125, 0.24625778198242188, 0.26282501220703125, 0.2793922424316406, 0.29595947265625, 0.3125267028808594, 0.32909393310546875, 0.3456611633300781, 0.3622283935546875, 0.3787956237792969, 0.39536285400390625, 0.4119300842285156, 0.428497314453125, 0.4450645446777344, 0.46163177490234375, 0.4781990051269531, 0.4947662353515625, 0.5113334655761719, 0.5279006958007812, 0.5444679260253906, 0.56103515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 8.0, 7.0, 16.0, 23.0, 37.0, 44.0, 90.0, 371.0, 1881.0, 40039.0, 987325.0, 17022.0, 1184.0, 263.0, 95.0, 50.0, 34.0, 16.0, 11.0, 9.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2030029296875, -0.19632530212402344, -0.18964767456054688, -0.1829700469970703, -0.17629241943359375, -0.1696147918701172, -0.16293716430664062, -0.15625953674316406, -0.1495819091796875, -0.14290428161621094, -0.13622665405273438, -0.1295490264892578, -0.12287139892578125, -0.11619377136230469, -0.10951614379882812, -0.10283851623535156, -0.096160888671875, -0.08948326110839844, -0.08280563354492188, -0.07612800598144531, -0.06945037841796875, -0.06277275085449219, -0.056095123291015625, -0.04941749572753906, -0.0427398681640625, -0.03606224060058594, -0.029384613037109375, -0.022706985473632812, -0.01602935791015625, -0.009351730346679688, -0.002674102783203125, 0.0040035247802734375, 0.01068115234375, 0.017358779907226562, 0.024036407470703125, 0.030714035034179688, 0.03739166259765625, 0.04406929016113281, 0.050746917724609375, 0.05742454528808594, 0.0641021728515625, 0.07077980041503906, 0.07745742797851562, 0.08413505554199219, 0.09081268310546875, 0.09749031066894531, 0.10416793823242188, 0.11084556579589844, 0.117523193359375, 0.12420082092285156, 0.13087844848632812, 0.1375560760498047, 0.14423370361328125, 0.1509113311767578, 0.15758895874023438, 0.16426658630371094, 0.1709442138671875, 0.17762184143066406, 0.18429946899414062, 0.1909770965576172, 0.19765472412109375, 0.2043323516845703, 0.21100997924804688, 0.21768760681152344, 0.224365234375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 11.0, 13.0, 17.0, 41.0, 57.0, 101.0, 197.0, 237.0, 131.0, 67.0, 37.0, 31.0, 9.0, 11.0, 10.0, 6.0, 10.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.7344951629638672e-05, -1.691281795501709e-05, -1.6480684280395508e-05, -1.6048550605773926e-05, -1.5616416931152344e-05, -1.5184283256530762e-05, -1.475214958190918e-05, -1.4320015907287598e-05, -1.3887882232666016e-05, -1.3455748558044434e-05, -1.3023614883422852e-05, -1.259148120880127e-05, -1.2159347534179688e-05, -1.1727213859558105e-05, -1.1295080184936523e-05, -1.0862946510314941e-05, -1.043081283569336e-05, -9.998679161071777e-06, -9.566545486450195e-06, -9.134411811828613e-06, -8.702278137207031e-06, -8.27014446258545e-06, -7.838010787963867e-06, -7.405877113342285e-06, -6.973743438720703e-06, -6.541609764099121e-06, -6.109476089477539e-06, -5.677342414855957e-06, -5.245208740234375e-06, -4.813075065612793e-06, -4.380941390991211e-06, -3.948807716369629e-06, -3.516674041748047e-06, -3.084540367126465e-06, -2.652406692504883e-06, -2.2202730178833008e-06, -1.7881393432617188e-06, -1.3560056686401367e-06, -9.238719940185547e-07, -4.917383193969727e-07, -5.960464477539063e-08, 3.725290298461914e-07, 8.046627044677734e-07, 1.2367963790893555e-06, 1.6689300537109375e-06, 2.1010637283325195e-06, 2.5331974029541016e-06, 2.9653310775756836e-06, 3.3974647521972656e-06, 3.829598426818848e-06, 4.26173210144043e-06, 4.693865776062012e-06, 5.125999450683594e-06, 5.558133125305176e-06, 5.990266799926758e-06, 6.42240047454834e-06, 6.854534149169922e-06, 7.286667823791504e-06, 7.718801498413086e-06, 8.150935173034668e-06, 8.58306884765625e-06, 9.015202522277832e-06, 9.447336196899414e-06, 9.879469871520996e-06, 1.0311603546142578e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 4.0, 4.0, 15.0, 13.0, 21.0, 28.0, 56.0, 186.0, 546.0, 2341.0, 27627.0, 995164.0, 19571.0, 2181.0, 491.0, 161.0, 48.0, 28.0, 16.0, 12.0, 8.0, 4.0, 4.0, 3.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.283447265625, -0.2752208709716797, -0.2669944763183594, -0.25876808166503906, -0.25054168701171875, -0.24231529235839844, -0.23408889770507812, -0.2258625030517578, -0.2176361083984375, -0.2094097137451172, -0.20118331909179688, -0.19295692443847656, -0.18473052978515625, -0.17650413513183594, -0.16827774047851562, -0.1600513458251953, -0.151824951171875, -0.1435985565185547, -0.13537216186523438, -0.12714576721191406, -0.11891937255859375, -0.11069297790527344, -0.10246658325195312, -0.09424018859863281, -0.0860137939453125, -0.07778739929199219, -0.06956100463867188, -0.06133460998535156, -0.05310821533203125, -0.04488182067871094, -0.036655426025390625, -0.028429031372070312, -0.02020263671875, -0.011976242065429688, -0.003749847412109375, 0.0044765472412109375, 0.01270294189453125, 0.020929336547851562, 0.029155731201171875, 0.03738212585449219, 0.0456085205078125, 0.05383491516113281, 0.062061309814453125, 0.07028770446777344, 0.07851409912109375, 0.08674049377441406, 0.09496688842773438, 0.10319328308105469, 0.111419677734375, 0.11964607238769531, 0.12787246704101562, 0.13609886169433594, 0.14432525634765625, 0.15255165100097656, 0.16077804565429688, 0.1690044403076172, 0.1772308349609375, 0.1854572296142578, 0.19368362426757812, 0.20191001892089844, 0.21013641357421875, 0.21836280822753906, 0.22658920288085938, 0.2348155975341797, 0.2430419921875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 6.0, 4.0, 12.0, 16.0, 20.0, 26.0, 81.0, 94.0, 151.0, 199.0, 137.0, 76.0, 62.0, 39.0, 24.0, 19.0, 11.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.05047607421875, -0.04881858825683594, -0.047161102294921875, -0.04550361633300781, -0.04384613037109375, -0.04218864440917969, -0.040531158447265625, -0.03887367248535156, -0.0372161865234375, -0.03555870056152344, -0.033901214599609375, -0.03224372863769531, -0.03058624267578125, -0.028928756713867188, -0.027271270751953125, -0.025613784790039062, -0.023956298828125, -0.022298812866210938, -0.020641326904296875, -0.018983840942382812, -0.01732635498046875, -0.015668869018554688, -0.014011383056640625, -0.012353897094726562, -0.0106964111328125, -0.009038925170898438, -0.007381439208984375, -0.0057239532470703125, -0.00406646728515625, -0.0024089813232421875, -0.000751495361328125, 0.0009059906005859375, 0.0025634765625, 0.0042209625244140625, 0.005878448486328125, 0.0075359344482421875, 0.00919342041015625, 0.010850906372070312, 0.012508392333984375, 0.014165878295898438, 0.0158233642578125, 0.017480850219726562, 0.019138336181640625, 0.020795822143554688, 0.02245330810546875, 0.024110794067382812, 0.025768280029296875, 0.027425765991210938, 0.029083251953125, 0.030740737915039062, 0.032398223876953125, 0.03405570983886719, 0.03571319580078125, 0.03737068176269531, 0.039028167724609375, 0.04068565368652344, 0.0423431396484375, 0.04400062561035156, 0.045658111572265625, 0.04731559753417969, 0.04897308349609375, 0.05063056945800781, 0.052288055419921875, 0.05394554138183594, 0.05560302734375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 14.0, 30.0, 71.0, 127.0, 220.0, 222.0, 153.0, 76.0, 45.0, 25.0, 9.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5231166481971741, -0.4801306128501892, -0.43714454770088196, -0.3941584825515747, -0.35117244720458984, -0.308186411857605, -0.26520034670829773, -0.22221428155899048, -0.17922824621200562, -0.13624219596385956, -0.0932561457157135, -0.050270095467567444, -0.007284045219421387, 0.03570200502872467, 0.07868805527687073, 0.12167412042617798, 0.16466015577316284, 0.2076462060213089, 0.25063225626945496, 0.2936183214187622, 0.33660435676574707, 0.37959039211273193, 0.4225764572620392, 0.46556252241134644, 0.5085485577583313, 0.5515345931053162, 0.5945206880569458, 0.6375067234039307, 0.6804927587509155, 0.7234787940979004, 0.7664648294448853, 0.8094509243965149, 0.8524370193481445, 0.8954230546951294, 0.9384090900421143, 0.9813951849937439, 1.024381160736084, 1.0673673152923584, 1.1103533506393433, 1.1533393859863281, 1.196325421333313, 1.2393114566802979, 1.2822974920272827, 1.3252835273742676, 1.368269681930542, 1.4112557172775269, 1.4542417526245117, 1.4972277879714966, 1.5402138233184814, 1.5831998586654663, 1.6261858940124512, 1.669171929359436, 1.712157964706421, 1.7551441192626953, 1.7981301546096802, 1.841116189956665, 1.88410222530365, 1.9270882606506348, 1.9700742959976196, 2.0130603313446045, 2.056046485900879, 2.099032402038574, 2.1420185565948486, 2.185004711151123, 2.2279906272888184]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 2.0, 7.0, 9.0, 10.0, 13.0, 17.0, 15.0, 18.0, 30.0, 22.0, 24.0, 18.0, 32.0, 37.0, 43.0, 32.0, 43.0, 41.0, 43.0, 44.0, 54.0, 37.0, 40.0, 33.0, 36.0, 29.0, 44.0, 35.0, 36.0, 23.0, 16.0, 14.0, 23.0, 17.0, 10.0, 13.0, 13.0, 8.0, 4.0, 2.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.713683009147644, -0.6889926791191101, -0.664302408695221, -0.639612078666687, -0.6149217486381531, -0.5902314782142639, -0.56554114818573, -0.5408508777618408, -0.5161605477333069, -0.49147024750709534, -0.4667799174785614, -0.44208961725234985, -0.4173993170261383, -0.39270901679992676, -0.3680186867713928, -0.3433283865451813, -0.31863805651664734, -0.2939477562904358, -0.26925742626190186, -0.2445671260356903, -0.21987682580947876, -0.19518651068210602, -0.17049619555473328, -0.14580589532852173, -0.12111558020114899, -0.09642527252435684, -0.0717349648475647, -0.047044649720191956, -0.02235434204339981, 0.002335965633392334, 0.027026280760765076, 0.051716580986976624, 0.07640689611434937, 0.10109720379114151, 0.12578751146793365, 0.1504778265953064, 0.17516812682151794, 0.19985844194889069, 0.22454875707626343, 0.24923905730247498, 0.2739293575286865, 0.29861965775489807, 0.323309987783432, 0.34800028800964355, 0.3726905882358551, 0.39738088846206665, 0.4220712184906006, 0.44676151871681213, 0.47145184874534607, 0.4961421489715576, 0.5208324790000916, 0.5455228090286255, 0.5702130794525146, 0.5949034094810486, 0.6195937395095825, 0.6442840099334717, 0.6689743399620056, 0.6936646699905396, 0.7183549404144287, 0.7430452704429626, 0.7677356004714966, 0.7924258708953857, 0.8171162009239197, 0.8418065309524536, 0.8664968013763428]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 6.0, 13.0, 17.0, 26.0, 55.0, 85.0, 126.0, 265.0, 515.0, 1007.0, 2089.0, 5534.0, 17353.0, 163323.0, 2964798.0, 978623.0, 45822.0, 8626.0, 3035.0, 1401.0, 722.0, 356.0, 205.0, 104.0, 68.0, 33.0, 30.0, 16.0, 12.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.63525390625, -0.6158599853515625, -0.596466064453125, -0.5770721435546875, -0.55767822265625, -0.5382843017578125, -0.518890380859375, -0.4994964599609375, -0.4801025390625, -0.4607086181640625, -0.441314697265625, -0.4219207763671875, -0.40252685546875, -0.3831329345703125, -0.363739013671875, -0.3443450927734375, -0.324951171875, -0.3055572509765625, -0.286163330078125, -0.2667694091796875, -0.24737548828125, -0.2279815673828125, -0.208587646484375, -0.1891937255859375, -0.1697998046875, -0.1504058837890625, -0.131011962890625, -0.1116180419921875, -0.09222412109375, -0.0728302001953125, -0.053436279296875, -0.0340423583984375, -0.0146484375, 0.0047454833984375, 0.024139404296875, 0.0435333251953125, 0.06292724609375, 0.0823211669921875, 0.101715087890625, 0.1211090087890625, 0.1405029296875, 0.1598968505859375, 0.179290771484375, 0.1986846923828125, 0.21807861328125, 0.2374725341796875, 0.256866455078125, 0.2762603759765625, 0.295654296875, 0.3150482177734375, 0.334442138671875, 0.3538360595703125, 0.37322998046875, 0.3926239013671875, 0.412017822265625, 0.4314117431640625, 0.4508056640625, 0.4701995849609375, 0.489593505859375, 0.5089874267578125, 0.52838134765625, 0.5477752685546875, 0.567169189453125, 0.5865631103515625, 0.60595703125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 6.0, 7.0, 14.0, 19.0, 18.0, 31.0, 25.0, 49.0, 49.0, 67.0, 51.0, 67.0, 84.0, 58.0, 67.0, 75.0, 60.0, 62.0, 42.0, 38.0, 27.0, 24.0, 24.0, 13.0, 7.0, 5.0, 10.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27587890625, -0.26447296142578125, -0.2530670166015625, -0.24166107177734375, -0.230255126953125, -0.21884918212890625, -0.2074432373046875, -0.19603729248046875, -0.18463134765625, -0.17322540283203125, -0.1618194580078125, -0.15041351318359375, -0.139007568359375, -0.12760162353515625, -0.1161956787109375, -0.10478973388671875, -0.0933837890625, -0.08197784423828125, -0.0705718994140625, -0.05916595458984375, -0.047760009765625, -0.03635406494140625, -0.0249481201171875, -0.01354217529296875, -0.00213623046875, 0.00926971435546875, 0.0206756591796875, 0.03208160400390625, 0.043487548828125, 0.05489349365234375, 0.0662994384765625, 0.07770538330078125, 0.089111328125, 0.10051727294921875, 0.1119232177734375, 0.12332916259765625, 0.134735107421875, 0.14614105224609375, 0.1575469970703125, 0.16895294189453125, 0.18035888671875, 0.19176483154296875, 0.2031707763671875, 0.21457672119140625, 0.225982666015625, 0.23738861083984375, 0.2487945556640625, 0.26020050048828125, 0.2716064453125, 0.28301239013671875, 0.2944183349609375, 0.30582427978515625, 0.317230224609375, 0.32863616943359375, 0.3400421142578125, 0.35144805908203125, 0.36285400390625, 0.37425994873046875, 0.3856658935546875, 0.39707183837890625, 0.408477783203125, 0.41988372802734375, 0.4312896728515625, 0.44269561767578125, 0.4541015625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 6.0, 11.0, 19.0, 28.0, 29.0, 52.0, 72.0, 134.0, 203.0, 450.0, 1016.0, 3521.0, 22208.0, 1367975.0, 2764023.0, 28339.0, 4054.0, 1104.0, 425.0, 233.0, 120.0, 67.0, 60.0, 27.0, 21.0, 24.0, 10.0, 10.0, 9.0, 6.0, 6.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9658203125, -0.938262939453125, -0.91070556640625, -0.883148193359375, -0.8555908203125, -0.828033447265625, -0.80047607421875, -0.772918701171875, -0.745361328125, -0.717803955078125, -0.69024658203125, -0.662689208984375, -0.6351318359375, -0.607574462890625, -0.58001708984375, -0.552459716796875, -0.52490234375, -0.497344970703125, -0.46978759765625, -0.442230224609375, -0.4146728515625, -0.387115478515625, -0.35955810546875, -0.332000732421875, -0.304443359375, -0.276885986328125, -0.24932861328125, -0.221771240234375, -0.1942138671875, -0.166656494140625, -0.13909912109375, -0.111541748046875, -0.083984375, -0.056427001953125, -0.02886962890625, -0.001312255859375, 0.0262451171875, 0.053802490234375, 0.08135986328125, 0.108917236328125, 0.136474609375, 0.164031982421875, 0.19158935546875, 0.219146728515625, 0.2467041015625, 0.274261474609375, 0.30181884765625, 0.329376220703125, 0.35693359375, 0.384490966796875, 0.41204833984375, 0.439605712890625, 0.4671630859375, 0.494720458984375, 0.52227783203125, 0.549835205078125, 0.577392578125, 0.604949951171875, 0.63250732421875, 0.660064697265625, 0.6876220703125, 0.715179443359375, 0.74273681640625, 0.770294189453125, 0.7978515625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 5.0, 12.0, 9.0, 24.0, 18.0, 35.0, 35.0, 60.0, 108.0, 207.0, 451.0, 804.0, 950.0, 614.0, 321.0, 141.0, 92.0, 54.0, 36.0, 15.0, 23.0, 14.0, 13.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.148681640625, -0.1434173583984375, -0.138153076171875, -0.1328887939453125, -0.12762451171875, -0.1223602294921875, -0.117095947265625, -0.1118316650390625, -0.1065673828125, -0.1013031005859375, -0.096038818359375, -0.0907745361328125, -0.08551025390625, -0.0802459716796875, -0.074981689453125, -0.0697174072265625, -0.064453125, -0.0591888427734375, -0.053924560546875, -0.0486602783203125, -0.04339599609375, -0.0381317138671875, -0.032867431640625, -0.0276031494140625, -0.0223388671875, -0.0170745849609375, -0.011810302734375, -0.0065460205078125, -0.00128173828125, 0.0039825439453125, 0.009246826171875, 0.0145111083984375, 0.019775390625, 0.0250396728515625, 0.030303955078125, 0.0355682373046875, 0.04083251953125, 0.0460968017578125, 0.051361083984375, 0.0566253662109375, 0.0618896484375, 0.0671539306640625, 0.072418212890625, 0.0776824951171875, 0.08294677734375, 0.0882110595703125, 0.093475341796875, 0.0987396240234375, 0.10400390625, 0.1092681884765625, 0.114532470703125, 0.1197967529296875, 0.12506103515625, 0.1303253173828125, 0.135589599609375, 0.1408538818359375, 0.1461181640625, 0.1513824462890625, 0.156646728515625, 0.1619110107421875, 0.16717529296875, 0.1724395751953125, 0.177703857421875, 0.1829681396484375, 0.188232421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 1.0, 6.0, 3.0, 7.0, 8.0, 10.0, 15.0, 22.0, 26.0, 54.0, 63.0, 74.0, 77.0, 90.0, 87.0, 92.0, 87.0, 73.0, 56.0, 36.0, 36.0, 17.0, 11.0, 20.0, 7.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3815903663635254, -0.3678026497364044, -0.35401496291160583, -0.34022724628448486, -0.3264395594596863, -0.3126518428325653, -0.2988641560077667, -0.28507643938064575, -0.27128875255584717, -0.2575010359287262, -0.2437133491039276, -0.22992564737796783, -0.21613794565200806, -0.20235022902488708, -0.1885625422000885, -0.17477482557296753, -0.16098712384700775, -0.14719942212104797, -0.1334117203950882, -0.11962401866912842, -0.10583631694316864, -0.09204860776662827, -0.07826090604066849, -0.06447320431470871, -0.05068550258874893, -0.036897800862789154, -0.023110097274184227, -0.0093223936855793, 0.004465308040380478, 0.018253013491630554, 0.03204071521759033, 0.04582841694355011, 0.05961611866950989, 0.07340382039546967, 0.08719152212142944, 0.10097922384738922, 0.114766925573349, 0.12855464220046997, 0.14234232902526855, 0.15613004565238953, 0.1699177324771881, 0.1837054342031479, 0.19749313592910767, 0.21128083765506744, 0.22506853938102722, 0.2388562560081482, 0.2526439428329468, 0.26643165946006775, 0.2802193760871887, 0.2940070927143097, 0.3077947795391083, 0.32158249616622925, 0.33537018299102783, 0.3491578996181488, 0.3629455864429474, 0.37673330307006836, 0.39052098989486694, 0.4043087065219879, 0.4180963933467865, 0.43188410997390747, 0.44567179679870605, 0.459459513425827, 0.4732472002506256, 0.4870349168777466, 0.5008226037025452]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 7.0, 6.0, 10.0, 9.0, 7.0, 10.0, 14.0, 24.0, 27.0, 26.0, 35.0, 59.0, 53.0, 58.0, 47.0, 57.0, 61.0, 47.0, 55.0, 47.0, 50.0, 50.0, 40.0, 38.0, 32.0, 30.0, 22.0, 21.0, 20.0, 13.0, 13.0, 7.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23207120597362518, -0.22092002630233765, -0.2097688466310501, -0.19861766695976257, -0.18746648728847504, -0.1763153076171875, -0.16516412794589996, -0.15401294827461243, -0.1428617686033249, -0.13171058893203735, -0.12055940926074982, -0.10940822958946228, -0.09825704991817474, -0.08710587024688721, -0.07595469057559967, -0.06480351090431213, -0.0536523312330246, -0.04250115156173706, -0.031349971890449524, -0.020198792219161987, -0.00904761254787445, 0.002103567123413086, 0.013254746794700623, 0.02440592646598816, 0.035557106137275696, 0.04670828580856323, 0.05785946547985077, 0.0690106451511383, 0.08016182482242584, 0.09131300449371338, 0.10246418416500092, 0.11361536383628845, 0.12476655840873718, 0.13591773808002472, 0.14706891775131226, 0.1582200974225998, 0.16937127709388733, 0.18052245676517487, 0.1916736364364624, 0.20282481610774994, 0.21397599577903748, 0.225127175450325, 0.23627835512161255, 0.24742953479290009, 0.2585807144641876, 0.26973187923431396, 0.2808830738067627, 0.2920342683792114, 0.30318543314933777, 0.3143365979194641, 0.32548779249191284, 0.3366389870643616, 0.3477901518344879, 0.35894131660461426, 0.370092511177063, 0.3812437057495117, 0.39239487051963806, 0.4035460352897644, 0.41469722986221313, 0.42584842443466187, 0.4369995892047882, 0.44815075397491455, 0.4593019485473633, 0.470453143119812, 0.48160430788993835]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 7.0, 7.0, 13.0, 12.0, 20.0, 29.0, 36.0, 63.0, 113.0, 163.0, 380.0, 793.0, 1952.0, 4906.0, 14069.0, 47687.0, 221590.0, 547486.0, 155091.0, 36040.0, 11004.0, 4059.0, 1615.0, 682.0, 309.0, 161.0, 98.0, 50.0, 34.0, 36.0, 14.0, 10.0, 7.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12298583984375, -0.1197824478149414, -0.11657905578613281, -0.11337566375732422, -0.11017227172851562, -0.10696887969970703, -0.10376548767089844, -0.10056209564208984, -0.09735870361328125, -0.09415531158447266, -0.09095191955566406, -0.08774852752685547, -0.08454513549804688, -0.08134174346923828, -0.07813835144042969, -0.0749349594116211, -0.0717315673828125, -0.0685281753540039, -0.06532478332519531, -0.06212139129638672, -0.058917999267578125, -0.05571460723876953, -0.05251121520996094, -0.049307823181152344, -0.04610443115234375, -0.042901039123535156, -0.03969764709472656, -0.03649425506591797, -0.033290863037109375, -0.03008747100830078, -0.026884078979492188, -0.023680686950683594, -0.020477294921875, -0.017273902893066406, -0.014070510864257812, -0.010867118835449219, -0.007663726806640625, -0.004460334777832031, -0.0012569427490234375, 0.0019464492797851562, 0.00514984130859375, 0.008353233337402344, 0.011556625366210938, 0.014760017395019531, 0.017963409423828125, 0.02116680145263672, 0.024370193481445312, 0.027573585510253906, 0.0307769775390625, 0.033980369567871094, 0.03718376159667969, 0.04038715362548828, 0.043590545654296875, 0.04679393768310547, 0.04999732971191406, 0.053200721740722656, 0.05640411376953125, 0.059607505798339844, 0.06281089782714844, 0.06601428985595703, 0.06921768188476562, 0.07242107391357422, 0.07562446594238281, 0.0788278579711914, 0.08203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 9.0, 10.0, 13.0, 20.0, 20.0, 31.0, 55.0, 53.0, 67.0, 59.0, 66.0, 74.0, 72.0, 73.0, 80.0, 52.0, 52.0, 51.0, 31.0, 28.0, 24.0, 17.0, 10.0, 13.0, 8.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1876220703125, -0.1783885955810547, -0.16915512084960938, -0.15992164611816406, -0.15068817138671875, -0.14145469665527344, -0.13222122192382812, -0.12298774719238281, -0.1137542724609375, -0.10452079772949219, -0.09528732299804688, -0.08605384826660156, -0.07682037353515625, -0.06758689880371094, -0.058353424072265625, -0.04911994934082031, -0.039886474609375, -0.030652999877929688, -0.021419525146484375, -0.012186050415039062, -0.00295257568359375, 0.0062808990478515625, 0.015514373779296875, 0.024747848510742188, 0.0339813232421875, 0.04321479797363281, 0.052448272705078125, 0.06168174743652344, 0.07091522216796875, 0.08014869689941406, 0.08938217163085938, 0.09861564636230469, 0.10784912109375, 0.11708259582519531, 0.12631607055664062, 0.13554954528808594, 0.14478302001953125, 0.15401649475097656, 0.16324996948242188, 0.1724834442138672, 0.1817169189453125, 0.1909503936767578, 0.20018386840820312, 0.20941734313964844, 0.21865081787109375, 0.22788429260253906, 0.23711776733398438, 0.2463512420654297, 0.255584716796875, 0.2648181915283203, 0.2740516662597656, 0.28328514099121094, 0.29251861572265625, 0.30175209045410156, 0.3109855651855469, 0.3202190399169922, 0.3294525146484375, 0.3386859893798828, 0.3479194641113281, 0.35715293884277344, 0.36638641357421875, 0.37561988830566406, 0.3848533630371094, 0.3940868377685547, 0.4033203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 13.0, 14.0, 12.0, 26.0, 49.0, 71.0, 94.0, 131.0, 197.0, 310.0, 377.0, 609.0, 887.0, 1223.0, 1875.0, 2812.0, 4073.0, 6435.0, 9770.0, 15266.0, 25163.0, 42970.0, 77814.0, 141904.0, 223115.0, 206009.0, 122139.0, 66164.0, 37519.0, 21860.0, 13566.0, 8565.0, 5728.0, 3806.0, 2466.0, 1717.0, 1167.0, 778.0, 563.0, 389.0, 272.0, 205.0, 154.0, 81.0, 54.0, 36.0, 31.0, 21.0, 19.0, 11.0, 4.0, 7.0, 6.0, 5.0, 3.0, 2.0], "bins": [-0.0374755859375, -0.03633546829223633, -0.035195350646972656, -0.034055233001708984, -0.03291511535644531, -0.03177499771118164, -0.03063488006591797, -0.029494762420654297, -0.028354644775390625, -0.027214527130126953, -0.02607440948486328, -0.02493429183959961, -0.023794174194335938, -0.022654056549072266, -0.021513938903808594, -0.020373821258544922, -0.01923370361328125, -0.018093585968017578, -0.016953468322753906, -0.015813350677490234, -0.014673233032226562, -0.01353311538696289, -0.012392997741699219, -0.011252880096435547, -0.010112762451171875, -0.008972644805908203, -0.007832527160644531, -0.006692409515380859, -0.0055522918701171875, -0.004412174224853516, -0.0032720565795898438, -0.002131938934326172, -0.0009918212890625, 0.00014829635620117188, 0.0012884140014648438, 0.0024285316467285156, 0.0035686492919921875, 0.004708766937255859, 0.005848884582519531, 0.006989002227783203, 0.008129119873046875, 0.009269237518310547, 0.010409355163574219, 0.01154947280883789, 0.012689590454101562, 0.013829708099365234, 0.014969825744628906, 0.016109943389892578, 0.01725006103515625, 0.018390178680419922, 0.019530296325683594, 0.020670413970947266, 0.021810531616210938, 0.02295064926147461, 0.02409076690673828, 0.025230884552001953, 0.026371002197265625, 0.027511119842529297, 0.02865123748779297, 0.02979135513305664, 0.030931472778320312, 0.032071590423583984, 0.033211708068847656, 0.03435182571411133, 0.035491943359375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 9.0, 5.0, 9.0, 11.0, 9.0, 16.0, 9.0, 16.0, 16.0, 22.0, 29.0, 22.0, 36.0, 37.0, 37.0, 39.0, 48.0, 61.0, 54.0, 44.0, 49.0, 44.0, 37.0, 47.0, 37.0, 51.0, 28.0, 28.0, 25.0, 16.0, 16.0, 14.0, 13.0, 7.0, 16.0, 9.0, 10.0, 5.0, 6.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.4443359375, -0.43137359619140625, -0.4184112548828125, -0.40544891357421875, -0.392486572265625, -0.37952423095703125, -0.3665618896484375, -0.35359954833984375, -0.34063720703125, -0.32767486572265625, -0.3147125244140625, -0.30175018310546875, -0.288787841796875, -0.27582550048828125, -0.2628631591796875, -0.24990081787109375, -0.2369384765625, -0.22397613525390625, -0.2110137939453125, -0.19805145263671875, -0.185089111328125, -0.17212677001953125, -0.1591644287109375, -0.14620208740234375, -0.13323974609375, -0.12027740478515625, -0.1073150634765625, -0.09435272216796875, -0.081390380859375, -0.06842803955078125, -0.0554656982421875, -0.04250335693359375, -0.029541015625, -0.01657867431640625, -0.0036163330078125, 0.00934600830078125, 0.022308349609375, 0.03527069091796875, 0.0482330322265625, 0.06119537353515625, 0.07415771484375, 0.08712005615234375, 0.1000823974609375, 0.11304473876953125, 0.126007080078125, 0.13896942138671875, 0.1519317626953125, 0.16489410400390625, 0.1778564453125, 0.19081878662109375, 0.2037811279296875, 0.21674346923828125, 0.229705810546875, 0.24266815185546875, 0.2556304931640625, 0.26859283447265625, 0.28155517578125, 0.29451751708984375, 0.3074798583984375, 0.32044219970703125, 0.333404541015625, 0.34636688232421875, 0.3593292236328125, 0.37229156494140625, 0.38525390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 6.0, 13.0, 19.0, 23.0, 20.0, 38.0, 49.0, 61.0, 78.0, 121.0, 174.0, 287.0, 386.0, 637.0, 888.0, 1517.0, 2527.0, 4735.0, 8749.0, 17151.0, 34023.0, 69184.0, 143539.0, 267343.0, 247307.0, 125774.0, 60475.0, 29978.0, 14925.0, 7929.0, 4136.0, 2479.0, 1411.0, 838.0, 565.0, 367.0, 219.0, 188.0, 123.0, 84.0, 54.0, 38.0, 26.0, 12.0, 15.0, 18.0, 9.0, 4.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.0035915374755859375, -0.0034824013710021973, -0.003373265266418457, -0.003264129161834717, -0.0031549930572509766, -0.0030458569526672363, -0.002936720848083496, -0.002827584743499756, -0.0027184486389160156, -0.0026093125343322754, -0.002500176429748535, -0.002391040325164795, -0.0022819042205810547, -0.0021727681159973145, -0.0020636320114135742, -0.001954495906829834, -0.0018453598022460938, -0.0017362236976623535, -0.0016270875930786133, -0.001517951488494873, -0.0014088153839111328, -0.0012996792793273926, -0.0011905431747436523, -0.0010814070701599121, -0.0009722709655761719, -0.0008631348609924316, -0.0007539987564086914, -0.0006448626518249512, -0.0005357265472412109, -0.0004265904426574707, -0.00031745433807373047, -0.00020831823348999023, -9.918212890625e-05, 9.953975677490234e-06, 0.00011909008026123047, 0.0002282261848449707, 0.00033736228942871094, 0.00044649839401245117, 0.0005556344985961914, 0.0006647706031799316, 0.0007739067077636719, 0.0008830428123474121, 0.0009921789169311523, 0.0011013150215148926, 0.0012104511260986328, 0.001319587230682373, 0.0014287233352661133, 0.0015378594398498535, 0.0016469955444335938, 0.001756131649017334, 0.0018652677536010742, 0.0019744038581848145, 0.0020835399627685547, 0.002192676067352295, 0.002301812171936035, 0.0024109482765197754, 0.0025200843811035156, 0.002629220485687256, 0.002738356590270996, 0.0028474926948547363, 0.0029566287994384766, 0.003065764904022217, 0.003174901008605957, 0.0032840371131896973, 0.0033931732177734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 6.0, 5.0, 5.0, 4.0, 9.0, 9.0, 23.0, 29.0, 28.0, 26.0, 32.0, 70.0, 61.0, 79.0, 73.0, 87.0, 86.0, 76.0, 66.0, 42.0, 43.0, 25.0, 22.0, 19.0, 21.0, 13.0, 7.0, 9.0, 7.0, 6.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.47713851928711e-06, -9.172596037387848e-06, -8.868053555488586e-06, -8.563511073589325e-06, -8.258968591690063e-06, -7.954426109790802e-06, -7.64988362789154e-06, -7.345341145992279e-06, -7.040798664093018e-06, -6.736256182193756e-06, -6.431713700294495e-06, -6.127171218395233e-06, -5.822628736495972e-06, -5.51808625459671e-06, -5.213543772697449e-06, -4.909001290798187e-06, -4.604458808898926e-06, -4.299916326999664e-06, -3.995373845100403e-06, -3.6908313632011414e-06, -3.38628888130188e-06, -3.0817463994026184e-06, -2.777203917503357e-06, -2.4726614356040955e-06, -2.168118953704834e-06, -1.8635764718055725e-06, -1.559033989906311e-06, -1.2544915080070496e-06, -9.499490261077881e-07, -6.454065442085266e-07, -3.4086406230926514e-07, -3.632158041000366e-08, 2.682209014892578e-07, 5.727633833885193e-07, 8.773058652877808e-07, 1.1818483471870422e-06, 1.4863908290863037e-06, 1.7909333109855652e-06, 2.0954757928848267e-06, 2.400018274784088e-06, 2.7045607566833496e-06, 3.009103238582611e-06, 3.3136457204818726e-06, 3.618188202381134e-06, 3.9227306842803955e-06, 4.227273166179657e-06, 4.5318156480789185e-06, 4.83635812997818e-06, 5.140900611877441e-06, 5.445443093776703e-06, 5.749985575675964e-06, 6.054528057575226e-06, 6.359070539474487e-06, 6.663613021373749e-06, 6.96815550327301e-06, 7.272697985172272e-06, 7.577240467071533e-06, 7.881782948970795e-06, 8.186325430870056e-06, 8.490867912769318e-06, 8.795410394668579e-06, 9.09995287656784e-06, 9.404495358467102e-06, 9.709037840366364e-06, 1.0013580322265625e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 4.0, 10.0, 7.0, 6.0, 14.0, 16.0, 29.0, 23.0, 26.0, 38.0, 39.0, 60.0, 49.0, 77.0, 102.0, 126.0, 206.0, 400.0, 920.0, 2282.0, 6954.0, 22025.0, 74825.0, 245255.0, 416741.0, 194601.0, 57472.0, 17065.0, 5451.0, 1856.0, 747.0, 329.0, 196.0, 127.0, 94.0, 74.0, 59.0, 50.0, 50.0, 28.0, 26.0, 22.0, 13.0, 19.0, 14.0, 10.0, 6.0, 9.0, 1.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00539398193359375, -0.005232453346252441, -0.005070924758911133, -0.004909396171569824, -0.004747867584228516, -0.004586338996887207, -0.0044248104095458984, -0.00426328182220459, -0.004101753234863281, -0.003940224647521973, -0.003778696060180664, -0.0036171674728393555, -0.003455638885498047, -0.0032941102981567383, -0.0031325817108154297, -0.002971053123474121, -0.0028095245361328125, -0.002647995948791504, -0.0024864673614501953, -0.0023249387741088867, -0.002163410186767578, -0.0020018815994262695, -0.001840353012084961, -0.0016788244247436523, -0.0015172958374023438, -0.0013557672500610352, -0.0011942386627197266, -0.001032710075378418, -0.0008711814880371094, -0.0007096529006958008, -0.0005481243133544922, -0.0003865957260131836, -0.000225067138671875, -6.35385513305664e-05, 9.799003601074219e-05, 0.0002595186233520508, 0.0004210472106933594, 0.000582575798034668, 0.0007441043853759766, 0.0009056329727172852, 0.0010671615600585938, 0.0012286901473999023, 0.001390218734741211, 0.0015517473220825195, 0.0017132759094238281, 0.0018748044967651367, 0.0020363330841064453, 0.002197861671447754, 0.0023593902587890625, 0.002520918846130371, 0.0026824474334716797, 0.0028439760208129883, 0.003005504608154297, 0.0031670331954956055, 0.003328561782836914, 0.0034900903701782227, 0.0036516189575195312, 0.00381314754486084, 0.0039746761322021484, 0.004136204719543457, 0.004297733306884766, 0.004459261894226074, 0.004620790481567383, 0.004782319068908691, 0.00494384765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 7.0, 7.0, 9.0, 11.0, 9.0, 16.0, 21.0, 23.0, 20.0, 23.0, 27.0, 28.0, 34.0, 41.0, 43.0, 47.0, 44.0, 56.0, 56.0, 45.0, 45.0, 56.0, 37.0, 37.0, 30.0, 36.0, 34.0, 31.0, 12.0, 14.0, 22.0, 6.0, 16.0, 17.0, 12.0, 2.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010671615600585938, -0.0010330379009246826, -0.0009989142417907715, -0.0009647905826568604, -0.0009306669235229492, -0.0008965432643890381, -0.000862419605255127, -0.0008282959461212158, -0.0007941722869873047, -0.0007600486278533936, -0.0007259249687194824, -0.0006918013095855713, -0.0006576776504516602, -0.000623553991317749, -0.0005894303321838379, -0.0005553066730499268, -0.0005211830139160156, -0.0004870593547821045, -0.00045293569564819336, -0.0004188120365142822, -0.0003846883773803711, -0.00035056471824645996, -0.00031644105911254883, -0.0002823173999786377, -0.00024819374084472656, -0.00021407008171081543, -0.0001799464225769043, -0.00014582276344299316, -0.00011169910430908203, -7.75754451751709e-05, -4.3451786041259766e-05, -9.328126907348633e-06, 2.47955322265625e-05, 5.891919136047363e-05, 9.304285049438477e-05, 0.0001271665096282959, 0.00016129016876220703, 0.00019541382789611816, 0.0002295374870300293, 0.00026366114616394043, 0.00029778480529785156, 0.0003319084644317627, 0.00036603212356567383, 0.00040015578269958496, 0.0004342794418334961, 0.0004684031009674072, 0.0005025267601013184, 0.0005366504192352295, 0.0005707740783691406, 0.0006048977375030518, 0.0006390213966369629, 0.000673145055770874, 0.0007072687149047852, 0.0007413923740386963, 0.0007755160331726074, 0.0008096396923065186, 0.0008437633514404297, 0.0008778870105743408, 0.000912010669708252, 0.0009461343288421631, 0.0009802579879760742, 0.0010143816471099854, 0.0010485053062438965, 0.0010826289653778076, 0.0011167526245117188]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 4.0, 6.0, 14.0, 11.0, 22.0, 45.0, 53.0, 92.0, 112.0, 132.0, 136.0, 108.0, 83.0, 65.0, 43.0, 24.0, 19.0, 12.0, 7.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.287964403629303, -0.27735719084739685, -0.2667500078678131, -0.256142795085907, -0.24553559720516205, -0.23492839932441711, -0.224321186542511, -0.21371398866176605, -0.20310679078102112, -0.19249959290027618, -0.18189239501953125, -0.17128518223762512, -0.1606779843568802, -0.15007078647613525, -0.13946357369422913, -0.1288563758134842, -0.11824917793273926, -0.10764198005199432, -0.09703477472066879, -0.08642756938934326, -0.07582037150859833, -0.0652131736278534, -0.05460596829652786, -0.04399876296520233, -0.0333915650844574, -0.022784363478422165, -0.012177161872386932, -0.0015699602663516998, 0.009037241339683533, 0.019644442945718765, 0.030251644551753998, 0.04085884988307953, 0.05146604776382446, 0.062073249369859695, 0.07268045097589493, 0.08328765630722046, 0.0938948541879654, 0.10450205206871033, 0.11510925740003586, 0.1257164627313614, 0.13632366061210632, 0.14693085849285126, 0.1575380563735962, 0.16814526915550232, 0.17875246703624725, 0.1893596649169922, 0.19996687769889832, 0.21057407557964325, 0.22118127346038818, 0.23178847134113312, 0.24239566922187805, 0.2530028820037842, 0.2636100649833679, 0.27421727776527405, 0.2848244905471802, 0.2954316735267639, 0.30603888630867004, 0.31664609909057617, 0.3272532820701599, 0.33786049485206604, 0.34846770763397217, 0.3590748906135559, 0.36968210339546204, 0.38028931617736816, 0.3908964991569519]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 16.0, 9.0, 10.0, 13.0, 25.0, 40.0, 36.0, 70.0, 66.0, 70.0, 76.0, 71.0, 59.0, 74.0, 53.0, 67.0, 47.0, 48.0, 34.0, 30.0, 22.0, 20.0, 11.0, 13.0, 10.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15957193076610565, -0.15079165995121002, -0.1420113891363144, -0.13323111832141876, -0.12445084005594254, -0.1156705692410469, -0.10689029097557068, -0.09811002016067505, -0.08932974934577942, -0.08054947853088379, -0.07176920771598816, -0.06298892945051193, -0.0542086586356163, -0.04542838782072067, -0.036648113280534744, -0.027867838740348816, -0.019087567925453186, -0.010307295247912407, -0.0015270225703716278, 0.007253250107169151, 0.01603352278470993, 0.02481379359960556, 0.03359406813979149, 0.04237434267997742, 0.05115461349487305, 0.05993488430976868, 0.0687151551246643, 0.07749543339014053, 0.08627570420503616, 0.0950559750199318, 0.10383625328540802, 0.11261652410030365, 0.12139678001403809, 0.13017705082893372, 0.13895732164382935, 0.14773759245872498, 0.1565178632736206, 0.16529813408851624, 0.17407841980457306, 0.1828586906194687, 0.19163896143436432, 0.20041923224925995, 0.20919950306415558, 0.2179797738790512, 0.22676005959510803, 0.23554033041000366, 0.2443206012248993, 0.2531008720397949, 0.26188114285469055, 0.2706614136695862, 0.2794416844844818, 0.28822195529937744, 0.29700222611427307, 0.3057824969291687, 0.31456276774406433, 0.32334303855895996, 0.332123339176178, 0.3409036099910736, 0.34968388080596924, 0.35846415162086487, 0.3672444224357605, 0.37602469325065613, 0.38480496406555176, 0.3935852646827698, 0.402365505695343]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 2.0, 4.0, 9.0, 7.0, 13.0, 18.0, 32.0, 28.0, 60.0, 56.0, 117.0, 165.0, 257.0, 410.0, 706.0, 1226.0, 2135.0, 4026.0, 8434.0, 21888.0, 78888.0, 427598.0, 392595.0, 72529.0, 20155.0, 8274.0, 3846.0, 2066.0, 1126.0, 712.0, 439.0, 227.0, 155.0, 118.0, 76.0, 48.0, 29.0, 20.0, 22.0, 16.0, 10.0, 4.0, 6.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.095458984375, -0.09256362915039062, -0.08966827392578125, -0.08677291870117188, -0.0838775634765625, -0.08098220825195312, -0.07808685302734375, -0.07519149780273438, -0.072296142578125, -0.06940078735351562, -0.06650543212890625, -0.06361007690429688, -0.0607147216796875, -0.057819366455078125, -0.05492401123046875, -0.052028656005859375, -0.04913330078125, -0.046237945556640625, -0.04334259033203125, -0.040447235107421875, -0.0375518798828125, -0.034656524658203125, -0.03176116943359375, -0.028865814208984375, -0.025970458984375, -0.023075103759765625, -0.02017974853515625, -0.017284393310546875, -0.0143890380859375, -0.011493682861328125, -0.00859832763671875, -0.005702972412109375, -0.0028076171875, 8.7738037109375e-05, 0.00298309326171875, 0.005878448486328125, 0.0087738037109375, 0.011669158935546875, 0.01456451416015625, 0.017459869384765625, 0.020355224609375, 0.023250579833984375, 0.02614593505859375, 0.029041290283203125, 0.0319366455078125, 0.034832000732421875, 0.03772735595703125, 0.040622711181640625, 0.04351806640625, 0.046413421630859375, 0.04930877685546875, 0.052204132080078125, 0.0550994873046875, 0.057994842529296875, 0.06089019775390625, 0.06378555297851562, 0.066680908203125, 0.06957626342773438, 0.07247161865234375, 0.07536697387695312, 0.0782623291015625, 0.08115768432617188, 0.08405303955078125, 0.08694839477539062, 0.08984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 8.0, 5.0, 9.0, 9.0, 5.0, 12.0, 17.0, 13.0, 24.0, 31.0, 35.0, 59.0, 53.0, 58.0, 48.0, 50.0, 66.0, 61.0, 56.0, 59.0, 64.0, 44.0, 35.0, 38.0, 33.0, 21.0, 22.0, 13.0, 17.0, 16.0, 6.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.349365234375, -0.3347969055175781, -0.32022857666015625, -0.3056602478027344, -0.2910919189453125, -0.2765235900878906, -0.26195526123046875, -0.24738693237304688, -0.232818603515625, -0.21825027465820312, -0.20368194580078125, -0.18911361694335938, -0.1745452880859375, -0.15997695922851562, -0.14540863037109375, -0.13084030151367188, -0.11627197265625, -0.10170364379882812, -0.08713531494140625, -0.07256698608398438, -0.0579986572265625, -0.043430328369140625, -0.02886199951171875, -0.014293670654296875, 0.000274658203125, 0.014842987060546875, 0.02941131591796875, 0.043979644775390625, 0.0585479736328125, 0.07311630249023438, 0.08768463134765625, 0.10225296020507812, 0.1168212890625, 0.13138961791992188, 0.14595794677734375, 0.16052627563476562, 0.1750946044921875, 0.18966293334960938, 0.20423126220703125, 0.21879959106445312, 0.233367919921875, 0.24793624877929688, 0.26250457763671875, 0.2770729064941406, 0.2916412353515625, 0.3062095642089844, 0.32077789306640625, 0.3353462219238281, 0.34991455078125, 0.3644828796386719, 0.37905120849609375, 0.3936195373535156, 0.4081878662109375, 0.4227561950683594, 0.43732452392578125, 0.4518928527832031, 0.466461181640625, 0.4810295104980469, 0.49559783935546875, 0.5101661682128906, 0.5247344970703125, 0.5393028259277344, 0.5538711547851562, 0.5684394836425781, 0.5830078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 10.0, 7.0, 8.0, 18.0, 25.0, 48.0, 47.0, 70.0, 90.0, 135.0, 253.0, 449.0, 1514.0, 13078.0, 973749.0, 54884.0, 2642.0, 655.0, 277.0, 188.0, 111.0, 80.0, 62.0, 47.0, 25.0, 18.0, 16.0, 7.0, 8.0, 6.0, 6.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.47998046875, -0.4672393798828125, -0.454498291015625, -0.4417572021484375, -0.42901611328125, -0.4162750244140625, -0.403533935546875, -0.3907928466796875, -0.3780517578125, -0.3653106689453125, -0.352569580078125, -0.3398284912109375, -0.32708740234375, -0.3143463134765625, -0.301605224609375, -0.2888641357421875, -0.276123046875, -0.2633819580078125, -0.250640869140625, -0.2378997802734375, -0.22515869140625, -0.2124176025390625, -0.199676513671875, -0.1869354248046875, -0.1741943359375, -0.1614532470703125, -0.148712158203125, -0.1359710693359375, -0.12322998046875, -0.1104888916015625, -0.097747802734375, -0.0850067138671875, -0.072265625, -0.0595245361328125, -0.046783447265625, -0.0340423583984375, -0.02130126953125, -0.0085601806640625, 0.004180908203125, 0.0169219970703125, 0.0296630859375, 0.0424041748046875, 0.055145263671875, 0.0678863525390625, 0.08062744140625, 0.0933685302734375, 0.106109619140625, 0.1188507080078125, 0.131591796875, 0.1443328857421875, 0.157073974609375, 0.1698150634765625, 0.18255615234375, 0.1952972412109375, 0.208038330078125, 0.2207794189453125, 0.2335205078125, 0.2462615966796875, 0.259002685546875, 0.2717437744140625, 0.28448486328125, 0.2972259521484375, 0.309967041015625, 0.3227081298828125, 0.33544921875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 5.0, 7.0, 14.0, 11.0, 18.0, 22.0, 27.0, 33.0, 28.0, 31.0, 48.0, 44.0, 44.0, 53.0, 57.0, 61.0, 53.0, 65.0, 38.0, 53.0, 41.0, 42.0, 42.0, 20.0, 25.0, 25.0, 14.0, 14.0, 12.0, 7.0, 8.0, 9.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54638671875, -0.52960205078125, -0.5128173828125, -0.49603271484375, -0.479248046875, -0.46246337890625, -0.4456787109375, -0.42889404296875, -0.412109375, -0.39532470703125, -0.3785400390625, -0.36175537109375, -0.344970703125, -0.32818603515625, -0.3114013671875, -0.29461669921875, -0.27783203125, -0.26104736328125, -0.2442626953125, -0.22747802734375, -0.210693359375, -0.19390869140625, -0.1771240234375, -0.16033935546875, -0.1435546875, -0.12677001953125, -0.1099853515625, -0.09320068359375, -0.076416015625, -0.05963134765625, -0.0428466796875, -0.02606201171875, -0.00927734375, 0.00750732421875, 0.0242919921875, 0.04107666015625, 0.057861328125, 0.07464599609375, 0.0914306640625, 0.10821533203125, 0.125, 0.14178466796875, 0.1585693359375, 0.17535400390625, 0.192138671875, 0.20892333984375, 0.2257080078125, 0.24249267578125, 0.25927734375, 0.27606201171875, 0.2928466796875, 0.30963134765625, 0.326416015625, 0.34320068359375, 0.3599853515625, 0.37677001953125, 0.3935546875, 0.41033935546875, 0.4271240234375, 0.44390869140625, 0.460693359375, 0.47747802734375, 0.4942626953125, 0.51104736328125, 0.52783203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 4.0, 3.0, 17.0, 14.0, 36.0, 51.0, 112.0, 276.0, 1363.0, 18740.0, 1007610.0, 18491.0, 1302.0, 279.0, 111.0, 43.0, 22.0, 18.0, 9.0, 13.0, 7.0, 4.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1492919921875, -0.14293861389160156, -0.13658523559570312, -0.1302318572998047, -0.12387847900390625, -0.11752510070800781, -0.11117172241210938, -0.10481834411621094, -0.0984649658203125, -0.09211158752441406, -0.08575820922851562, -0.07940483093261719, -0.07305145263671875, -0.06669807434082031, -0.060344696044921875, -0.05399131774902344, -0.047637939453125, -0.04128456115722656, -0.034931182861328125, -0.028577804565429688, -0.02222442626953125, -0.015871047973632812, -0.009517669677734375, -0.0031642913818359375, 0.0031890869140625, 0.009542465209960938, 0.015895843505859375, 0.022249221801757812, 0.02860260009765625, 0.03495597839355469, 0.041309356689453125, 0.04766273498535156, 0.05401611328125, 0.06036949157714844, 0.06672286987304688, 0.07307624816894531, 0.07942962646484375, 0.08578300476074219, 0.09213638305664062, 0.09848976135253906, 0.1048431396484375, 0.11119651794433594, 0.11754989624023438, 0.12390327453613281, 0.13025665283203125, 0.1366100311279297, 0.14296340942382812, 0.14931678771972656, 0.155670166015625, 0.16202354431152344, 0.16837692260742188, 0.1747303009033203, 0.18108367919921875, 0.1874370574951172, 0.19379043579101562, 0.20014381408691406, 0.2064971923828125, 0.21285057067871094, 0.21920394897460938, 0.2255573272705078, 0.23191070556640625, 0.2382640838623047, 0.24461746215820312, 0.25097084045410156, 0.25732421875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 12.0, 13.0, 26.0, 48.0, 94.0, 216.0, 327.0, 139.0, 58.0, 31.0, 20.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3053417205810547e-05, -1.2537464499473572e-05, -1.2021511793136597e-05, -1.1505559086799622e-05, -1.0989606380462646e-05, -1.0473653674125671e-05, -9.957700967788696e-06, -9.441748261451721e-06, -8.925795555114746e-06, -8.409842848777771e-06, -7.893890142440796e-06, -7.377937436103821e-06, -6.861984729766846e-06, -6.346032023429871e-06, -5.8300793170928955e-06, -5.31412661075592e-06, -4.798173904418945e-06, -4.28222119808197e-06, -3.766268491744995e-06, -3.25031578540802e-06, -2.734363079071045e-06, -2.21841037273407e-06, -1.7024576663970947e-06, -1.1865049600601196e-06, -6.705522537231445e-07, -1.5459954738616943e-07, 3.6135315895080566e-07, 8.773058652877808e-07, 1.3932585716247559e-06, 1.909211277961731e-06, 2.425163984298706e-06, 2.941116690635681e-06, 3.4570693969726562e-06, 3.973022103309631e-06, 4.4889748096466064e-06, 5.0049275159835815e-06, 5.520880222320557e-06, 6.036832928657532e-06, 6.552785634994507e-06, 7.068738341331482e-06, 7.584691047668457e-06, 8.100643754005432e-06, 8.616596460342407e-06, 9.132549166679382e-06, 9.648501873016357e-06, 1.0164454579353333e-05, 1.0680407285690308e-05, 1.1196359992027283e-05, 1.1712312698364258e-05, 1.2228265404701233e-05, 1.2744218111038208e-05, 1.3260170817375183e-05, 1.3776123523712158e-05, 1.4292076230049133e-05, 1.4808028936386108e-05, 1.5323981642723083e-05, 1.583993434906006e-05, 1.6355887055397034e-05, 1.687183976173401e-05, 1.7387792468070984e-05, 1.790374517440796e-05, 1.8419697880744934e-05, 1.893565058708191e-05, 1.9451603293418884e-05, 1.996755599975586e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 10.0, 3.0, 11.0, 18.0, 23.0, 66.0, 179.0, 848.0, 17832.0, 1022429.0, 6356.0, 530.0, 135.0, 53.0, 16.0, 16.0, 9.0, 3.0, 8.0, 2.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.363037109375, -0.35247802734375, -0.3419189453125, -0.33135986328125, -0.32080078125, -0.31024169921875, -0.2996826171875, -0.28912353515625, -0.278564453125, -0.26800537109375, -0.2574462890625, -0.24688720703125, -0.236328125, -0.22576904296875, -0.2152099609375, -0.20465087890625, -0.194091796875, -0.18353271484375, -0.1729736328125, -0.16241455078125, -0.15185546875, -0.14129638671875, -0.1307373046875, -0.12017822265625, -0.109619140625, -0.09906005859375, -0.0885009765625, -0.07794189453125, -0.0673828125, -0.05682373046875, -0.0462646484375, -0.03570556640625, -0.025146484375, -0.01458740234375, -0.0040283203125, 0.00653076171875, 0.01708984375, 0.02764892578125, 0.0382080078125, 0.04876708984375, 0.059326171875, 0.06988525390625, 0.0804443359375, 0.09100341796875, 0.1015625, 0.11212158203125, 0.1226806640625, 0.13323974609375, 0.143798828125, 0.15435791015625, 0.1649169921875, 0.17547607421875, 0.18603515625, 0.19659423828125, 0.2071533203125, 0.21771240234375, 0.228271484375, 0.23883056640625, 0.2493896484375, 0.25994873046875, 0.2705078125, 0.28106689453125, 0.2916259765625, 0.30218505859375, 0.312744140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 7.0, 6.0, 11.0, 8.0, 21.0, 20.0, 44.0, 91.0, 218.0, 253.0, 135.0, 70.0, 41.0, 30.0, 13.0, 10.0, 9.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044952392578125, -0.04341459274291992, -0.041876792907714844, -0.040338993072509766, -0.03880119323730469, -0.03726339340209961, -0.03572559356689453, -0.03418779373168945, -0.032649993896484375, -0.031112194061279297, -0.02957439422607422, -0.02803659439086914, -0.026498794555664062, -0.024960994720458984, -0.023423194885253906, -0.021885395050048828, -0.02034759521484375, -0.018809795379638672, -0.017271995544433594, -0.015734195709228516, -0.014196395874023438, -0.01265859603881836, -0.011120796203613281, -0.009582996368408203, -0.008045196533203125, -0.006507396697998047, -0.004969596862792969, -0.0034317970275878906, -0.0018939971923828125, -0.0003561973571777344, 0.0011816024780273438, 0.002719402313232422, 0.0042572021484375, 0.005795001983642578, 0.007332801818847656, 0.008870601654052734, 0.010408401489257812, 0.01194620132446289, 0.013484001159667969, 0.015021800994873047, 0.016559600830078125, 0.018097400665283203, 0.01963520050048828, 0.02117300033569336, 0.022710800170898438, 0.024248600006103516, 0.025786399841308594, 0.027324199676513672, 0.02886199951171875, 0.030399799346923828, 0.031937599182128906, 0.033475399017333984, 0.03501319885253906, 0.03655099868774414, 0.03808879852294922, 0.0396265983581543, 0.041164398193359375, 0.04270219802856445, 0.04423999786376953, 0.04577779769897461, 0.04731559753417969, 0.048853397369384766, 0.050391197204589844, 0.05192899703979492, 0.053466796875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 12.0, 12.0, 39.0, 56.0, 92.0, 151.0, 169.0, 194.0, 119.0, 66.0, 46.0, 17.0, 9.0, 5.0, 6.0, 0.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.390581339597702, -0.36007341742515564, -0.32956549525260925, -0.29905757308006287, -0.2685496509075165, -0.2380417287349701, -0.2075338065624237, -0.17702588438987732, -0.14651796221733093, -0.11601004004478455, -0.08550211787223816, -0.05499419569969177, -0.024486273527145386, 0.006021648645401001, 0.03652957081794739, 0.06703749299049377, 0.09754541516304016, 0.12805333733558655, 0.15856125950813293, 0.18906918168067932, 0.2195771038532257, 0.2500850260257721, 0.2805929481983185, 0.31110087037086487, 0.34160879254341125, 0.37211671471595764, 0.40262463688850403, 0.4331325590610504, 0.4636404812335968, 0.4941484034061432, 0.5246562957763672, 0.5551642179489136, 0.58567214012146, 0.6161800622940063, 0.6466879844665527, 0.6771959066390991, 0.7077038288116455, 0.7382117509841919, 0.7687196731567383, 0.7992275953292847, 0.829735517501831, 0.8602434396743774, 0.8907513618469238, 0.9212592840194702, 0.9517672061920166, 0.982275128364563, 1.0127830505371094, 1.0432909727096558, 1.0737988948822021, 1.1043068170547485, 1.134814739227295, 1.1653226613998413, 1.1958305835723877, 1.226338505744934, 1.2568464279174805, 1.2873543500900269, 1.3178622722625732, 1.3483701944351196, 1.378878116607666, 1.4093860387802124, 1.4398939609527588, 1.4704018831253052, 1.5009098052978516, 1.531417727470398, 1.5619256496429443]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 5.0, 3.0, 3.0, 1.0, 5.0, 15.0, 15.0, 9.0, 21.0, 18.0, 25.0, 35.0, 29.0, 46.0, 46.0, 41.0, 44.0, 53.0, 59.0, 61.0, 51.0, 58.0, 41.0, 50.0, 37.0, 39.0, 35.0, 33.0, 33.0, 21.0, 14.0, 19.0, 13.0, 11.0, 6.0, 4.0, 9.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7703253030776978, -0.7379761338233948, -0.7056269645690918, -0.673277735710144, -0.6409285664558411, -0.6085793972015381, -0.5762301683425903, -0.5438809990882874, -0.5115318298339844, -0.4791826605796814, -0.44683346152305603, -0.41448426246643066, -0.3821350932121277, -0.3497859239578247, -0.31743672490119934, -0.285087525844574, -0.252738356590271, -0.22038917243480682, -0.18803998827934265, -0.15569080412387848, -0.1233416199684143, -0.09099243581295013, -0.05864325165748596, -0.02629406750202179, 0.006055116653442383, 0.038404300808906555, 0.07075348496437073, 0.1031026691198349, 0.13545185327529907, 0.16780103743076324, 0.20015022158622742, 0.2324994057416916, 0.2648487091064453, 0.2971978783607483, 0.32954707741737366, 0.361896276473999, 0.394245445728302, 0.426594614982605, 0.45894381403923035, 0.4912930130958557, 0.5236421823501587, 0.5559913516044617, 0.5883405208587646, 0.6206897497177124, 0.6530389189720154, 0.6853880882263184, 0.7177373170852661, 0.7500864863395691, 0.7824356555938721, 0.814784824848175, 0.847133994102478, 0.8794832229614258, 0.9118323922157288, 0.9441815614700317, 0.9765307903289795, 1.0088798999786377, 1.0412291288375854, 1.0735783576965332, 1.1059274673461914, 1.1382766962051392, 1.170625925064087, 1.2029750347137451, 1.2353242635726929, 1.267673373222351, 1.3000226020812988]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 11.0, 26.0, 32.0, 62.0, 113.0, 243.0, 473.0, 1114.0, 3038.0, 11284.0, 77024.0, 3201004.0, 866054.0, 25029.0, 5332.0, 1895.0, 788.0, 374.0, 175.0, 69.0, 54.0, 36.0, 13.0, 12.0, 3.0, 10.0, 4.0, 0.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92041015625, -0.8966827392578125, -0.872955322265625, -0.8492279052734375, -0.82550048828125, -0.8017730712890625, -0.778045654296875, -0.7543182373046875, -0.7305908203125, -0.7068634033203125, -0.683135986328125, -0.6594085693359375, -0.63568115234375, -0.6119537353515625, -0.588226318359375, -0.5644989013671875, -0.540771484375, -0.5170440673828125, -0.493316650390625, -0.4695892333984375, -0.44586181640625, -0.4221343994140625, -0.398406982421875, -0.3746795654296875, -0.3509521484375, -0.3272247314453125, -0.303497314453125, -0.2797698974609375, -0.25604248046875, -0.2323150634765625, -0.208587646484375, -0.1848602294921875, -0.1611328125, -0.1374053955078125, -0.113677978515625, -0.0899505615234375, -0.06622314453125, -0.0424957275390625, -0.018768310546875, 0.0049591064453125, 0.0286865234375, 0.0524139404296875, 0.076141357421875, 0.0998687744140625, 0.12359619140625, 0.1473236083984375, 0.171051025390625, 0.1947784423828125, 0.218505859375, 0.2422332763671875, 0.265960693359375, 0.2896881103515625, 0.31341552734375, 0.3371429443359375, 0.360870361328125, 0.3845977783203125, 0.4083251953125, 0.4320526123046875, 0.455780029296875, 0.4795074462890625, 0.50323486328125, 0.5269622802734375, 0.550689697265625, 0.5744171142578125, 0.59814453125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 6.0, 13.0, 7.0, 12.0, 31.0, 26.0, 41.0, 54.0, 74.0, 61.0, 79.0, 84.0, 81.0, 96.0, 67.0, 46.0, 53.0, 50.0, 24.0, 27.0, 21.0, 7.0, 16.0, 13.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.240966796875, -0.22958755493164062, -0.21820831298828125, -0.20682907104492188, -0.1954498291015625, -0.18407058715820312, -0.17269134521484375, -0.16131210327148438, -0.149932861328125, -0.13855361938476562, -0.12717437744140625, -0.11579513549804688, -0.1044158935546875, -0.09303665161132812, -0.08165740966796875, -0.07027816772460938, -0.05889892578125, -0.047519683837890625, -0.03614044189453125, -0.024761199951171875, -0.0133819580078125, -0.002002716064453125, 0.00937652587890625, 0.020755767822265625, 0.032135009765625, 0.043514251708984375, 0.05489349365234375, 0.06627273559570312, 0.0776519775390625, 0.08903121948242188, 0.10041046142578125, 0.11178970336914062, 0.1231689453125, 0.13454818725585938, 0.14592742919921875, 0.15730667114257812, 0.1686859130859375, 0.18006515502929688, 0.19144439697265625, 0.20282363891601562, 0.214202880859375, 0.22558212280273438, 0.23696136474609375, 0.24834060668945312, 0.2597198486328125, 0.2710990905761719, 0.28247833251953125, 0.2938575744628906, 0.30523681640625, 0.3166160583496094, 0.32799530029296875, 0.3393745422363281, 0.3507537841796875, 0.3621330261230469, 0.37351226806640625, 0.3848915100097656, 0.396270751953125, 0.4076499938964844, 0.41902923583984375, 0.4304084777832031, 0.4417877197265625, 0.4531669616699219, 0.46454620361328125, 0.4759254455566406, 0.4873046875]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 7.0, 3.0, 1.0, 4.0, 1.0, 4.0, 11.0, 9.0, 7.0, 14.0, 17.0, 20.0, 38.0, 61.0, 85.0, 164.0, 348.0, 816.0, 2792.0, 18986.0, 2997985.0, 1155018.0, 14326.0, 2158.0, 740.0, 282.0, 159.0, 87.0, 43.0, 33.0, 25.0, 8.0, 9.0, 1.0, 5.0, 8.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9775390625, -0.945953369140625, -0.91436767578125, -0.882781982421875, -0.8511962890625, -0.819610595703125, -0.78802490234375, -0.756439208984375, -0.724853515625, -0.693267822265625, -0.66168212890625, -0.630096435546875, -0.5985107421875, -0.566925048828125, -0.53533935546875, -0.503753662109375, -0.47216796875, -0.440582275390625, -0.40899658203125, -0.377410888671875, -0.3458251953125, -0.314239501953125, -0.28265380859375, -0.251068115234375, -0.219482421875, -0.187896728515625, -0.15631103515625, -0.124725341796875, -0.0931396484375, -0.061553955078125, -0.02996826171875, 0.001617431640625, 0.033203125, 0.064788818359375, 0.09637451171875, 0.127960205078125, 0.1595458984375, 0.191131591796875, 0.22271728515625, 0.254302978515625, 0.285888671875, 0.317474365234375, 0.34906005859375, 0.380645751953125, 0.4122314453125, 0.443817138671875, 0.47540283203125, 0.506988525390625, 0.53857421875, 0.570159912109375, 0.60174560546875, 0.633331298828125, 0.6649169921875, 0.696502685546875, 0.72808837890625, 0.759674072265625, 0.791259765625, 0.822845458984375, 0.85443115234375, 0.886016845703125, 0.9176025390625, 0.949188232421875, 0.98077392578125, 1.012359619140625, 1.0439453125]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 9.0, 11.0, 27.0, 28.0, 50.0, 92.0, 159.0, 496.0, 1121.0, 1185.0, 453.0, 175.0, 98.0, 55.0, 29.0, 25.0, 11.0, 13.0, 8.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.2264404296875, -0.2199726104736328, -0.21350479125976562, -0.20703697204589844, -0.20056915283203125, -0.19410133361816406, -0.18763351440429688, -0.1811656951904297, -0.1746978759765625, -0.1682300567626953, -0.16176223754882812, -0.15529441833496094, -0.14882659912109375, -0.14235877990722656, -0.13589096069335938, -0.1294231414794922, -0.122955322265625, -0.11648750305175781, -0.11001968383789062, -0.10355186462402344, -0.09708404541015625, -0.09061622619628906, -0.08414840698242188, -0.07768058776855469, -0.0712127685546875, -0.06474494934082031, -0.058277130126953125, -0.05180931091308594, -0.04534149169921875, -0.03887367248535156, -0.032405853271484375, -0.025938034057617188, -0.01947021484375, -0.013002395629882812, -0.006534576416015625, -6.67572021484375e-05, 0.00640106201171875, 0.012868881225585938, 0.019336700439453125, 0.025804519653320312, 0.0322723388671875, 0.03874015808105469, 0.045207977294921875, 0.05167579650878906, 0.05814361572265625, 0.06461143493652344, 0.07107925415039062, 0.07754707336425781, 0.084014892578125, 0.09048271179199219, 0.09695053100585938, 0.10341835021972656, 0.10988616943359375, 0.11635398864746094, 0.12282180786132812, 0.1292896270751953, 0.1357574462890625, 0.1422252655029297, 0.14869308471679688, 0.15516090393066406, 0.16162872314453125, 0.16809654235839844, 0.17456436157226562, 0.1810321807861328, 0.1875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 7.0, 11.0, 15.0, 18.0, 30.0, 31.0, 59.0, 59.0, 70.0, 86.0, 108.0, 100.0, 80.0, 90.0, 62.0, 52.0, 30.0, 19.0, 15.0, 24.0, 9.0, 8.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37839633226394653, -0.3649967312812805, -0.3515971302986145, -0.3381975293159485, -0.32479792833328247, -0.31139832735061646, -0.29799869656562805, -0.28459909558296204, -0.271199494600296, -0.25779989361763, -0.244400292634964, -0.23100067675113678, -0.21760107576847076, -0.20420147478580475, -0.19080185890197754, -0.17740225791931152, -0.1640026569366455, -0.1506030559539795, -0.13720345497131348, -0.12380383908748627, -0.11040423810482025, -0.09700463712215424, -0.08360502868890762, -0.07020542025566101, -0.056805819272994995, -0.04340621456503868, -0.030006609857082367, -0.016607005149126053, -0.0032074004411697388, 0.010192200541496277, 0.02359180897474289, 0.0369914174079895, 0.05039098858833313, 0.06379058957099915, 0.07719019800424576, 0.09058980643749237, 0.10398940742015839, 0.1173890084028244, 0.1307886242866516, 0.14418822526931763, 0.15758782625198364, 0.17098742723464966, 0.18438702821731567, 0.19778664410114288, 0.2111862450838089, 0.22458584606647491, 0.23798546195030212, 0.25138506293296814, 0.26478466391563416, 0.27818426489830017, 0.2915838658809662, 0.3049834668636322, 0.3183830976486206, 0.3317826986312866, 0.34518229961395264, 0.35858190059661865, 0.37198150157928467, 0.3853811025619507, 0.3987807035446167, 0.4121803045272827, 0.42557990550994873, 0.43897950649261475, 0.45237913727760315, 0.46577873826026917, 0.4791783392429352]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 8.0, 11.0, 15.0, 17.0, 17.0, 21.0, 27.0, 36.0, 54.0, 54.0, 69.0, 73.0, 81.0, 81.0, 63.0, 70.0, 58.0, 45.0, 50.0, 41.0, 28.0, 20.0, 22.0, 23.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26738089323043823, -0.25571855902671814, -0.24405625462532043, -0.23239392042160034, -0.22073160111904144, -0.20906928181648254, -0.19740694761276245, -0.18574462831020355, -0.17408230900764465, -0.16241998970508575, -0.15075767040252686, -0.13909533619880676, -0.12743301689624786, -0.11577069759368896, -0.10410837084054947, -0.09244604408740997, -0.08078372478485107, -0.06912140548229218, -0.05745907872915268, -0.04579675570130348, -0.034134432673454285, -0.022472109645605087, -0.01080978661775589, 0.000852540135383606, 0.012514859437942505, 0.024177182465791702, 0.0358395054936409, 0.0475018285214901, 0.059164151549339294, 0.0708264708518982, 0.08248879760503769, 0.09415112435817719, 0.1058134138584137, 0.1174757331609726, 0.1291380524635315, 0.1408003866672516, 0.15246270596981049, 0.16412502527236938, 0.17578735947608948, 0.18744967877864838, 0.19911199808120728, 0.21077431738376617, 0.22243663668632507, 0.23409897089004517, 0.24576129019260406, 0.25742360949516296, 0.26908594369888306, 0.28074824810028076, 0.29241058230400085, 0.30407291650772095, 0.31573522090911865, 0.32739755511283875, 0.33905988931655884, 0.35072219371795654, 0.36238452792167664, 0.37404686212539673, 0.38570916652679443, 0.3973715007305145, 0.40903380513191223, 0.4206961393356323, 0.43235844373703003, 0.4440207779407501, 0.4556831121444702, 0.4673454165458679, 0.479007750749588]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 1.0, 5.0, 5.0, 15.0, 11.0, 11.0, 15.0, 25.0, 26.0, 40.0, 58.0, 135.0, 246.0, 750.0, 2871.0, 15596.0, 122133.0, 744313.0, 140559.0, 17131.0, 3178.0, 785.0, 303.0, 129.0, 63.0, 37.0, 29.0, 30.0, 22.0, 9.0, 13.0, 4.0, 0.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13525390625, -0.130340576171875, -0.12542724609375, -0.120513916015625, -0.1156005859375, -0.110687255859375, -0.10577392578125, -0.100860595703125, -0.095947265625, -0.091033935546875, -0.08612060546875, -0.081207275390625, -0.0762939453125, -0.071380615234375, -0.06646728515625, -0.061553955078125, -0.056640625, -0.051727294921875, -0.04681396484375, -0.041900634765625, -0.0369873046875, -0.032073974609375, -0.02716064453125, -0.022247314453125, -0.017333984375, -0.012420654296875, -0.00750732421875, -0.002593994140625, 0.0023193359375, 0.007232666015625, 0.01214599609375, 0.017059326171875, 0.02197265625, 0.026885986328125, 0.03179931640625, 0.036712646484375, 0.0416259765625, 0.046539306640625, 0.05145263671875, 0.056365966796875, 0.061279296875, 0.066192626953125, 0.07110595703125, 0.076019287109375, 0.0809326171875, 0.085845947265625, 0.09075927734375, 0.095672607421875, 0.1005859375, 0.105499267578125, 0.11041259765625, 0.115325927734375, 0.1202392578125, 0.125152587890625, 0.13006591796875, 0.134979248046875, 0.139892578125, 0.144805908203125, 0.14971923828125, 0.154632568359375, 0.1595458984375, 0.164459228515625, 0.16937255859375, 0.174285888671875, 0.17919921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 7.0, 3.0, 8.0, 23.0, 16.0, 22.0, 42.0, 57.0, 73.0, 87.0, 117.0, 97.0, 100.0, 92.0, 78.0, 59.0, 41.0, 31.0, 24.0, 16.0, 13.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.176025390625, -0.16479110717773438, -0.15355682373046875, -0.14232254028320312, -0.1310882568359375, -0.11985397338867188, -0.10861968994140625, -0.09738540649414062, -0.086151123046875, -0.07491683959960938, -0.06368255615234375, -0.052448272705078125, -0.0412139892578125, -0.029979705810546875, -0.01874542236328125, -0.007511138916015625, 0.00372314453125, 0.014957427978515625, 0.02619171142578125, 0.037425994873046875, 0.0486602783203125, 0.059894561767578125, 0.07112884521484375, 0.08236312866210938, 0.093597412109375, 0.10483169555664062, 0.11606597900390625, 0.12730026245117188, 0.1385345458984375, 0.14976882934570312, 0.16100311279296875, 0.17223739624023438, 0.1834716796875, 0.19470596313476562, 0.20594024658203125, 0.21717453002929688, 0.2284088134765625, 0.23964309692382812, 0.25087738037109375, 0.2621116638183594, 0.273345947265625, 0.2845802307128906, 0.29581451416015625, 0.3070487976074219, 0.3182830810546875, 0.3295173645019531, 0.34075164794921875, 0.3519859313964844, 0.36322021484375, 0.3744544982910156, 0.38568878173828125, 0.3969230651855469, 0.4081573486328125, 0.4193916320800781, 0.43062591552734375, 0.4418601989746094, 0.453094482421875, 0.4643287658691406, 0.47556304931640625, 0.4867973327636719, 0.4980316162109375, 0.5092658996582031, 0.5205001831054688, 0.5317344665527344, 0.54296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 9.0, 9.0, 8.0, 11.0, 17.0, 25.0, 41.0, 44.0, 81.0, 98.0, 153.0, 229.0, 323.0, 442.0, 651.0, 1005.0, 1389.0, 2078.0, 3033.0, 4528.0, 6759.0, 10348.0, 16116.0, 25440.0, 41991.0, 71359.0, 120890.0, 184698.0, 198260.0, 142597.0, 83780.0, 49110.0, 29753.0, 18575.0, 11642.0, 7660.0, 5062.0, 3307.0, 2229.0, 1503.0, 1025.0, 682.0, 519.0, 340.0, 220.0, 161.0, 120.0, 80.0, 59.0, 34.0, 28.0, 20.0, 15.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.029266357421875, -0.028356313705444336, -0.027446269989013672, -0.026536226272583008, -0.025626182556152344, -0.02471613883972168, -0.023806095123291016, -0.02289605140686035, -0.021986007690429688, -0.021075963973999023, -0.02016592025756836, -0.019255876541137695, -0.01834583282470703, -0.017435789108276367, -0.016525745391845703, -0.015615701675415039, -0.014705657958984375, -0.013795614242553711, -0.012885570526123047, -0.011975526809692383, -0.011065483093261719, -0.010155439376831055, -0.00924539566040039, -0.008335351943969727, -0.0074253082275390625, -0.0065152645111083984, -0.005605220794677734, -0.00469517707824707, -0.0037851333618164062, -0.002875089645385742, -0.001965045928955078, -0.001055002212524414, -0.00014495849609375, 0.0007650852203369141, 0.0016751289367675781, 0.002585172653198242, 0.0034952163696289062, 0.00440526008605957, 0.005315303802490234, 0.0062253475189208984, 0.0071353912353515625, 0.008045434951782227, 0.00895547866821289, 0.009865522384643555, 0.010775566101074219, 0.011685609817504883, 0.012595653533935547, 0.013505697250366211, 0.014415740966796875, 0.015325784683227539, 0.016235828399658203, 0.017145872116088867, 0.01805591583251953, 0.018965959548950195, 0.01987600326538086, 0.020786046981811523, 0.021696090698242188, 0.02260613441467285, 0.023516178131103516, 0.02442622184753418, 0.025336265563964844, 0.026246309280395508, 0.027156352996826172, 0.028066396713256836, 0.0289764404296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 2.0, 7.0, 8.0, 10.0, 11.0, 6.0, 13.0, 14.0, 23.0, 34.0, 22.0, 29.0, 24.0, 27.0, 38.0, 43.0, 46.0, 45.0, 40.0, 37.0, 45.0, 46.0, 41.0, 40.0, 27.0, 42.0, 42.0, 20.0, 38.0, 18.0, 11.0, 27.0, 17.0, 18.0, 15.0, 14.0, 13.0, 14.0, 6.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2978515625, -0.2875022888183594, -0.27715301513671875, -0.2668037414550781, -0.2564544677734375, -0.24610519409179688, -0.23575592041015625, -0.22540664672851562, -0.215057373046875, -0.20470809936523438, -0.19435882568359375, -0.18400955200195312, -0.1736602783203125, -0.16331100463867188, -0.15296173095703125, -0.14261245727539062, -0.13226318359375, -0.12191390991210938, -0.11156463623046875, -0.10121536254882812, -0.0908660888671875, -0.08051681518554688, -0.07016754150390625, -0.059818267822265625, -0.049468994140625, -0.039119720458984375, -0.02877044677734375, -0.018421173095703125, -0.0080718994140625, 0.002277374267578125, 0.01262664794921875, 0.022975921630859375, 0.0333251953125, 0.043674468994140625, 0.05402374267578125, 0.06437301635742188, 0.0747222900390625, 0.08507156372070312, 0.09542083740234375, 0.10577011108398438, 0.116119384765625, 0.12646865844726562, 0.13681793212890625, 0.14716720581054688, 0.1575164794921875, 0.16786575317382812, 0.17821502685546875, 0.18856430053710938, 0.19891357421875, 0.20926284790039062, 0.21961212158203125, 0.22996139526367188, 0.2403106689453125, 0.2506599426269531, 0.26100921630859375, 0.2713584899902344, 0.281707763671875, 0.2920570373535156, 0.30240631103515625, 0.3127555847167969, 0.3231048583984375, 0.3334541320800781, 0.34380340576171875, 0.3541526794433594, 0.364501953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 14.0, 6.0, 18.0, 17.0, 26.0, 26.0, 47.0, 55.0, 67.0, 107.0, 138.0, 220.0, 331.0, 524.0, 939.0, 1492.0, 2680.0, 4990.0, 9573.0, 19104.0, 38695.0, 81965.0, 167554.0, 264394.0, 223612.0, 118783.0, 56364.0, 27416.0, 13430.0, 6892.0, 3783.0, 2079.0, 1192.0, 683.0, 421.0, 282.0, 189.0, 138.0, 84.0, 64.0, 38.0, 30.0, 29.0, 11.0, 11.0, 16.0, 5.0, 8.0, 4.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.003704071044921875, -0.0035909712314605713, -0.0034778714179992676, -0.003364771604537964, -0.00325167179107666, -0.0031385719776153564, -0.0030254721641540527, -0.002912372350692749, -0.0027992725372314453, -0.0026861727237701416, -0.002573072910308838, -0.002459973096847534, -0.0023468732833862305, -0.0022337734699249268, -0.002120673656463623, -0.0020075738430023193, -0.0018944740295410156, -0.001781374216079712, -0.0016682744026184082, -0.0015551745891571045, -0.0014420747756958008, -0.001328974962234497, -0.0012158751487731934, -0.0011027753353118896, -0.000989675521850586, -0.0008765757083892822, -0.0007634758949279785, -0.0006503760814666748, -0.0005372762680053711, -0.0004241764545440674, -0.00031107664108276367, -0.00019797682762145996, -8.487701416015625e-05, 2.822279930114746e-05, 0.00014132261276245117, 0.0002544224262237549, 0.0003675222396850586, 0.0004806220531463623, 0.000593721866607666, 0.0007068216800689697, 0.0008199214935302734, 0.0009330213069915771, 0.0010461211204528809, 0.0011592209339141846, 0.0012723207473754883, 0.001385420560836792, 0.0014985203742980957, 0.0016116201877593994, 0.0017247200012207031, 0.0018378198146820068, 0.0019509196281433105, 0.0020640194416046143, 0.002177119255065918, 0.0022902190685272217, 0.0024033188819885254, 0.002516418695449829, 0.002629518508911133, 0.0027426183223724365, 0.0028557181358337402, 0.002968817949295044, 0.0030819177627563477, 0.0031950175762176514, 0.003308117389678955, 0.003421217203140259, 0.0035343170166015625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 7.0, 8.0, 7.0, 10.0, 12.0, 19.0, 39.0, 45.0, 44.0, 75.0, 90.0, 105.0, 110.0, 91.0, 67.0, 59.0, 63.0, 41.0, 30.0, 16.0, 15.0, 10.0, 4.0, 5.0, 6.0, 6.0, 8.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.357929229736328e-06, -9.000301361083984e-06, -8.64267349243164e-06, -8.285045623779297e-06, -7.927417755126953e-06, -7.569789886474609e-06, -7.212162017822266e-06, -6.854534149169922e-06, -6.496906280517578e-06, -6.139278411865234e-06, -5.781650543212891e-06, -5.424022674560547e-06, -5.066394805908203e-06, -4.708766937255859e-06, -4.351139068603516e-06, -3.993511199951172e-06, -3.635883331298828e-06, -3.2782554626464844e-06, -2.9206275939941406e-06, -2.562999725341797e-06, -2.205371856689453e-06, -1.8477439880371094e-06, -1.4901161193847656e-06, -1.1324882507324219e-06, -7.748603820800781e-07, -4.172325134277344e-07, -5.960464477539063e-08, 2.980232238769531e-07, 6.556510925292969e-07, 1.0132789611816406e-06, 1.3709068298339844e-06, 1.7285346984863281e-06, 2.086162567138672e-06, 2.4437904357910156e-06, 2.8014183044433594e-06, 3.159046173095703e-06, 3.516674041748047e-06, 3.874301910400391e-06, 4.231929779052734e-06, 4.589557647705078e-06, 4.947185516357422e-06, 5.304813385009766e-06, 5.662441253662109e-06, 6.020069122314453e-06, 6.377696990966797e-06, 6.735324859619141e-06, 7.092952728271484e-06, 7.450580596923828e-06, 7.808208465576172e-06, 8.165836334228516e-06, 8.52346420288086e-06, 8.881092071533203e-06, 9.238719940185547e-06, 9.59634780883789e-06, 9.953975677490234e-06, 1.0311603546142578e-05, 1.0669231414794922e-05, 1.1026859283447266e-05, 1.138448715209961e-05, 1.1742115020751953e-05, 1.2099742889404297e-05, 1.245737075805664e-05, 1.2814998626708984e-05, 1.3172626495361328e-05, 1.3530254364013672e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 9.0, 13.0, 16.0, 19.0, 21.0, 33.0, 41.0, 46.0, 82.0, 101.0, 134.0, 196.0, 341.0, 707.0, 1670.0, 4569.0, 13975.0, 46530.0, 162127.0, 413204.0, 282159.0, 85195.0, 24680.0, 7604.0, 2648.0, 1038.0, 486.0, 259.0, 157.0, 110.0, 86.0, 60.0, 50.0, 30.0, 35.0, 29.0, 20.0, 15.0, 17.0, 3.0, 7.0, 4.0, 5.0, 2.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.00543212890625, -0.00527113676071167, -0.00511014461517334, -0.00494915246963501, -0.00478816032409668, -0.00462716817855835, -0.0044661760330200195, -0.0043051838874816895, -0.004144191741943359, -0.003983199596405029, -0.0038222074508666992, -0.003661215305328369, -0.003500223159790039, -0.003339231014251709, -0.003178238868713379, -0.003017246723175049, -0.0028562545776367188, -0.0026952624320983887, -0.0025342702865600586, -0.0023732781410217285, -0.0022122859954833984, -0.0020512938499450684, -0.0018903017044067383, -0.0017293095588684082, -0.0015683174133300781, -0.001407325267791748, -0.001246333122253418, -0.0010853409767150879, -0.0009243488311767578, -0.0007633566856384277, -0.0006023645401000977, -0.0004413723945617676, -0.0002803802490234375, -0.00011938810348510742, 4.1604042053222656e-05, 0.00020259618759155273, 0.0003635883331298828, 0.0005245804786682129, 0.000685572624206543, 0.000846564769744873, 0.0010075569152832031, 0.0011685490608215332, 0.0013295412063598633, 0.0014905333518981934, 0.0016515254974365234, 0.0018125176429748535, 0.0019735097885131836, 0.0021345019340515137, 0.0022954940795898438, 0.002456486225128174, 0.002617478370666504, 0.002778470516204834, 0.002939462661743164, 0.003100454807281494, 0.0032614469528198242, 0.0034224390983581543, 0.0035834312438964844, 0.0037444233894348145, 0.0039054155349731445, 0.004066407680511475, 0.004227399826049805, 0.004388391971588135, 0.004549384117126465, 0.004710376262664795, 0.004871368408203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 2.0, 13.0, 16.0, 12.0, 10.0, 10.0, 19.0, 21.0, 23.0, 23.0, 30.0, 28.0, 38.0, 39.0, 51.0, 55.0, 60.0, 63.0, 50.0, 41.0, 41.0, 49.0, 33.0, 55.0, 32.0, 24.0, 29.0, 17.0, 30.0, 12.0, 16.0, 13.0, 8.0, 9.0, 4.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00115203857421875, -0.0011134743690490723, -0.0010749101638793945, -0.0010363459587097168, -0.000997781753540039, -0.0009592175483703613, -0.0009206533432006836, -0.0008820891380310059, -0.0008435249328613281, -0.0008049607276916504, -0.0007663965225219727, -0.0007278323173522949, -0.0006892681121826172, -0.0006507039070129395, -0.0006121397018432617, -0.000573575496673584, -0.0005350112915039062, -0.0004964470863342285, -0.0004578828811645508, -0.00041931867599487305, -0.0003807544708251953, -0.0003421902656555176, -0.00030362606048583984, -0.0002650618553161621, -0.00022649765014648438, -0.00018793344497680664, -0.0001493692398071289, -0.00011080503463745117, -7.224082946777344e-05, -3.36766242980957e-05, 4.887580871582031e-06, 4.3451786041259766e-05, 8.20159912109375e-05, 0.00012058019638061523, 0.00015914440155029297, 0.0001977086067199707, 0.00023627281188964844, 0.00027483701705932617, 0.0003134012222290039, 0.00035196542739868164, 0.0003905296325683594, 0.0004290938377380371, 0.00046765804290771484, 0.0005062222480773926, 0.0005447864532470703, 0.000583350658416748, 0.0006219148635864258, 0.0006604790687561035, 0.0006990432739257812, 0.000737607479095459, 0.0007761716842651367, 0.0008147358894348145, 0.0008533000946044922, 0.0008918642997741699, 0.0009304285049438477, 0.0009689927101135254, 0.0010075569152832031, 0.0010461211204528809, 0.0010846853256225586, 0.0011232495307922363, 0.001161813735961914, 0.0012003779411315918, 0.0012389421463012695, 0.0012775063514709473, 0.001316070556640625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 21.0, 64.0, 238.0, 380.0, 209.0, 71.0, 19.0, 9.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1329808235168457, -1.1049716472625732, -1.0769625902175903, -1.0489534139633179, -1.020944356918335, -0.9929351806640625, -0.9649260640144348, -0.9369169473648071, -0.9089078307151794, -0.8808987140655518, -0.8528895974159241, -0.8248804807662964, -0.7968713045120239, -0.768862247467041, -0.7408530712127686, -0.7128439545631409, -0.6848348379135132, -0.6568257212638855, -0.6288166046142578, -0.6008074879646301, -0.5727983713150024, -0.54478919506073, -0.5167800784111023, -0.4887709617614746, -0.4607618451118469, -0.43275272846221924, -0.40474361181259155, -0.3767344653606415, -0.3487253487110138, -0.3207162320613861, -0.29270708560943604, -0.26469796895980835, -0.23668885231018066, -0.20867973566055298, -0.1806706041097641, -0.15266147255897522, -0.12465235590934753, -0.09664323925971985, -0.06863410770893097, -0.04062497615814209, -0.012615859508514404, 0.015393264591693878, 0.04340238869190216, 0.07141151279211044, 0.09942063689231873, 0.1274297535419464, 0.1554388850927353, 0.18344801664352417, 0.21145713329315186, 0.23946624994277954, 0.2674753665924072, 0.2954845130443573, 0.323493629693985, 0.35150274634361267, 0.37951189279556274, 0.40752100944519043, 0.4355301260948181, 0.4635392427444458, 0.4915483593940735, 0.5195574760437012, 0.5475666522979736, 0.5755757093429565, 0.603584885597229, 0.6315940022468567, 0.6596031188964844]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 10.0, 7.0, 13.0, 18.0, 25.0, 30.0, 45.0, 63.0, 75.0, 92.0, 114.0, 103.0, 85.0, 81.0, 70.0, 56.0, 39.0, 31.0, 22.0, 16.0, 11.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16945044696331024, -0.15903118252754211, -0.1486119031906128, -0.13819262385368347, -0.12777335941791534, -0.11735408753156662, -0.1069348156452179, -0.09651554375886917, -0.08609627187252045, -0.07567699998617172, -0.065257728099823, -0.054838456213474274, -0.04441918432712555, -0.033999912440776825, -0.0235806405544281, -0.013161368668079376, -0.002742096781730652, 0.0076771751046180725, 0.018096446990966797, 0.02851571887731552, 0.038934990763664246, 0.04935426265001297, 0.059773534536361694, 0.07019280642271042, 0.08061207830905914, 0.09103135019540787, 0.10145062208175659, 0.11186989396810532, 0.12228916585445404, 0.13270843029022217, 0.1431277096271515, 0.1535469889640808, 0.16396623849868774, 0.17438551783561707, 0.1848047822713852, 0.19522404670715332, 0.20564332604408264, 0.21606260538101196, 0.2264818698167801, 0.23690113425254822, 0.24732041358947754, 0.25773969292640686, 0.2681589722633362, 0.2785782217979431, 0.28899750113487244, 0.29941678047180176, 0.3098360300064087, 0.320255309343338, 0.33067458868026733, 0.34109386801719666, 0.351513147354126, 0.3619323968887329, 0.37235167622566223, 0.38277095556259155, 0.3931902050971985, 0.4036094844341278, 0.41402876377105713, 0.42444804310798645, 0.43486732244491577, 0.4452865719795227, 0.455705851316452, 0.46612513065338135, 0.4765443801879883, 0.4869636595249176, 0.4973829388618469]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 10.0, 13.0, 11.0, 23.0, 43.0, 51.0, 84.0, 131.0, 208.0, 326.0, 548.0, 1077.0, 1975.0, 4032.0, 9520.0, 26378.0, 103876.0, 584071.0, 243223.0, 46358.0, 14685.0, 5926.0, 2718.0, 1407.0, 747.0, 416.0, 240.0, 157.0, 100.0, 73.0, 37.0, 24.0, 29.0, 12.0, 10.0, 7.0, 2.0, 5.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1146240234375, -0.11132335662841797, -0.10802268981933594, -0.1047220230102539, -0.10142135620117188, -0.09812068939208984, -0.09482002258300781, -0.09151935577392578, -0.08821868896484375, -0.08491802215576172, -0.08161735534667969, -0.07831668853759766, -0.07501602172851562, -0.0717153549194336, -0.06841468811035156, -0.06511402130126953, -0.0618133544921875, -0.05851268768310547, -0.05521202087402344, -0.051911354064941406, -0.048610687255859375, -0.045310020446777344, -0.04200935363769531, -0.03870868682861328, -0.03540802001953125, -0.03210735321044922, -0.028806686401367188, -0.025506019592285156, -0.022205352783203125, -0.018904685974121094, -0.015604019165039062, -0.012303352355957031, -0.009002685546875, -0.005702018737792969, -0.0024013519287109375, 0.0008993148803710938, 0.004199981689453125, 0.007500648498535156, 0.010801315307617188, 0.014101982116699219, 0.01740264892578125, 0.02070331573486328, 0.024003982543945312, 0.027304649353027344, 0.030605316162109375, 0.033905982971191406, 0.03720664978027344, 0.04050731658935547, 0.0438079833984375, 0.04710865020751953, 0.05040931701660156, 0.053709983825683594, 0.057010650634765625, 0.060311317443847656, 0.06361198425292969, 0.06691265106201172, 0.07021331787109375, 0.07351398468017578, 0.07681465148925781, 0.08011531829833984, 0.08341598510742188, 0.0867166519165039, 0.09001731872558594, 0.09331798553466797, 0.09661865234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 7.0, 8.0, 7.0, 14.0, 8.0, 15.0, 19.0, 21.0, 28.0, 39.0, 39.0, 42.0, 58.0, 46.0, 73.0, 72.0, 58.0, 47.0, 49.0, 53.0, 52.0, 38.0, 37.0, 46.0, 30.0, 17.0, 17.0, 19.0, 5.0, 11.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.34228515625, -0.33013153076171875, -0.3179779052734375, -0.30582427978515625, -0.293670654296875, -0.28151702880859375, -0.2693634033203125, -0.25720977783203125, -0.24505615234375, -0.23290252685546875, -0.2207489013671875, -0.20859527587890625, -0.196441650390625, -0.18428802490234375, -0.1721343994140625, -0.15998077392578125, -0.1478271484375, -0.13567352294921875, -0.1235198974609375, -0.11136627197265625, -0.099212646484375, -0.08705902099609375, -0.0749053955078125, -0.06275177001953125, -0.05059814453125, -0.03844451904296875, -0.0262908935546875, -0.01413726806640625, -0.001983642578125, 0.01016998291015625, 0.0223236083984375, 0.03447723388671875, 0.046630859375, 0.05878448486328125, 0.0709381103515625, 0.08309173583984375, 0.095245361328125, 0.10739898681640625, 0.1195526123046875, 0.13170623779296875, 0.14385986328125, 0.15601348876953125, 0.1681671142578125, 0.18032073974609375, 0.192474365234375, 0.20462799072265625, 0.2167816162109375, 0.22893524169921875, 0.2410888671875, 0.25324249267578125, 0.2653961181640625, 0.27754974365234375, 0.289703369140625, 0.30185699462890625, 0.3140106201171875, 0.32616424560546875, 0.33831787109375, 0.35047149658203125, 0.3626251220703125, 0.37477874755859375, 0.386932373046875, 0.39908599853515625, 0.4112396240234375, 0.42339324951171875, 0.435546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 9.0, 11.0, 10.0, 24.0, 25.0, 36.0, 52.0, 106.0, 151.0, 254.0, 676.0, 2687.0, 89554.0, 944383.0, 8528.0, 1147.0, 396.0, 201.0, 105.0, 72.0, 41.0, 27.0, 18.0, 10.0, 9.0, 8.0, 1.0, 6.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43603515625, -0.42111968994140625, -0.4062042236328125, -0.39128875732421875, -0.376373291015625, -0.36145782470703125, -0.3465423583984375, -0.33162689208984375, -0.31671142578125, -0.30179595947265625, -0.2868804931640625, -0.27196502685546875, -0.257049560546875, -0.24213409423828125, -0.2272186279296875, -0.21230316162109375, -0.1973876953125, -0.18247222900390625, -0.1675567626953125, -0.15264129638671875, -0.137725830078125, -0.12281036376953125, -0.1078948974609375, -0.09297943115234375, -0.07806396484375, -0.06314849853515625, -0.0482330322265625, -0.03331756591796875, -0.018402099609375, -0.00348663330078125, 0.0114288330078125, 0.02634429931640625, 0.041259765625, 0.05617523193359375, 0.0710906982421875, 0.08600616455078125, 0.100921630859375, 0.11583709716796875, 0.1307525634765625, 0.14566802978515625, 0.16058349609375, 0.17549896240234375, 0.1904144287109375, 0.20532989501953125, 0.220245361328125, 0.23516082763671875, 0.2500762939453125, 0.26499176025390625, 0.2799072265625, 0.29482269287109375, 0.3097381591796875, 0.32465362548828125, 0.339569091796875, 0.35448455810546875, 0.3694000244140625, 0.38431549072265625, 0.39923095703125, 0.41414642333984375, 0.4290618896484375, 0.44397735595703125, 0.458892822265625, 0.47380828857421875, 0.4887237548828125, 0.5036392211914062, 0.5185546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 5.0, 12.0, 15.0, 14.0, 23.0, 24.0, 30.0, 53.0, 55.0, 82.0, 65.0, 86.0, 86.0, 83.0, 86.0, 69.0, 60.0, 51.0, 30.0, 18.0, 19.0, 14.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81201171875, -0.7875137329101562, -0.7630157470703125, -0.7385177612304688, -0.714019775390625, -0.6895217895507812, -0.6650238037109375, -0.6405258178710938, -0.61602783203125, -0.5915298461914062, -0.5670318603515625, -0.5425338745117188, -0.518035888671875, -0.49353790283203125, -0.4690399169921875, -0.44454193115234375, -0.4200439453125, -0.39554595947265625, -0.3710479736328125, -0.34654998779296875, -0.322052001953125, -0.29755401611328125, -0.2730560302734375, -0.24855804443359375, -0.22406005859375, -0.19956207275390625, -0.1750640869140625, -0.15056610107421875, -0.126068115234375, -0.10157012939453125, -0.0770721435546875, -0.05257415771484375, -0.028076171875, -0.00357818603515625, 0.0209197998046875, 0.04541778564453125, 0.069915771484375, 0.09441375732421875, 0.1189117431640625, 0.14340972900390625, 0.16790771484375, 0.19240570068359375, 0.2169036865234375, 0.24140167236328125, 0.265899658203125, 0.29039764404296875, 0.3148956298828125, 0.33939361572265625, 0.3638916015625, 0.38838958740234375, 0.4128875732421875, 0.43738555908203125, 0.461883544921875, 0.48638153076171875, 0.5108795166015625, 0.5353775024414062, 0.55987548828125, 0.5843734741210938, 0.6088714599609375, 0.6333694458007812, 0.657867431640625, 0.6823654174804688, 0.7068634033203125, 0.7313613891601562, 0.755859375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 10.0, 15.0, 20.0, 51.0, 146.0, 659.0, 12198.0, 1027798.0, 6900.0, 517.0, 129.0, 52.0, 17.0, 11.0, 7.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.355712890625, -0.34645843505859375, -0.3372039794921875, -0.32794952392578125, -0.318695068359375, -0.30944061279296875, -0.3001861572265625, -0.29093170166015625, -0.28167724609375, -0.27242279052734375, -0.2631683349609375, -0.25391387939453125, -0.244659423828125, -0.23540496826171875, -0.2261505126953125, -0.21689605712890625, -0.2076416015625, -0.19838714599609375, -0.1891326904296875, -0.17987823486328125, -0.170623779296875, -0.16136932373046875, -0.1521148681640625, -0.14286041259765625, -0.13360595703125, -0.12435150146484375, -0.1150970458984375, -0.10584259033203125, -0.096588134765625, -0.08733367919921875, -0.0780792236328125, -0.06882476806640625, -0.0595703125, -0.05031585693359375, -0.0410614013671875, -0.03180694580078125, -0.022552490234375, -0.01329803466796875, -0.0040435791015625, 0.00521087646484375, 0.01446533203125, 0.02371978759765625, 0.0329742431640625, 0.04222869873046875, 0.051483154296875, 0.06073760986328125, 0.0699920654296875, 0.07924652099609375, 0.0885009765625, 0.09775543212890625, 0.1070098876953125, 0.11626434326171875, 0.125518798828125, 0.13477325439453125, 0.1440277099609375, 0.15328216552734375, 0.16253662109375, 0.17179107666015625, 0.1810455322265625, 0.19029998779296875, 0.199554443359375, 0.20880889892578125, 0.2180633544921875, 0.22731781005859375, 0.236572265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 22.0, 29.0, 42.0, 113.0, 232.0, 285.0, 123.0, 64.0, 30.0, 19.0, 14.0, 4.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7464160919189453e-05, -1.6965903341770172e-05, -1.646764576435089e-05, -1.596938818693161e-05, -1.547113060951233e-05, -1.4972873032093048e-05, -1.4474615454673767e-05, -1.3976357877254486e-05, -1.3478100299835205e-05, -1.2979842722415924e-05, -1.2481585144996643e-05, -1.1983327567577362e-05, -1.1485069990158081e-05, -1.09868124127388e-05, -1.0488554835319519e-05, -9.990297257900238e-06, -9.492039680480957e-06, -8.993782103061676e-06, -8.495524525642395e-06, -7.997266948223114e-06, -7.499009370803833e-06, -7.000751793384552e-06, -6.502494215965271e-06, -6.00423663854599e-06, -5.505979061126709e-06, -5.007721483707428e-06, -4.509463906288147e-06, -4.011206328868866e-06, -3.512948751449585e-06, -3.014691174030304e-06, -2.516433596611023e-06, -2.018176019191742e-06, -1.519918441772461e-06, -1.02166086435318e-06, -5.234032869338989e-07, -2.514570951461792e-08, 4.731118679046631e-07, 9.71369445323944e-07, 1.469627022743225e-06, 1.967884600162506e-06, 2.466142177581787e-06, 2.964399755001068e-06, 3.462657332420349e-06, 3.96091490983963e-06, 4.459172487258911e-06, 4.957430064678192e-06, 5.455687642097473e-06, 5.953945219516754e-06, 6.452202796936035e-06, 6.950460374355316e-06, 7.448717951774597e-06, 7.946975529193878e-06, 8.44523310661316e-06, 8.94349068403244e-06, 9.441748261451721e-06, 9.940005838871002e-06, 1.0438263416290283e-05, 1.0936520993709564e-05, 1.1434778571128845e-05, 1.1933036148548126e-05, 1.2431293725967407e-05, 1.2929551303386688e-05, 1.342780888080597e-05, 1.392606645822525e-05, 1.4424324035644531e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 14.0, 14.0, 18.0, 49.0, 166.0, 822.0, 6119.0, 996840.0, 42126.0, 1911.0, 315.0, 76.0, 29.0, 13.0, 11.0, 4.0, 7.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2379150390625, -0.2290172576904297, -0.22011947631835938, -0.21122169494628906, -0.20232391357421875, -0.19342613220214844, -0.18452835083007812, -0.1756305694580078, -0.1667327880859375, -0.1578350067138672, -0.14893722534179688, -0.14003944396972656, -0.13114166259765625, -0.12224388122558594, -0.11334609985351562, -0.10444831848144531, -0.095550537109375, -0.08665275573730469, -0.07775497436523438, -0.06885719299316406, -0.05995941162109375, -0.05106163024902344, -0.042163848876953125, -0.03326606750488281, -0.0243682861328125, -0.015470504760742188, -0.006572723388671875, 0.0023250579833984375, 0.01122283935546875, 0.020120620727539062, 0.029018402099609375, 0.03791618347167969, 0.04681396484375, 0.05571174621582031, 0.06460952758789062, 0.07350730895996094, 0.08240509033203125, 0.09130287170410156, 0.10020065307617188, 0.10909843444824219, 0.1179962158203125, 0.1268939971923828, 0.13579177856445312, 0.14468955993652344, 0.15358734130859375, 0.16248512268066406, 0.17138290405273438, 0.1802806854248047, 0.189178466796875, 0.1980762481689453, 0.20697402954101562, 0.21587181091308594, 0.22476959228515625, 0.23366737365722656, 0.24256515502929688, 0.2514629364013672, 0.2603607177734375, 0.2692584991455078, 0.2781562805175781, 0.28705406188964844, 0.29595184326171875, 0.30484962463378906, 0.3137474060058594, 0.3226451873779297, 0.33154296875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 2.0, 7.0, 10.0, 13.0, 23.0, 39.0, 76.0, 156.0, 311.0, 151.0, 75.0, 56.0, 28.0, 14.0, 10.0, 8.0, 10.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05426025390625, -0.05281209945678711, -0.05136394500732422, -0.04991579055786133, -0.04846763610839844, -0.04701948165893555, -0.045571327209472656, -0.044123172760009766, -0.042675018310546875, -0.041226863861083984, -0.039778709411621094, -0.0383305549621582, -0.03688240051269531, -0.03543424606323242, -0.03398609161376953, -0.03253793716430664, -0.03108978271484375, -0.02964162826538086, -0.02819347381591797, -0.026745319366455078, -0.025297164916992188, -0.023849010467529297, -0.022400856018066406, -0.020952701568603516, -0.019504547119140625, -0.018056392669677734, -0.016608238220214844, -0.015160083770751953, -0.013711929321289062, -0.012263774871826172, -0.010815620422363281, -0.00936746597290039, -0.0079193115234375, -0.006471157073974609, -0.005023002624511719, -0.003574848175048828, -0.0021266937255859375, -0.0006785392761230469, 0.0007696151733398438, 0.0022177696228027344, 0.003665924072265625, 0.005114078521728516, 0.006562232971191406, 0.008010387420654297, 0.009458541870117188, 0.010906696319580078, 0.012354850769042969, 0.01380300521850586, 0.01525115966796875, 0.01669931411743164, 0.01814746856689453, 0.019595623016357422, 0.021043777465820312, 0.022491931915283203, 0.023940086364746094, 0.025388240814208984, 0.026836395263671875, 0.028284549713134766, 0.029732704162597656, 0.031180858612060547, 0.03262901306152344, 0.03407716751098633, 0.03552532196044922, 0.03697347640991211, 0.038421630859375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 14.0, 11.0, 21.0, 23.0, 46.0, 78.0, 87.0, 131.0, 128.0, 107.0, 113.0, 74.0, 58.0, 31.0, 21.0, 19.0, 13.0, 10.0, 4.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.486520379781723, -0.4683418273925781, -0.4501632750034332, -0.43198472261428833, -0.4138062000274658, -0.39562761783599854, -0.377449095249176, -0.35927054286003113, -0.34109199047088623, -0.32291343808174133, -0.30473488569259644, -0.28655633330345154, -0.26837778091430664, -0.25019925832748413, -0.23202070593833923, -0.21384215354919434, -0.19566360116004944, -0.17748504877090454, -0.15930649638175964, -0.14112795889377594, -0.12294940650463104, -0.10477085411548615, -0.08659230917692184, -0.06841376423835754, -0.050235211849212646, -0.03205666318535805, -0.013878114521503448, 0.0043004341423511505, 0.02247898280620575, 0.04065753519535065, 0.05883608013391495, 0.07701462507247925, 0.09519320726394653, 0.11337175965309143, 0.13155031204223633, 0.14972884953022003, 0.16790740191936493, 0.18608595430850983, 0.20426449179649353, 0.22244304418563843, 0.24062159657478333, 0.2588001489639282, 0.2769787013530731, 0.295157253742218, 0.3133357763290405, 0.3315143585205078, 0.3496928811073303, 0.3678714334964752, 0.3860499858856201, 0.404228538274765, 0.4224070906639099, 0.4405856430530548, 0.4587641954421997, 0.4769427180290222, 0.4951212704181671, 0.513299822807312, 0.5314784049987793, 0.5496569275856018, 0.5678355097770691, 0.5860140323638916, 0.6041926145553589, 0.6223711371421814, 0.6405497193336487, 0.6587282419204712, 0.6769067645072937]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 2.0, 5.0, 4.0, 5.0, 6.0, 16.0, 19.0, 18.0, 34.0, 48.0, 46.0, 56.0, 62.0, 53.0, 61.0, 56.0, 65.0, 76.0, 62.0, 57.0, 51.0, 39.0, 52.0, 26.0, 25.0, 18.0, 18.0, 11.0, 9.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7541993260383606, -0.7166398763656616, -0.6790804266929626, -0.6415209770202637, -0.6039614677429199, -0.5664020776748657, -0.528842568397522, -0.491283118724823, -0.453723669052124, -0.41616421937942505, -0.3786047697067261, -0.3410452902317047, -0.30348584055900574, -0.26592639088630676, -0.2283669263124466, -0.19080746173858643, -0.15324801206588745, -0.11568855494260788, -0.07812909781932831, -0.04056964069604874, -0.003010183572769165, 0.03454926609992981, 0.07210873067378998, 0.10966819524765015, 0.14722764492034912, 0.1847870945930481, 0.22234655916690826, 0.25990602374076843, 0.2974654734134674, 0.3350249230861664, 0.37258440256118774, 0.4101438522338867, 0.4477032423019409, 0.4852626919746399, 0.5228221416473389, 0.5603815913200378, 0.5979410409927368, 0.6355005502700806, 0.6730599999427795, 0.7106194496154785, 0.7481788992881775, 0.7857383489608765, 0.8232977986335754, 0.8608572483062744, 0.8984167575836182, 0.9359761476516724, 0.9735356569290161, 1.0110950469970703, 1.048654556274414, 1.0862140655517578, 1.123773455619812, 1.1613329648971558, 1.19889235496521, 1.2364518642425537, 1.274011254310608, 1.3115707635879517, 1.3491301536560059, 1.3866896629333496, 1.4242490530014038, 1.4618085622787476, 1.4993679523468018, 1.5369274616241455, 1.5744868516921997, 1.6120463609695435, 1.6496058702468872]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 1.0, 14.0, 19.0, 43.0, 95.0, 161.0, 357.0, 966.0, 2717.0, 7777.0, 29259.0, 1369451.0, 2728145.0, 44502.0, 6930.0, 2248.0, 775.0, 394.0, 173.0, 92.0, 59.0, 42.0, 25.0, 13.0, 6.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43798828125, -0.41815948486328125, -0.3983306884765625, -0.37850189208984375, -0.358673095703125, -0.33884429931640625, -0.3190155029296875, -0.29918670654296875, -0.27935791015625, -0.25952911376953125, -0.2397003173828125, -0.21987152099609375, -0.200042724609375, -0.18021392822265625, -0.1603851318359375, -0.14055633544921875, -0.1207275390625, -0.10089874267578125, -0.0810699462890625, -0.06124114990234375, -0.041412353515625, -0.02158355712890625, -0.0017547607421875, 0.01807403564453125, 0.03790283203125, 0.05773162841796875, 0.0775604248046875, 0.09738922119140625, 0.117218017578125, 0.13704681396484375, 0.1568756103515625, 0.17670440673828125, 0.196533203125, 0.21636199951171875, 0.2361907958984375, 0.25601959228515625, 0.275848388671875, 0.29567718505859375, 0.3155059814453125, 0.33533477783203125, 0.35516357421875, 0.37499237060546875, 0.3948211669921875, 0.41464996337890625, 0.434478759765625, 0.45430755615234375, 0.4741363525390625, 0.49396514892578125, 0.5137939453125, 0.5336227416992188, 0.5534515380859375, 0.5732803344726562, 0.593109130859375, 0.6129379272460938, 0.6327667236328125, 0.6525955200195312, 0.67242431640625, 0.6922531127929688, 0.7120819091796875, 0.7319107055664062, 0.751739501953125, 0.7715682983398438, 0.7913970947265625, 0.8112258911132812, 0.8310546875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 16.0, 25.0, 18.0, 21.0, 45.0, 70.0, 76.0, 103.0, 85.0, 115.0, 90.0, 71.0, 75.0, 43.0, 48.0, 26.0, 29.0, 13.0, 10.0, 2.0, 4.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1922607421875, -0.1811389923095703, -0.17001724243164062, -0.15889549255371094, -0.14777374267578125, -0.13665199279785156, -0.12553024291992188, -0.11440849304199219, -0.1032867431640625, -0.09216499328613281, -0.08104324340820312, -0.06992149353027344, -0.05879974365234375, -0.04767799377441406, -0.036556243896484375, -0.025434494018554688, -0.014312744140625, -0.0031909942626953125, 0.007930755615234375, 0.019052505493164062, 0.03017425537109375, 0.04129600524902344, 0.052417755126953125, 0.06353950500488281, 0.0746612548828125, 0.08578300476074219, 0.09690475463867188, 0.10802650451660156, 0.11914825439453125, 0.13027000427246094, 0.14139175415039062, 0.1525135040283203, 0.16363525390625, 0.1747570037841797, 0.18587875366210938, 0.19700050354003906, 0.20812225341796875, 0.21924400329589844, 0.23036575317382812, 0.2414875030517578, 0.2526092529296875, 0.2637310028076172, 0.2748527526855469, 0.28597450256347656, 0.29709625244140625, 0.30821800231933594, 0.3193397521972656, 0.3304615020751953, 0.341583251953125, 0.3527050018310547, 0.3638267517089844, 0.37494850158691406, 0.38607025146484375, 0.39719200134277344, 0.4083137512207031, 0.4194355010986328, 0.4305572509765625, 0.4416790008544922, 0.4528007507324219, 0.46392250061035156, 0.47504425048828125, 0.48616600036621094, 0.4972877502441406, 0.5084095001220703, 0.51953125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 8.0, 17.0, 21.0, 28.0, 64.0, 174.0, 539.0, 3168.0, 160647.0, 4020360.0, 7742.0, 1010.0, 277.0, 110.0, 38.0, 26.0, 15.0, 9.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97412109375, -0.9281234741210938, -0.8821258544921875, -0.8361282348632812, -0.790130615234375, -0.7441329956054688, -0.6981353759765625, -0.6521377563476562, -0.60614013671875, -0.5601425170898438, -0.5141448974609375, -0.46814727783203125, -0.422149658203125, -0.37615203857421875, -0.3301544189453125, -0.28415679931640625, -0.2381591796875, -0.19216156005859375, -0.1461639404296875, -0.10016632080078125, -0.054168701171875, -0.00817108154296875, 0.0378265380859375, 0.08382415771484375, 0.12982177734375, 0.17581939697265625, 0.2218170166015625, 0.26781463623046875, 0.313812255859375, 0.35980987548828125, 0.4058074951171875, 0.45180511474609375, 0.497802734375, 0.5438003540039062, 0.5897979736328125, 0.6357955932617188, 0.681793212890625, 0.7277908325195312, 0.7737884521484375, 0.8197860717773438, 0.86578369140625, 0.9117813110351562, 0.9577789306640625, 1.0037765502929688, 1.049774169921875, 1.0957717895507812, 1.1417694091796875, 1.1877670288085938, 1.2337646484375, 1.2797622680664062, 1.3257598876953125, 1.3717575073242188, 1.417755126953125, 1.4637527465820312, 1.5097503662109375, 1.5557479858398438, 1.60174560546875, 1.6477432250976562, 1.6937408447265625, 1.7397384643554688, 1.785736083984375, 1.8317337036132812, 1.8777313232421875, 1.9237289428710938, 1.9697265625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 2.0, 17.0, 23.0, 52.0, 107.0, 321.0, 1489.0, 1519.0, 327.0, 105.0, 45.0, 29.0, 11.0, 5.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.344970703125, -0.33695030212402344, -0.3289299011230469, -0.3209095001220703, -0.31288909912109375, -0.3048686981201172, -0.2968482971191406, -0.28882789611816406, -0.2808074951171875, -0.27278709411621094, -0.2647666931152344, -0.2567462921142578, -0.24872589111328125, -0.2407054901123047, -0.23268508911132812, -0.22466468811035156, -0.216644287109375, -0.20862388610839844, -0.20060348510742188, -0.1925830841064453, -0.18456268310546875, -0.1765422821044922, -0.16852188110351562, -0.16050148010253906, -0.1524810791015625, -0.14446067810058594, -0.13644027709960938, -0.1284198760986328, -0.12039947509765625, -0.11237907409667969, -0.10435867309570312, -0.09633827209472656, -0.08831787109375, -0.08029747009277344, -0.07227706909179688, -0.06425666809082031, -0.05623626708984375, -0.04821586608886719, -0.040195465087890625, -0.03217506408691406, -0.0241546630859375, -0.016134262084960938, -0.008113861083984375, -9.34600830078125e-05, 0.00792694091796875, 0.015947341918945312, 0.023967742919921875, 0.03198814392089844, 0.040008544921875, 0.04802894592285156, 0.056049346923828125, 0.06406974792480469, 0.07209014892578125, 0.08011054992675781, 0.08813095092773438, 0.09615135192871094, 0.1041717529296875, 0.11219215393066406, 0.12021255493164062, 0.1282329559326172, 0.13625335693359375, 0.1442737579345703, 0.15229415893554688, 0.16031455993652344, 0.1683349609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 12.0, 20.0, 20.0, 40.0, 54.0, 85.0, 129.0, 118.0, 132.0, 106.0, 84.0, 69.0, 56.0, 39.0, 14.0, 12.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5826481580734253, -0.566158652305603, -0.5496692061424255, -0.5331797003746033, -0.516690194606781, -0.5002007484436035, -0.48371124267578125, -0.46722176671028137, -0.4507322907447815, -0.4342428147792816, -0.41775330901145935, -0.4012638330459595, -0.3847743570804596, -0.3682848811149597, -0.35179537534713745, -0.3353058993816376, -0.3188163936138153, -0.30232691764831543, -0.28583741188049316, -0.2693479359149933, -0.2528584599494934, -0.23636896908283234, -0.21987947821617126, -0.2033900022506714, -0.18690051138401031, -0.17041102051734924, -0.15392154455184937, -0.1374320536851883, -0.12094257026910782, -0.10445308685302734, -0.08796359598636627, -0.0714741125702858, -0.05498462915420532, -0.03849514573812485, -0.022005658596754074, -0.005516171455383301, 0.010973311960697174, 0.02746279537677765, 0.04395228624343872, 0.060441769659519196, 0.07693125307559967, 0.09342073649168015, 0.10991021990776062, 0.1263997107744217, 0.14288920164108276, 0.15937867760658264, 0.1758681684732437, 0.19235765933990479, 0.20884713530540466, 0.22533662617206573, 0.2418261021375656, 0.2583155930042267, 0.27480506896972656, 0.29129457473754883, 0.3077840507030487, 0.3242735266685486, 0.34076303243637085, 0.3572525084018707, 0.373742014169693, 0.39023149013519287, 0.40672096610069275, 0.4232104420661926, 0.4396999478340149, 0.45618942379951477, 0.47267889976501465]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 7.0, 11.0, 16.0, 13.0, 17.0, 27.0, 33.0, 44.0, 39.0, 56.0, 60.0, 57.0, 65.0, 69.0, 65.0, 65.0, 56.0, 52.0, 48.0, 32.0, 38.0, 36.0, 25.0, 16.0, 14.0, 12.0, 9.0, 5.0, 4.0, 6.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22549353539943695, -0.2163005769252777, -0.20710763335227966, -0.19791467487812042, -0.18872173130512238, -0.17952877283096313, -0.1703358292579651, -0.16114287078380585, -0.1519499123096466, -0.14275695383548737, -0.13356401026248932, -0.12437105178833008, -0.11517810821533203, -0.10598514974117279, -0.09679219871759415, -0.0875992476940155, -0.07840630412101746, -0.06921335309743881, -0.06002040207386017, -0.050827447324991226, -0.04163449630141258, -0.03244154527783394, -0.023248590528964996, -0.014055639505386353, -0.004862688481807709, 0.00433026347309351, 0.013523215427994728, 0.02271616831421852, 0.031909119337797165, 0.04110207036137581, 0.05029502511024475, 0.059487976133823395, 0.06868094205856323, 0.07787389308214188, 0.08706684410572052, 0.09625980257987976, 0.10545274615287781, 0.11464570462703705, 0.12383865565061569, 0.13303160667419434, 0.14222455024719238, 0.15141750872135162, 0.16061045229434967, 0.1698034107685089, 0.17899635434150696, 0.1881893128156662, 0.19738227128982544, 0.2065752148628235, 0.21576817333698273, 0.22496113181114197, 0.23415407538414001, 0.24334703385829926, 0.2525399923324585, 0.26173293590545654, 0.2709258794784546, 0.28011882305145264, 0.28931179642677307, 0.2985047399997711, 0.30769771337509155, 0.3168906569480896, 0.32608360052108765, 0.3352765440940857, 0.34446951746940613, 0.3536624610424042, 0.3628554046154022]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 10.0, 17.0, 16.0, 36.0, 44.0, 61.0, 152.0, 247.0, 542.0, 1154.0, 3006.0, 8689.0, 30581.0, 151475.0, 607662.0, 192744.0, 35888.0, 10176.0, 3482.0, 1358.0, 583.0, 249.0, 147.0, 104.0, 32.0, 33.0, 15.0, 12.0, 7.0, 7.0, 7.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08392333984375, -0.08098506927490234, -0.07804679870605469, -0.07510852813720703, -0.07217025756835938, -0.06923198699951172, -0.06629371643066406, -0.0633554458618164, -0.06041717529296875, -0.057478904724121094, -0.05454063415527344, -0.05160236358642578, -0.048664093017578125, -0.04572582244873047, -0.04278755187988281, -0.039849281311035156, -0.0369110107421875, -0.033972740173339844, -0.031034469604492188, -0.02809619903564453, -0.025157928466796875, -0.02221965789794922, -0.019281387329101562, -0.016343116760253906, -0.01340484619140625, -0.010466575622558594, -0.0075283050537109375, -0.004590034484863281, -0.001651763916015625, 0.0012865066528320312, 0.0042247772216796875, 0.007163047790527344, 0.010101318359375, 0.013039588928222656, 0.015977859497070312, 0.01891613006591797, 0.021854400634765625, 0.02479267120361328, 0.027730941772460938, 0.030669212341308594, 0.03360748291015625, 0.036545753479003906, 0.03948402404785156, 0.04242229461669922, 0.045360565185546875, 0.04829883575439453, 0.05123710632324219, 0.054175376892089844, 0.0571136474609375, 0.060051918029785156, 0.06299018859863281, 0.06592845916748047, 0.06886672973632812, 0.07180500030517578, 0.07474327087402344, 0.0776815414428711, 0.08061981201171875, 0.0835580825805664, 0.08649635314941406, 0.08943462371826172, 0.09237289428710938, 0.09531116485595703, 0.09824943542480469, 0.10118770599365234, 0.1041259765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 10.0, 19.0, 7.0, 14.0, 30.0, 33.0, 41.0, 39.0, 63.0, 71.0, 79.0, 67.0, 67.0, 63.0, 65.0, 63.0, 51.0, 46.0, 41.0, 40.0, 27.0, 13.0, 13.0, 18.0, 6.0, 5.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12744140625, -0.12094879150390625, -0.1144561767578125, -0.10796356201171875, -0.101470947265625, -0.09497833251953125, -0.0884857177734375, -0.08199310302734375, -0.07550048828125, -0.06900787353515625, -0.0625152587890625, -0.05602264404296875, -0.049530029296875, -0.04303741455078125, -0.0365447998046875, -0.03005218505859375, -0.0235595703125, -0.01706695556640625, -0.0105743408203125, -0.00408172607421875, 0.002410888671875, 0.00890350341796875, 0.0153961181640625, 0.02188873291015625, 0.02838134765625, 0.03487396240234375, 0.0413665771484375, 0.04785919189453125, 0.054351806640625, 0.06084442138671875, 0.0673370361328125, 0.07382965087890625, 0.080322265625, 0.08681488037109375, 0.0933074951171875, 0.09980010986328125, 0.106292724609375, 0.11278533935546875, 0.1192779541015625, 0.12577056884765625, 0.13226318359375, 0.13875579833984375, 0.1452484130859375, 0.15174102783203125, 0.158233642578125, 0.16472625732421875, 0.1712188720703125, 0.17771148681640625, 0.1842041015625, 0.19069671630859375, 0.1971893310546875, 0.20368194580078125, 0.210174560546875, 0.21666717529296875, 0.2231597900390625, 0.22965240478515625, 0.23614501953125, 0.24263763427734375, 0.2491302490234375, 0.25562286376953125, 0.262115478515625, 0.26860809326171875, 0.2751007080078125, 0.28159332275390625, 0.2880859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 14.0, 8.0, 12.0, 6.0, 21.0, 28.0, 34.0, 30.0, 42.0, 57.0, 113.0, 125.0, 184.0, 275.0, 449.0, 708.0, 1218.0, 2267.0, 4555.0, 9025.0, 19428.0, 43897.0, 111230.0, 285641.0, 329241.0, 140013.0, 53790.0, 23453.0, 10802.0, 5355.0, 2731.0, 1406.0, 821.0, 501.0, 307.0, 198.0, 134.0, 107.0, 69.0, 61.0, 45.0, 30.0, 25.0, 30.0, 15.0, 11.0, 8.0, 8.0, 8.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.042022705078125, -0.040714263916015625, -0.03940582275390625, -0.038097381591796875, -0.0367889404296875, -0.035480499267578125, -0.03417205810546875, -0.032863616943359375, -0.03155517578125, -0.030246734619140625, -0.02893829345703125, -0.027629852294921875, -0.0263214111328125, -0.025012969970703125, -0.02370452880859375, -0.022396087646484375, -0.021087646484375, -0.019779205322265625, -0.01847076416015625, -0.017162322998046875, -0.0158538818359375, -0.014545440673828125, -0.01323699951171875, -0.011928558349609375, -0.0106201171875, -0.009311676025390625, -0.00800323486328125, -0.006694793701171875, -0.0053863525390625, -0.004077911376953125, -0.00276947021484375, -0.001461029052734375, -0.000152587890625, 0.001155853271484375, 0.00246429443359375, 0.003772735595703125, 0.0050811767578125, 0.006389617919921875, 0.00769805908203125, 0.009006500244140625, 0.01031494140625, 0.011623382568359375, 0.01293182373046875, 0.014240264892578125, 0.0155487060546875, 0.016857147216796875, 0.01816558837890625, 0.019474029541015625, 0.020782470703125, 0.022090911865234375, 0.02339935302734375, 0.024707794189453125, 0.0260162353515625, 0.027324676513671875, 0.02863311767578125, 0.029941558837890625, 0.03125, 0.032558441162109375, 0.03386688232421875, 0.035175323486328125, 0.0364837646484375, 0.037792205810546875, 0.03910064697265625, 0.040409088134765625, 0.041717529296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 9.0, 7.0, 20.0, 24.0, 30.0, 33.0, 41.0, 62.0, 78.0, 66.0, 70.0, 81.0, 81.0, 78.0, 67.0, 56.0, 51.0, 37.0, 36.0, 21.0, 16.0, 14.0, 8.0, 6.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46484375, -0.449676513671875, -0.43450927734375, -0.419342041015625, -0.4041748046875, -0.389007568359375, -0.37384033203125, -0.358673095703125, -0.343505859375, -0.328338623046875, -0.31317138671875, -0.298004150390625, -0.2828369140625, -0.267669677734375, -0.25250244140625, -0.237335205078125, -0.22216796875, -0.207000732421875, -0.19183349609375, -0.176666259765625, -0.1614990234375, -0.146331787109375, -0.13116455078125, -0.115997314453125, -0.100830078125, -0.085662841796875, -0.07049560546875, -0.055328369140625, -0.0401611328125, -0.024993896484375, -0.00982666015625, 0.005340576171875, 0.0205078125, 0.035675048828125, 0.05084228515625, 0.066009521484375, 0.0811767578125, 0.096343994140625, 0.11151123046875, 0.126678466796875, 0.141845703125, 0.157012939453125, 0.17218017578125, 0.187347412109375, 0.2025146484375, 0.217681884765625, 0.23284912109375, 0.248016357421875, 0.26318359375, 0.278350830078125, 0.29351806640625, 0.308685302734375, 0.3238525390625, 0.339019775390625, 0.35418701171875, 0.369354248046875, 0.384521484375, 0.399688720703125, 0.41485595703125, 0.430023193359375, 0.4451904296875, 0.460357666015625, 0.47552490234375, 0.490692138671875, 0.505859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 9.0, 4.0, 12.0, 9.0, 19.0, 29.0, 39.0, 51.0, 76.0, 96.0, 112.0, 152.0, 219.0, 349.0, 511.0, 773.0, 1232.0, 2107.0, 3695.0, 7341.0, 15950.0, 41668.0, 120055.0, 310934.0, 329323.0, 132883.0, 45415.0, 17563.0, 7776.0, 4029.0, 2194.0, 1322.0, 821.0, 518.0, 384.0, 249.0, 179.0, 121.0, 78.0, 64.0, 46.0, 35.0, 34.0, 22.0, 20.0, 10.0, 7.0, 11.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.00421142578125, -0.004083991050720215, -0.00395655632019043, -0.0038291215896606445, -0.0037016868591308594, -0.0035742521286010742, -0.003446817398071289, -0.003319382667541504, -0.0031919479370117188, -0.0030645132064819336, -0.0029370784759521484, -0.0028096437454223633, -0.002682209014892578, -0.002554774284362793, -0.002427339553833008, -0.0022999048233032227, -0.0021724700927734375, -0.0020450353622436523, -0.0019176006317138672, -0.001790165901184082, -0.0016627311706542969, -0.0015352964401245117, -0.0014078617095947266, -0.0012804269790649414, -0.0011529922485351562, -0.001025557518005371, -0.0008981227874755859, -0.0007706880569458008, -0.0006432533264160156, -0.0005158185958862305, -0.0003883838653564453, -0.00026094913482666016, -0.000133514404296875, -6.079673767089844e-06, 0.00012135505676269531, 0.00024878978729248047, 0.0003762245178222656, 0.0005036592483520508, 0.0006310939788818359, 0.0007585287094116211, 0.0008859634399414062, 0.0010133981704711914, 0.0011408329010009766, 0.0012682676315307617, 0.0013957023620605469, 0.001523137092590332, 0.0016505718231201172, 0.0017780065536499023, 0.0019054412841796875, 0.0020328760147094727, 0.002160310745239258, 0.002287745475769043, 0.002415180206298828, 0.0025426149368286133, 0.0026700496673583984, 0.0027974843978881836, 0.0029249191284179688, 0.003052353858947754, 0.003179788589477539, 0.0033072233200073242, 0.0034346580505371094, 0.0035620927810668945, 0.0036895275115966797, 0.003816962242126465, 0.00394439697265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 9.0, 7.0, 9.0, 20.0, 29.0, 38.0, 54.0, 95.0, 138.0, 144.0, 150.0, 94.0, 75.0, 39.0, 32.0, 28.0, 13.0, 13.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-06, -9.134411811828613e-06, -8.732080459594727e-06, -8.32974910736084e-06, -7.927417755126953e-06, -7.525086402893066e-06, -7.12275505065918e-06, -6.720423698425293e-06, -6.318092346191406e-06, -5.9157609939575195e-06, -5.513429641723633e-06, -5.111098289489746e-06, -4.708766937255859e-06, -4.306435585021973e-06, -3.904104232788086e-06, -3.5017728805541992e-06, -3.0994415283203125e-06, -2.6971101760864258e-06, -2.294778823852539e-06, -1.8924474716186523e-06, -1.4901161193847656e-06, -1.087784767150879e-06, -6.854534149169922e-07, -2.8312206268310547e-07, 1.1920928955078125e-07, 5.21540641784668e-07, 9.238719940185547e-07, 1.3262033462524414e-06, 1.7285346984863281e-06, 2.130866050720215e-06, 2.5331974029541016e-06, 2.9355287551879883e-06, 3.337860107421875e-06, 3.7401914596557617e-06, 4.1425228118896484e-06, 4.544854164123535e-06, 4.947185516357422e-06, 5.349516868591309e-06, 5.751848220825195e-06, 6.154179573059082e-06, 6.556510925292969e-06, 6.9588422775268555e-06, 7.361173629760742e-06, 7.763504981994629e-06, 8.165836334228516e-06, 8.568167686462402e-06, 8.970499038696289e-06, 9.372830390930176e-06, 9.775161743164062e-06, 1.017749309539795e-05, 1.0579824447631836e-05, 1.0982155799865723e-05, 1.138448715209961e-05, 1.1786818504333496e-05, 1.2189149856567383e-05, 1.259148120880127e-05, 1.2993812561035156e-05, 1.3396143913269043e-05, 1.379847526550293e-05, 1.4200806617736816e-05, 1.4603137969970703e-05, 1.500546932220459e-05, 1.5407800674438477e-05, 1.5810132026672363e-05, 1.621246337890625e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 2.0, 7.0, 10.0, 6.0, 6.0, 13.0, 16.0, 30.0, 31.0, 62.0, 87.0, 139.0, 234.0, 371.0, 731.0, 1422.0, 3378.0, 10935.0, 51550.0, 301957.0, 521130.0, 124258.0, 22070.0, 5629.0, 2100.0, 989.0, 572.0, 308.0, 187.0, 95.0, 68.0, 52.0, 32.0, 28.0, 8.0, 12.0, 8.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005451202392578125, -0.005270957946777344, -0.0050907135009765625, -0.004910469055175781, -0.004730224609375, -0.004549980163574219, -0.0043697357177734375, -0.004189491271972656, -0.004009246826171875, -0.0038290023803710938, -0.0036487579345703125, -0.0034685134887695312, -0.00328826904296875, -0.0031080245971679688, -0.0029277801513671875, -0.0027475357055664062, -0.002567291259765625, -0.0023870468139648438, -0.0022068023681640625, -0.0020265579223632812, -0.0018463134765625, -0.0016660690307617188, -0.0014858245849609375, -0.0013055801391601562, -0.001125335693359375, -0.0009450912475585938, -0.0007648468017578125, -0.0005846023559570312, -0.00040435791015625, -0.00022411346435546875, -4.38690185546875e-05, 0.00013637542724609375, 0.000316619873046875, 0.0004968643188476562, 0.0006771087646484375, 0.0008573532104492188, 0.00103759765625, 0.0012178421020507812, 0.0013980865478515625, 0.0015783309936523438, 0.001758575439453125, 0.0019388198852539062, 0.0021190643310546875, 0.0022993087768554688, 0.00247955322265625, 0.0026597976684570312, 0.0028400421142578125, 0.0030202865600585938, 0.003200531005859375, 0.0033807754516601562, 0.0035610198974609375, 0.0037412643432617188, 0.0039215087890625, 0.004101753234863281, 0.0042819976806640625, 0.004462242126464844, 0.004642486572265625, 0.004822731018066406, 0.0050029754638671875, 0.005183219909667969, 0.00536346435546875, 0.005543708801269531, 0.0057239532470703125, 0.005904197692871094, 0.006084442138671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 7.0, 6.0, 5.0, 25.0, 11.0, 19.0, 34.0, 40.0, 60.0, 92.0, 91.0, 84.0, 97.0, 71.0, 91.0, 69.0, 47.0, 44.0, 31.0, 26.0, 15.0, 12.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0018110275268554688, -0.0017597228288650513, -0.0017084181308746338, -0.0016571134328842163, -0.0016058087348937988, -0.0015545040369033813, -0.0015031993389129639, -0.0014518946409225464, -0.001400589942932129, -0.0013492852449417114, -0.001297980546951294, -0.0012466758489608765, -0.001195371150970459, -0.0011440664529800415, -0.001092761754989624, -0.0010414570569992065, -0.000990152359008789, -0.0009388476610183716, -0.0008875429630279541, -0.0008362382650375366, -0.0007849335670471191, -0.0007336288690567017, -0.0006823241710662842, -0.0006310194730758667, -0.0005797147750854492, -0.0005284100770950317, -0.00047710537910461426, -0.0004258006811141968, -0.0003744959831237793, -0.0003231912851333618, -0.00027188658714294434, -0.00022058188915252686, -0.00016927719116210938, -0.0001179724931716919, -6.666779518127441e-05, -1.5363097190856934e-05, 3.594160079956055e-05, 8.724629878997803e-05, 0.0001385509967803955, 0.000189855694770813, 0.00024116039276123047, 0.00029246509075164795, 0.00034376978874206543, 0.0003950744867324829, 0.0004463791847229004, 0.0004976838827133179, 0.0005489885807037354, 0.0006002932786941528, 0.0006515979766845703, 0.0007029026746749878, 0.0007542073726654053, 0.0008055120706558228, 0.0008568167686462402, 0.0009081214666366577, 0.0009594261646270752, 0.0010107308626174927, 0.0010620355606079102, 0.0011133402585983276, 0.0011646449565887451, 0.0012159496545791626, 0.00126725435256958, 0.0013185590505599976, 0.001369863748550415, 0.0014211684465408325, 0.00147247314453125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 10.0, 16.0, 30.0, 62.0, 103.0, 155.0, 179.0, 169.0, 123.0, 72.0, 35.0, 26.0, 9.0, 10.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5269262194633484, -0.514862060546875, -0.5027979612350464, -0.490733802318573, -0.478669673204422, -0.466605544090271, -0.45454141497612, -0.442477285861969, -0.430413156747818, -0.418349027633667, -0.406284898519516, -0.394220769405365, -0.3821566104888916, -0.3700924813747406, -0.3580283522605896, -0.3459642231464386, -0.3339000940322876, -0.3218359649181366, -0.3097718358039856, -0.2977076768875122, -0.2856435477733612, -0.2735794186592102, -0.2615152895450592, -0.2494511604309082, -0.23738700151443481, -0.2253228724002838, -0.21325872838497162, -0.20119459927082062, -0.18913047015666962, -0.17706632614135742, -0.16500219702720642, -0.15293806791305542, -0.14087393879890442, -0.12880980968475342, -0.11674567312002182, -0.10468153655529022, -0.09261740744113922, -0.08055327087640762, -0.06848913431167603, -0.056425005197525024, -0.044360868632793427, -0.03229673579335213, -0.02023260109126568, -0.00816846638917923, 0.0038956664502620697, 0.01595979928970337, 0.028023935854434967, 0.04008806496858597, 0.052152201533317566, 0.06421633809804916, 0.07628046721220016, 0.08834460377693176, 0.10040873289108276, 0.11247286945581436, 0.12453700602054596, 0.13660113513469696, 0.14866527915000916, 0.16072940826416016, 0.17279355227947235, 0.18485768139362335, 0.19692181050777435, 0.20898595452308655, 0.22105008363723755, 0.23311421275138855, 0.24517834186553955]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 7.0, 16.0, 12.0, 20.0, 27.0, 40.0, 51.0, 52.0, 69.0, 86.0, 70.0, 83.0, 85.0, 59.0, 70.0, 59.0, 50.0, 38.0, 28.0, 25.0, 13.0, 14.0, 7.0, 10.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15630078315734863, -0.14940908551216125, -0.14251737296581268, -0.1356256753206253, -0.12873397767543793, -0.12184227257966995, -0.11495056748390198, -0.1080588698387146, -0.10116716474294662, -0.09427545964717865, -0.08738376200199127, -0.0804920569062233, -0.07360035181045532, -0.06670865416526794, -0.05981694906949997, -0.05292524769902229, -0.04603354632854462, -0.03914184495806694, -0.032250143587589264, -0.02535843849182129, -0.018466737121343613, -0.011575035750865936, -0.004683330655097961, 0.002208370715379715, 0.009100072085857391, 0.015991773456335068, 0.022883476689457893, 0.02977517992258072, 0.036666881293058395, 0.04355858266353607, 0.05045028775930405, 0.05734198912978172, 0.0642336905002594, 0.07112539559602737, 0.07801709324121475, 0.08490879833698273, 0.0918004959821701, 0.09869220107793808, 0.10558390617370605, 0.11247560381889343, 0.11936730891466141, 0.12625901401042938, 0.13315071165561676, 0.14004242420196533, 0.1469341218471527, 0.1538258194923401, 0.16071751713752747, 0.16760922968387604, 0.17450092732906342, 0.1813926249742508, 0.18828433752059937, 0.19517603516578674, 0.20206773281097412, 0.2089594304561615, 0.21585114300251007, 0.22274284064769745, 0.22963455319404602, 0.2365262508392334, 0.24341796338558197, 0.25030964612960815, 0.2572013735771179, 0.2640930712223053, 0.2709847688674927, 0.27787646651268005, 0.28476816415786743]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 7.0, 16.0, 17.0, 32.0, 63.0, 67.0, 138.0, 194.0, 352.0, 663.0, 1274.0, 2742.0, 6287.0, 18254.0, 96939.0, 800709.0, 91424.0, 17870.0, 6077.0, 2571.0, 1297.0, 601.0, 389.0, 209.0, 139.0, 64.0, 65.0, 26.0, 31.0, 10.0, 9.0, 10.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.179443359375, -0.17438697814941406, -0.16933059692382812, -0.1642742156982422, -0.15921783447265625, -0.1541614532470703, -0.14910507202148438, -0.14404869079589844, -0.1389923095703125, -0.13393592834472656, -0.12887954711914062, -0.12382316589355469, -0.11876678466796875, -0.11371040344238281, -0.10865402221679688, -0.10359764099121094, -0.098541259765625, -0.09348487854003906, -0.08842849731445312, -0.08337211608886719, -0.07831573486328125, -0.07325935363769531, -0.06820297241210938, -0.06314659118652344, -0.0580902099609375, -0.05303382873535156, -0.047977447509765625, -0.04292106628417969, -0.03786468505859375, -0.03280830383300781, -0.027751922607421875, -0.022695541381835938, -0.01763916015625, -0.012582778930664062, -0.007526397705078125, -0.0024700164794921875, 0.00258636474609375, 0.0076427459716796875, 0.012699127197265625, 0.017755508422851562, 0.0228118896484375, 0.027868270874023438, 0.032924652099609375, 0.03798103332519531, 0.04303741455078125, 0.04809379577636719, 0.053150177001953125, 0.05820655822753906, 0.063262939453125, 0.06831932067871094, 0.07337570190429688, 0.07843208312988281, 0.08348846435546875, 0.08854484558105469, 0.09360122680664062, 0.09865760803222656, 0.1037139892578125, 0.10877037048339844, 0.11382675170898438, 0.11888313293457031, 0.12393951416015625, 0.1289958953857422, 0.13405227661132812, 0.13910865783691406, 0.1441650390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 5.0, 10.0, 6.0, 10.0, 18.0, 29.0, 37.0, 37.0, 51.0, 47.0, 55.0, 60.0, 69.0, 73.0, 75.0, 61.0, 65.0, 59.0, 44.0, 33.0, 38.0, 27.0, 21.0, 12.0, 11.0, 13.0, 16.0, 6.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265625, -0.253570556640625, -0.24151611328125, -0.229461669921875, -0.2174072265625, -0.205352783203125, -0.19329833984375, -0.181243896484375, -0.169189453125, -0.157135009765625, -0.14508056640625, -0.133026123046875, -0.1209716796875, -0.108917236328125, -0.09686279296875, -0.084808349609375, -0.07275390625, -0.060699462890625, -0.04864501953125, -0.036590576171875, -0.0245361328125, -0.012481689453125, -0.00042724609375, 0.011627197265625, 0.023681640625, 0.035736083984375, 0.04779052734375, 0.059844970703125, 0.0718994140625, 0.083953857421875, 0.09600830078125, 0.108062744140625, 0.1201171875, 0.132171630859375, 0.14422607421875, 0.156280517578125, 0.1683349609375, 0.180389404296875, 0.19244384765625, 0.204498291015625, 0.216552734375, 0.228607177734375, 0.24066162109375, 0.252716064453125, 0.2647705078125, 0.276824951171875, 0.28887939453125, 0.300933837890625, 0.31298828125, 0.325042724609375, 0.33709716796875, 0.349151611328125, 0.3612060546875, 0.373260498046875, 0.38531494140625, 0.397369384765625, 0.409423828125, 0.421478271484375, 0.43353271484375, 0.445587158203125, 0.4576416015625, 0.469696044921875, 0.48175048828125, 0.493804931640625, 0.505859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 16.0, 23.0, 42.0, 74.0, 131.0, 528.0, 1041246.0, 6053.0, 215.0, 109.0, 60.0, 25.0, 12.0, 8.0, 9.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.33984375, -2.2724761962890625, -2.205108642578125, -2.1377410888671875, -2.07037353515625, -2.0030059814453125, -1.935638427734375, -1.8682708740234375, -1.8009033203125, -1.7335357666015625, -1.666168212890625, -1.5988006591796875, -1.53143310546875, -1.4640655517578125, -1.396697998046875, -1.3293304443359375, -1.261962890625, -1.1945953369140625, -1.127227783203125, -1.0598602294921875, -0.99249267578125, -0.9251251220703125, -0.857757568359375, -0.7903900146484375, -0.7230224609375, -0.6556549072265625, -0.588287353515625, -0.5209197998046875, -0.45355224609375, -0.3861846923828125, -0.318817138671875, -0.2514495849609375, -0.18408203125, -0.1167144775390625, -0.049346923828125, 0.0180206298828125, 0.08538818359375, 0.1527557373046875, 0.220123291015625, 0.2874908447265625, 0.3548583984375, 0.4222259521484375, 0.489593505859375, 0.5569610595703125, 0.62432861328125, 0.6916961669921875, 0.759063720703125, 0.8264312744140625, 0.893798828125, 0.9611663818359375, 1.028533935546875, 1.0959014892578125, 1.16326904296875, 1.2306365966796875, 1.298004150390625, 1.3653717041015625, 1.4327392578125, 1.5001068115234375, 1.567474365234375, 1.6348419189453125, 1.70220947265625, 1.7695770263671875, 1.836944580078125, 1.9043121337890625, 1.9716796875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 16.0, 28.0, 47.0, 50.0, 92.0, 136.0, 153.0, 152.0, 127.0, 90.0, 43.0, 27.0, 17.0, 8.0, 8.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2548828125, -1.2187042236328125, -1.182525634765625, -1.1463470458984375, -1.11016845703125, -1.0739898681640625, -1.037811279296875, -1.0016326904296875, -0.9654541015625, -0.9292755126953125, -0.893096923828125, -0.8569183349609375, -0.82073974609375, -0.7845611572265625, -0.748382568359375, -0.7122039794921875, -0.676025390625, -0.6398468017578125, -0.603668212890625, -0.5674896240234375, -0.53131103515625, -0.4951324462890625, -0.458953857421875, -0.4227752685546875, -0.3865966796875, -0.3504180908203125, -0.314239501953125, -0.2780609130859375, -0.24188232421875, -0.2057037353515625, -0.169525146484375, -0.1333465576171875, -0.09716796875, -0.0609893798828125, -0.024810791015625, 0.0113677978515625, 0.04754638671875, 0.0837249755859375, 0.119903564453125, 0.1560821533203125, 0.1922607421875, 0.2284393310546875, 0.264617919921875, 0.3007965087890625, 0.33697509765625, 0.3731536865234375, 0.409332275390625, 0.4455108642578125, 0.481689453125, 0.5178680419921875, 0.554046630859375, 0.5902252197265625, 0.62640380859375, 0.6625823974609375, 0.698760986328125, 0.7349395751953125, 0.7711181640625, 0.8072967529296875, 0.843475341796875, 0.8796539306640625, 0.91583251953125, 0.9520111083984375, 0.988189697265625, 1.0243682861328125, 1.060546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 4.0, 4.0, 15.0, 15.0, 19.0, 45.0, 80.0, 170.0, 589.0, 3664.0, 80730.0, 945682.0, 15342.0, 1585.0, 374.0, 129.0, 59.0, 22.0, 16.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1754150390625, -0.1712656021118164, -0.1671161651611328, -0.16296672821044922, -0.15881729125976562, -0.15466785430908203, -0.15051841735839844, -0.14636898040771484, -0.14221954345703125, -0.13807010650634766, -0.13392066955566406, -0.12977123260498047, -0.12562179565429688, -0.12147235870361328, -0.11732292175292969, -0.1131734848022461, -0.1090240478515625, -0.1048746109008789, -0.10072517395019531, -0.09657573699951172, -0.09242630004882812, -0.08827686309814453, -0.08412742614746094, -0.07997798919677734, -0.07582855224609375, -0.07167911529541016, -0.06752967834472656, -0.06338024139404297, -0.059230804443359375, -0.05508136749267578, -0.05093193054199219, -0.046782493591308594, -0.042633056640625, -0.038483619689941406, -0.03433418273925781, -0.03018474578857422, -0.026035308837890625, -0.02188587188720703, -0.017736434936523438, -0.013586997985839844, -0.00943756103515625, -0.005288124084472656, -0.0011386871337890625, 0.0030107498168945312, 0.007160186767578125, 0.011309623718261719, 0.015459060668945312, 0.019608497619628906, 0.0237579345703125, 0.027907371520996094, 0.03205680847167969, 0.03620624542236328, 0.040355682373046875, 0.04450511932373047, 0.04865455627441406, 0.052803993225097656, 0.05695343017578125, 0.061102867126464844, 0.06525230407714844, 0.06940174102783203, 0.07355117797851562, 0.07770061492919922, 0.08185005187988281, 0.0859994888305664, 0.09014892578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 4.0, 9.0, 4.0, 17.0, 14.0, 21.0, 40.0, 46.0, 70.0, 103.0, 159.0, 162.0, 107.0, 69.0, 36.0, 33.0, 17.0, 17.0, 7.0, 11.0, 10.0, 4.0, 6.0, 6.0, 3.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.231929779052734e-06, -4.056841135025024e-06, -3.8817524909973145e-06, -3.7066638469696045e-06, -3.5315752029418945e-06, -3.3564865589141846e-06, -3.1813979148864746e-06, -3.0063092708587646e-06, -2.8312206268310547e-06, -2.6561319828033447e-06, -2.4810433387756348e-06, -2.305954694747925e-06, -2.130866050720215e-06, -1.955777406692505e-06, -1.780688762664795e-06, -1.605600118637085e-06, -1.430511474609375e-06, -1.255422830581665e-06, -1.080334186553955e-06, -9.052455425262451e-07, -7.301568984985352e-07, -5.550682544708252e-07, -3.7997961044311523e-07, -2.0489096641540527e-07, -2.9802322387695312e-08, 1.4528632164001465e-07, 3.203749656677246e-07, 4.954636096954346e-07, 6.705522537231445e-07, 8.456408977508545e-07, 1.0207295417785645e-06, 1.1958181858062744e-06, 1.3709068298339844e-06, 1.5459954738616943e-06, 1.7210841178894043e-06, 1.8961727619171143e-06, 2.0712614059448242e-06, 2.246350049972534e-06, 2.421438694000244e-06, 2.596527338027954e-06, 2.771615982055664e-06, 2.946704626083374e-06, 3.121793270111084e-06, 3.296881914138794e-06, 3.471970558166504e-06, 3.647059202194214e-06, 3.822147846221924e-06, 3.997236490249634e-06, 4.172325134277344e-06, 4.347413778305054e-06, 4.522502422332764e-06, 4.697591066360474e-06, 4.872679710388184e-06, 5.0477683544158936e-06, 5.2228569984436035e-06, 5.3979456424713135e-06, 5.5730342864990234e-06, 5.748122930526733e-06, 5.923211574554443e-06, 6.098300218582153e-06, 6.273388862609863e-06, 6.448477506637573e-06, 6.623566150665283e-06, 6.798654794692993e-06, 6.973743438720703e-06]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 8.0, 11.0, 28.0, 60.0, 119.0, 366.0, 1418.0, 11507.0, 877848.0, 150620.0, 5267.0, 844.0, 264.0, 96.0, 41.0, 22.0, 7.0, 9.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13330078125, -0.12833595275878906, -0.12337112426757812, -0.11840629577636719, -0.11344146728515625, -0.10847663879394531, -0.10351181030273438, -0.09854698181152344, -0.0935821533203125, -0.08861732482910156, -0.08365249633789062, -0.07868766784667969, -0.07372283935546875, -0.06875801086425781, -0.06379318237304688, -0.05882835388183594, -0.053863525390625, -0.04889869689941406, -0.043933868408203125, -0.03896903991699219, -0.03400421142578125, -0.029039382934570312, -0.024074554443359375, -0.019109725952148438, -0.0141448974609375, -0.009180068969726562, -0.004215240478515625, 0.0007495880126953125, 0.00571441650390625, 0.010679244995117188, 0.015644073486328125, 0.020608901977539062, 0.02557373046875, 0.030538558959960938, 0.035503387451171875, 0.04046821594238281, 0.04543304443359375, 0.05039787292480469, 0.055362701416015625, 0.06032752990722656, 0.0652923583984375, 0.07025718688964844, 0.07522201538085938, 0.08018684387207031, 0.08515167236328125, 0.09011650085449219, 0.09508132934570312, 0.10004615783691406, 0.105010986328125, 0.10997581481933594, 0.11494064331054688, 0.11990547180175781, 0.12487030029296875, 0.1298351287841797, 0.13479995727539062, 0.13976478576660156, 0.1447296142578125, 0.14969444274902344, 0.15465927124023438, 0.1596240997314453, 0.16458892822265625, 0.1695537567138672, 0.17451858520507812, 0.17948341369628906, 0.1844482421875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 7.0, 1.0, 4.0, 3.0, 12.0, 20.0, 28.0, 48.0, 63.0, 109.0, 262.0, 196.0, 102.0, 55.0, 28.0, 32.0, 11.0, 9.0, 5.0, 5.0, 8.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0433349609375, -0.0421600341796875, -0.040985107421875, -0.0398101806640625, -0.03863525390625, -0.0374603271484375, -0.036285400390625, -0.0351104736328125, -0.033935546875, -0.0327606201171875, -0.031585693359375, -0.0304107666015625, -0.02923583984375, -0.0280609130859375, -0.026885986328125, -0.0257110595703125, -0.0245361328125, -0.0233612060546875, -0.022186279296875, -0.0210113525390625, -0.01983642578125, -0.0186614990234375, -0.017486572265625, -0.0163116455078125, -0.01513671875, -0.0139617919921875, -0.012786865234375, -0.0116119384765625, -0.01043701171875, -0.0092620849609375, -0.008087158203125, -0.0069122314453125, -0.0057373046875, -0.0045623779296875, -0.003387451171875, -0.0022125244140625, -0.00103759765625, 0.0001373291015625, 0.001312255859375, 0.0024871826171875, 0.003662109375, 0.0048370361328125, 0.006011962890625, 0.0071868896484375, 0.00836181640625, 0.0095367431640625, 0.010711669921875, 0.0118865966796875, 0.0130615234375, 0.0142364501953125, 0.015411376953125, 0.0165863037109375, 0.01776123046875, 0.0189361572265625, 0.020111083984375, 0.0212860107421875, 0.0224609375, 0.0236358642578125, 0.024810791015625, 0.0259857177734375, 0.02716064453125, 0.0283355712890625, 0.029510498046875, 0.0306854248046875, 0.0318603515625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 8.0, 14.0, 22.0, 42.0, 78.0, 114.0, 142.0, 152.0, 147.0, 123.0, 69.0, 38.0, 21.0, 9.0, 17.0, 7.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8278663754463196, -0.8057905435562134, -0.7837146520614624, -0.7616388201713562, -0.7395629286766052, -0.717487096786499, -0.695411205291748, -0.6733353734016418, -0.6512595415115356, -0.6291837096214294, -0.6071078181266785, -0.5850319862365723, -0.5629560947418213, -0.5408802628517151, -0.5188044309616089, -0.4967285394668579, -0.4746526777744293, -0.45257681608200073, -0.43050095438957214, -0.40842509269714355, -0.38634926080703735, -0.36427339911460876, -0.3421975374221802, -0.320121705532074, -0.298045814037323, -0.2759699523448944, -0.2538940906524658, -0.23181824386119843, -0.20974239706993103, -0.18766653537750244, -0.16559067368507385, -0.14351482689380646, -0.12143898010253906, -0.09936312586069107, -0.07728727161884308, -0.05521140992641449, -0.0331355556845665, -0.011059701442718506, 0.011016160249710083, 0.03309200704097748, 0.05516786873340607, 0.07724372297525406, 0.09931957721710205, 0.12139543890953064, 0.14347130060195923, 0.16554714739322662, 0.1876230090856552, 0.2096988558769226, 0.2317747175693512, 0.2538505792617798, 0.2759264409542084, 0.29800230264663696, 0.32007813453674316, 0.34215399622917175, 0.36422985792160034, 0.38630568981170654, 0.4083815813064575, 0.4304574429988861, 0.4525333046913147, 0.4746091365814209, 0.4966849982738495, 0.5187608599662781, 0.5408366918563843, 0.5629125833511353, 0.5849884152412415]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 7.0, 7.0, 10.0, 19.0, 19.0, 22.0, 24.0, 31.0, 29.0, 33.0, 46.0, 39.0, 47.0, 59.0, 61.0, 49.0, 40.0, 59.0, 51.0, 50.0, 42.0, 35.0, 42.0, 27.0, 24.0, 30.0, 18.0, 13.0, 12.0, 16.0, 11.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6547601222991943, -0.631588876247406, -0.6084176898002625, -0.5852464437484741, -0.5620752573013306, -0.5389040112495422, -0.5157327651977539, -0.49256154894828796, -0.469390332698822, -0.4462191164493561, -0.42304790019989014, -0.3998766541481018, -0.37670543789863586, -0.3535342216491699, -0.3303629755973816, -0.30719175934791565, -0.2840205430984497, -0.26084932684898376, -0.23767809569835663, -0.2145068645477295, -0.19133564829826355, -0.1681644320487976, -0.14499320089817047, -0.12182196974754333, -0.09865075349807739, -0.07547952979803085, -0.052308306097984314, -0.029137082397937775, -0.005965858697891235, 0.017205365002155304, 0.04037658870220184, 0.06354781985282898, 0.08671897649765015, 0.10989020019769669, 0.13306142389774323, 0.15623265504837036, 0.1794038712978363, 0.20257508754730225, 0.22574631869792938, 0.24891754984855652, 0.27208876609802246, 0.2952599823474884, 0.31843119859695435, 0.3416024446487427, 0.3647736608982086, 0.38794487714767456, 0.4111161231994629, 0.43428733944892883, 0.4574585556983948, 0.4806297719478607, 0.5038009881973267, 0.526972234249115, 0.5501434803009033, 0.5733146667480469, 0.5964859127998352, 0.6196571588516235, 0.6428283452987671, 0.6659995913505554, 0.689170777797699, 0.7123420238494873, 0.7355132102966309, 0.7586844563484192, 0.7818557024002075, 0.8050268888473511, 0.8281981348991394]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 12.0, 15.0, 12.0, 28.0, 33.0, 40.0, 71.0, 116.0, 277.0, 656.0, 1601.0, 5477.0, 27414.0, 1816336.0, 2303887.0, 29626.0, 5591.0, 1795.0, 652.0, 281.0, 141.0, 77.0, 52.0, 19.0, 18.0, 13.0, 13.0, 5.0, 5.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61328125, -0.5935134887695312, -0.5737457275390625, -0.5539779663085938, -0.534210205078125, -0.5144424438476562, -0.4946746826171875, -0.47490692138671875, -0.45513916015625, -0.43537139892578125, -0.4156036376953125, -0.39583587646484375, -0.376068115234375, -0.35630035400390625, -0.3365325927734375, -0.31676483154296875, -0.2969970703125, -0.27722930908203125, -0.2574615478515625, -0.23769378662109375, -0.217926025390625, -0.19815826416015625, -0.1783905029296875, -0.15862274169921875, -0.13885498046875, -0.11908721923828125, -0.0993194580078125, -0.07955169677734375, -0.059783935546875, -0.04001617431640625, -0.0202484130859375, -0.00048065185546875, 0.019287109375, 0.03905487060546875, 0.0588226318359375, 0.07859039306640625, 0.098358154296875, 0.11812591552734375, 0.1378936767578125, 0.15766143798828125, 0.17742919921875, 0.19719696044921875, 0.2169647216796875, 0.23673248291015625, 0.256500244140625, 0.27626800537109375, 0.2960357666015625, 0.31580352783203125, 0.3355712890625, 0.35533905029296875, 0.3751068115234375, 0.39487457275390625, 0.414642333984375, 0.43441009521484375, 0.4541778564453125, 0.47394561767578125, 0.49371337890625, 0.5134811401367188, 0.5332489013671875, 0.5530166625976562, 0.572784423828125, 0.5925521850585938, 0.6123199462890625, 0.6320877075195312, 0.65185546875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 4.0, 8.0, 6.0, 15.0, 20.0, 25.0, 31.0, 30.0, 61.0, 63.0, 63.0, 72.0, 76.0, 68.0, 79.0, 73.0, 43.0, 51.0, 53.0, 37.0, 31.0, 26.0, 20.0, 15.0, 10.0, 6.0, 6.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1800537109375, -0.1726665496826172, -0.16527938842773438, -0.15789222717285156, -0.15050506591796875, -0.14311790466308594, -0.13573074340820312, -0.1283435821533203, -0.1209564208984375, -0.11356925964355469, -0.10618209838867188, -0.09879493713378906, -0.09140777587890625, -0.08402061462402344, -0.07663345336914062, -0.06924629211425781, -0.061859130859375, -0.05447196960449219, -0.047084808349609375, -0.03969764709472656, -0.03231048583984375, -0.024923324584960938, -0.017536163330078125, -0.010149002075195312, -0.0027618408203125, 0.0046253204345703125, 0.012012481689453125, 0.019399642944335938, 0.02678680419921875, 0.03417396545410156, 0.041561126708984375, 0.04894828796386719, 0.05633544921875, 0.06372261047363281, 0.07110977172851562, 0.07849693298339844, 0.08588409423828125, 0.09327125549316406, 0.10065841674804688, 0.10804557800292969, 0.1154327392578125, 0.12281990051269531, 0.13020706176757812, 0.13759422302246094, 0.14498138427734375, 0.15236854553222656, 0.15975570678710938, 0.1671428680419922, 0.174530029296875, 0.1819171905517578, 0.18930435180664062, 0.19669151306152344, 0.20407867431640625, 0.21146583557128906, 0.21885299682617188, 0.2262401580810547, 0.2336273193359375, 0.2410144805908203, 0.24840164184570312, 0.25578880310058594, 0.26317596435546875, 0.27056312561035156, 0.2779502868652344, 0.2853374481201172, 0.292724609375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 11.0, 5.0, 7.0, 9.0, 14.0, 16.0, 23.0, 44.0, 48.0, 80.0, 189.0, 470.0, 1314.0, 6538.0, 72218.0, 4021450.0, 82829.0, 6786.0, 1363.0, 422.0, 195.0, 79.0, 51.0, 40.0, 22.0, 16.0, 9.0, 13.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8212890625, -0.7994003295898438, -0.7775115966796875, -0.7556228637695312, -0.733734130859375, -0.7118453979492188, -0.6899566650390625, -0.6680679321289062, -0.64617919921875, -0.6242904663085938, -0.6024017333984375, -0.5805130004882812, -0.558624267578125, -0.5367355346679688, -0.5148468017578125, -0.49295806884765625, -0.4710693359375, -0.44918060302734375, -0.4272918701171875, -0.40540313720703125, -0.383514404296875, -0.36162567138671875, -0.3397369384765625, -0.31784820556640625, -0.29595947265625, -0.27407073974609375, -0.2521820068359375, -0.23029327392578125, -0.208404541015625, -0.18651580810546875, -0.1646270751953125, -0.14273834228515625, -0.120849609375, -0.09896087646484375, -0.0770721435546875, -0.05518341064453125, -0.033294677734375, -0.01140594482421875, 0.0104827880859375, 0.03237152099609375, 0.05426025390625, 0.07614898681640625, 0.0980377197265625, 0.11992645263671875, 0.141815185546875, 0.16370391845703125, 0.1855926513671875, 0.20748138427734375, 0.2293701171875, 0.25125885009765625, 0.2731475830078125, 0.29503631591796875, 0.316925048828125, 0.33881378173828125, 0.3607025146484375, 0.38259124755859375, 0.40447998046875, 0.42636871337890625, 0.4482574462890625, 0.47014617919921875, 0.492034912109375, 0.5139236450195312, 0.5358123779296875, 0.5577011108398438, 0.57958984375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 11.0, 9.0, 9.0, 13.0, 14.0, 25.0, 33.0, 52.0, 60.0, 102.0, 258.0, 615.0, 1021.0, 889.0, 429.0, 194.0, 104.0, 77.0, 37.0, 28.0, 21.0, 14.0, 17.0, 8.0, 7.0, 8.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.087646484375, -0.08425521850585938, -0.08086395263671875, -0.07747268676757812, -0.0740814208984375, -0.07069015502929688, -0.06729888916015625, -0.06390762329101562, -0.060516357421875, -0.057125091552734375, -0.05373382568359375, -0.050342559814453125, -0.0469512939453125, -0.043560028076171875, -0.04016876220703125, -0.036777496337890625, -0.03338623046875, -0.029994964599609375, -0.02660369873046875, -0.023212432861328125, -0.0198211669921875, -0.016429901123046875, -0.01303863525390625, -0.009647369384765625, -0.006256103515625, -0.002864837646484375, 0.00052642822265625, 0.003917694091796875, 0.0073089599609375, 0.010700225830078125, 0.01409149169921875, 0.017482757568359375, 0.0208740234375, 0.024265289306640625, 0.02765655517578125, 0.031047821044921875, 0.0344390869140625, 0.037830352783203125, 0.04122161865234375, 0.044612884521484375, 0.048004150390625, 0.051395416259765625, 0.05478668212890625, 0.058177947998046875, 0.0615692138671875, 0.06496047973632812, 0.06835174560546875, 0.07174301147460938, 0.07513427734375, 0.07852554321289062, 0.08191680908203125, 0.08530807495117188, 0.0886993408203125, 0.09209060668945312, 0.09548187255859375, 0.09887313842773438, 0.102264404296875, 0.10565567016601562, 0.10904693603515625, 0.11243820190429688, 0.1158294677734375, 0.11922073364257812, 0.12261199951171875, 0.12600326538085938, 0.12939453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 13.0, 21.0, 26.0, 51.0, 69.0, 106.0, 114.0, 167.0, 133.0, 111.0, 61.0, 51.0, 27.0, 21.0, 13.0, 8.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.6497433185577393, -0.6357386112213135, -0.6217339634895325, -0.6077292561531067, -0.5937246084213257, -0.5797199010848999, -0.5657151937484741, -0.5517105460166931, -0.5377058386802673, -0.5237011313438416, -0.5096964836120605, -0.49569177627563477, -0.48168709874153137, -0.467682421207428, -0.4536777138710022, -0.4396730363368988, -0.4256683588027954, -0.411663681268692, -0.3976590037345886, -0.38365429639816284, -0.36964961886405945, -0.35564494132995605, -0.3416402339935303, -0.3276355564594269, -0.3136308789253235, -0.2996262013912201, -0.2856215238571167, -0.2716168165206909, -0.2576121389865875, -0.24360746145248413, -0.22960276901721954, -0.21559807658195496, -0.20159339904785156, -0.18758872151374817, -0.17358402907848358, -0.159579336643219, -0.1455746591091156, -0.1315699815750122, -0.11756528913974762, -0.10356060415506363, -0.08955591917037964, -0.07555123418569565, -0.06154654920101166, -0.04754186421632767, -0.03353717923164368, -0.019532494246959686, -0.005527809262275696, 0.008476875722408295, 0.022481560707092285, 0.036486245691776276, 0.050490930676460266, 0.06449561566114426, 0.07850030064582825, 0.09250498563051224, 0.10650967061519623, 0.12051435559988022, 0.1345190405845642, 0.1485237181186676, 0.1625284105539322, 0.17653310298919678, 0.19053778052330017, 0.20454245805740356, 0.21854715049266815, 0.23255184292793274, 0.24655652046203613]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 10.0, 9.0, 4.0, 15.0, 15.0, 14.0, 37.0, 27.0, 31.0, 49.0, 69.0, 50.0, 48.0, 57.0, 52.0, 56.0, 53.0, 60.0, 44.0, 52.0, 51.0, 38.0, 43.0, 26.0, 32.0, 19.0, 16.0, 10.0, 10.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21098384261131287, -0.20335905253887177, -0.19573426246643066, -0.18810947239398956, -0.18048468232154846, -0.17285990715026855, -0.16523510217666626, -0.15761032700538635, -0.14998553693294525, -0.14236074686050415, -0.13473595678806305, -0.12711116671562195, -0.11948638409376144, -0.11186159402132034, -0.10423680394887924, -0.09661202132701874, -0.08898722380399704, -0.08136243373155594, -0.07373764365911484, -0.06611286103725433, -0.05848807096481323, -0.05086328089237213, -0.04323849081993103, -0.03561370447278023, -0.027988914400339127, -0.020364126190543175, -0.012739337049424648, -0.005114547908306122, 0.00251024030148983, 0.010135028511285782, 0.017759818583726883, 0.025384604930877686, 0.03300939500331879, 0.04063418507575989, 0.04825897142291069, 0.05588376149535179, 0.0635085478425026, 0.0711333379149437, 0.0787581279873848, 0.0863829106092453, 0.0940077006816864, 0.1016324907541275, 0.1092572808265686, 0.1168820708990097, 0.12450685352087021, 0.1321316361427307, 0.139756441116333, 0.14738121628761292, 0.1550060212612152, 0.1626308113336563, 0.1702556014060974, 0.1778803914785385, 0.18550518155097961, 0.19312995672225952, 0.20075476169586182, 0.20837953686714172, 0.21600432693958282, 0.22362911701202393, 0.23125390708446503, 0.23887869715690613, 0.24650348722934723, 0.25412827730178833, 0.26175305247306824, 0.26937785744667053, 0.27700263261795044]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 4.0, 7.0, 22.0, 29.0, 41.0, 67.0, 115.0, 223.0, 396.0, 731.0, 1631.0, 3777.0, 11420.0, 42946.0, 234872.0, 589053.0, 123928.0, 26428.0, 7533.0, 2774.0, 1201.0, 609.0, 303.0, 181.0, 117.0, 55.0, 37.0, 22.0, 8.0, 7.0, 5.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09307861328125, -0.09019947052001953, -0.08732032775878906, -0.0844411849975586, -0.08156204223632812, -0.07868289947509766, -0.07580375671386719, -0.07292461395263672, -0.07004547119140625, -0.06716632843017578, -0.06428718566894531, -0.061408042907714844, -0.058528900146484375, -0.055649757385253906, -0.05277061462402344, -0.04989147186279297, -0.0470123291015625, -0.04413318634033203, -0.04125404357910156, -0.038374900817871094, -0.035495758056640625, -0.032616615295410156, -0.029737472534179688, -0.02685832977294922, -0.02397918701171875, -0.02110004425048828, -0.018220901489257812, -0.015341758728027344, -0.012462615966796875, -0.009583473205566406, -0.0067043304443359375, -0.0038251876831054688, -0.000946044921875, 0.0019330978393554688, 0.0048122406005859375, 0.007691383361816406, 0.010570526123046875, 0.013449668884277344, 0.016328811645507812, 0.01920795440673828, 0.02208709716796875, 0.02496623992919922, 0.027845382690429688, 0.030724525451660156, 0.033603668212890625, 0.036482810974121094, 0.03936195373535156, 0.04224109649658203, 0.0451202392578125, 0.04799938201904297, 0.05087852478027344, 0.053757667541503906, 0.056636810302734375, 0.059515953063964844, 0.06239509582519531, 0.06527423858642578, 0.06815338134765625, 0.07103252410888672, 0.07391166687011719, 0.07679080963134766, 0.07966995239257812, 0.0825490951538086, 0.08542823791503906, 0.08830738067626953, 0.0911865234375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 4.0, 8.0, 7.0, 12.0, 16.0, 22.0, 26.0, 25.0, 25.0, 46.0, 62.0, 41.0, 48.0, 60.0, 66.0, 62.0, 48.0, 52.0, 58.0, 42.0, 48.0, 44.0, 36.0, 26.0, 30.0, 26.0, 21.0, 15.0, 5.0, 6.0, 11.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11810302734375, -0.1129007339477539, -0.10769844055175781, -0.10249614715576172, -0.09729385375976562, -0.09209156036376953, -0.08688926696777344, -0.08168697357177734, -0.07648468017578125, -0.07128238677978516, -0.06608009338378906, -0.06087779998779297, -0.055675506591796875, -0.05047321319580078, -0.04527091979980469, -0.040068626403808594, -0.0348663330078125, -0.029664039611816406, -0.024461746215820312, -0.01925945281982422, -0.014057159423828125, -0.008854866027832031, -0.0036525726318359375, 0.0015497207641601562, 0.00675201416015625, 0.011954307556152344, 0.017156600952148438, 0.02235889434814453, 0.027561187744140625, 0.03276348114013672, 0.03796577453613281, 0.043168067932128906, 0.048370361328125, 0.053572654724121094, 0.05877494812011719, 0.06397724151611328, 0.06917953491210938, 0.07438182830810547, 0.07958412170410156, 0.08478641510009766, 0.08998870849609375, 0.09519100189208984, 0.10039329528808594, 0.10559558868408203, 0.11079788208007812, 0.11600017547607422, 0.12120246887207031, 0.1264047622680664, 0.1316070556640625, 0.1368093490600586, 0.1420116424560547, 0.14721393585205078, 0.15241622924804688, 0.15761852264404297, 0.16282081604003906, 0.16802310943603516, 0.17322540283203125, 0.17842769622802734, 0.18362998962402344, 0.18883228302001953, 0.19403457641601562, 0.19923686981201172, 0.2044391632080078, 0.2096414566040039, 0.21484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 6.0, 10.0, 19.0, 20.0, 39.0, 45.0, 55.0, 60.0, 85.0, 129.0, 184.0, 259.0, 317.0, 485.0, 653.0, 985.0, 1309.0, 2001.0, 2864.0, 4404.0, 6489.0, 9946.0, 15478.0, 24253.0, 40579.0, 69662.0, 121217.0, 191506.0, 205397.0, 141172.0, 81463.0, 47305.0, 28519.0, 17545.0, 11304.0, 7250.0, 4860.0, 3218.0, 2267.0, 1575.0, 1050.0, 700.0, 541.0, 373.0, 270.0, 178.0, 140.0, 107.0, 77.0, 52.0, 48.0, 33.0, 10.0, 8.0, 17.0, 9.0, 8.0, 4.0, 4.0, 3.0], "bins": [-0.022796630859375, -0.02208733558654785, -0.021378040313720703, -0.020668745040893555, -0.019959449768066406, -0.019250154495239258, -0.01854085922241211, -0.01783156394958496, -0.017122268676757812, -0.016412973403930664, -0.015703678131103516, -0.014994382858276367, -0.014285087585449219, -0.01357579231262207, -0.012866497039794922, -0.012157201766967773, -0.011447906494140625, -0.010738611221313477, -0.010029315948486328, -0.00932002067565918, -0.008610725402832031, -0.007901430130004883, -0.007192134857177734, -0.006482839584350586, -0.0057735443115234375, -0.005064249038696289, -0.004354953765869141, -0.003645658493041992, -0.0029363632202148438, -0.0022270679473876953, -0.0015177726745605469, -0.0008084774017333984, -9.918212890625e-05, 0.0006101131439208984, 0.0013194084167480469, 0.0020287036895751953, 0.0027379989624023438, 0.003447294235229492, 0.004156589508056641, 0.004865884780883789, 0.0055751800537109375, 0.006284475326538086, 0.006993770599365234, 0.007703065872192383, 0.008412361145019531, 0.00912165641784668, 0.009830951690673828, 0.010540246963500977, 0.011249542236328125, 0.011958837509155273, 0.012668132781982422, 0.01337742805480957, 0.014086723327636719, 0.014796018600463867, 0.015505313873291016, 0.016214609146118164, 0.016923904418945312, 0.01763319969177246, 0.01834249496459961, 0.019051790237426758, 0.019761085510253906, 0.020470380783081055, 0.021179676055908203, 0.02188897132873535, 0.0225982666015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 8.0, 4.0, 6.0, 7.0, 19.0, 13.0, 15.0, 13.0, 27.0, 25.0, 34.0, 28.0, 34.0, 35.0, 52.0, 61.0, 46.0, 46.0, 57.0, 46.0, 46.0, 51.0, 47.0, 38.0, 26.0, 34.0, 31.0, 24.0, 26.0, 19.0, 16.0, 13.0, 17.0, 10.0, 5.0, 4.0, 5.0, 5.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3017578125, -0.2925453186035156, -0.28333282470703125, -0.2741203308105469, -0.2649078369140625, -0.2556953430175781, -0.24648284912109375, -0.23727035522460938, -0.228057861328125, -0.21884536743164062, -0.20963287353515625, -0.20042037963867188, -0.1912078857421875, -0.18199539184570312, -0.17278289794921875, -0.16357040405273438, -0.15435791015625, -0.14514541625976562, -0.13593292236328125, -0.12672042846679688, -0.1175079345703125, -0.10829544067382812, -0.09908294677734375, -0.08987045288085938, -0.080657958984375, -0.07144546508789062, -0.06223297119140625, -0.053020477294921875, -0.0438079833984375, -0.034595489501953125, -0.02538299560546875, -0.016170501708984375, -0.0069580078125, 0.002254486083984375, 0.01146697998046875, 0.020679473876953125, 0.0298919677734375, 0.039104461669921875, 0.04831695556640625, 0.057529449462890625, 0.066741943359375, 0.07595443725585938, 0.08516693115234375, 0.09437942504882812, 0.1035919189453125, 0.11280441284179688, 0.12201690673828125, 0.13122940063476562, 0.14044189453125, 0.14965438842773438, 0.15886688232421875, 0.16807937622070312, 0.1772918701171875, 0.18650436401367188, 0.19571685791015625, 0.20492935180664062, 0.214141845703125, 0.22335433959960938, 0.23256683349609375, 0.24177932739257812, 0.2509918212890625, 0.2602043151855469, 0.26941680908203125, 0.2786293029785156, 0.287841796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 11.0, 6.0, 15.0, 30.0, 37.0, 46.0, 68.0, 93.0, 153.0, 220.0, 266.0, 429.0, 716.0, 1178.0, 2090.0, 3675.0, 6946.0, 14142.0, 30897.0, 68905.0, 147334.0, 249997.0, 248561.0, 145253.0, 67506.0, 30170.0, 14076.0, 6999.0, 3476.0, 1995.0, 1189.0, 705.0, 481.0, 268.0, 197.0, 140.0, 91.0, 70.0, 48.0, 31.0, 18.0, 12.0, 5.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025424957275390625, -0.002454787492752075, -0.002367079257965088, -0.0022793710231781006, -0.0021916627883911133, -0.002103954553604126, -0.0020162463188171387, -0.0019285380840301514, -0.001840829849243164, -0.0017531216144561768, -0.0016654133796691895, -0.0015777051448822021, -0.0014899969100952148, -0.0014022886753082275, -0.0013145804405212402, -0.001226872205734253, -0.0011391639709472656, -0.0010514557361602783, -0.000963747501373291, -0.0008760392665863037, -0.0007883310317993164, -0.0007006227970123291, -0.0006129145622253418, -0.0005252063274383545, -0.0004374980926513672, -0.0003497898578643799, -0.0002620816230773926, -0.00017437338829040527, -8.666515350341797e-05, 1.043081283569336e-06, 8.875131607055664e-05, 0.00017645955085754395, 0.00026416778564453125, 0.00035187602043151855, 0.00043958425521850586, 0.0005272924900054932, 0.0006150007247924805, 0.0007027089595794678, 0.0007904171943664551, 0.0008781254291534424, 0.0009658336639404297, 0.001053541898727417, 0.0011412501335144043, 0.0012289583683013916, 0.001316666603088379, 0.0014043748378753662, 0.0014920830726623535, 0.0015797913074493408, 0.0016674995422363281, 0.0017552077770233154, 0.0018429160118103027, 0.00193062424659729, 0.0020183324813842773, 0.0021060407161712646, 0.002193748950958252, 0.0022814571857452393, 0.0023691654205322266, 0.002456873655319214, 0.002544581890106201, 0.0026322901248931885, 0.0027199983596801758, 0.002807706594467163, 0.0028954148292541504, 0.0029831230640411377, 0.003070831298828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 8.0, 6.0, 10.0, 8.0, 13.0, 20.0, 18.0, 20.0, 33.0, 43.0, 58.0, 65.0, 76.0, 77.0, 97.0, 89.0, 72.0, 42.0, 57.0, 44.0, 33.0, 19.0, 29.0, 10.0, 12.0, 13.0, 6.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.735324859619141e-06, -6.498768925666809e-06, -6.2622129917144775e-06, -6.025657057762146e-06, -5.7891011238098145e-06, -5.552545189857483e-06, -5.315989255905151e-06, -5.07943332195282e-06, -4.842877388000488e-06, -4.606321454048157e-06, -4.369765520095825e-06, -4.133209586143494e-06, -3.896653652191162e-06, -3.6600977182388306e-06, -3.423541784286499e-06, -3.1869858503341675e-06, -2.950429916381836e-06, -2.7138739824295044e-06, -2.477318048477173e-06, -2.2407621145248413e-06, -2.0042061805725098e-06, -1.7676502466201782e-06, -1.5310943126678467e-06, -1.2945383787155151e-06, -1.0579824447631836e-06, -8.21426510810852e-07, -5.848705768585205e-07, -3.4831464290618896e-07, -1.1175870895385742e-07, 1.2479722499847412e-07, 3.6135315895080566e-07, 5.979090929031372e-07, 8.344650268554688e-07, 1.0710209608078003e-06, 1.3075768947601318e-06, 1.5441328287124634e-06, 1.780688762664795e-06, 2.0172446966171265e-06, 2.253800630569458e-06, 2.4903565645217896e-06, 2.726912498474121e-06, 2.9634684324264526e-06, 3.200024366378784e-06, 3.4365803003311157e-06, 3.6731362342834473e-06, 3.909692168235779e-06, 4.14624810218811e-06, 4.382804036140442e-06, 4.6193599700927734e-06, 4.855915904045105e-06, 5.0924718379974365e-06, 5.329027771949768e-06, 5.5655837059021e-06, 5.802139639854431e-06, 6.038695573806763e-06, 6.275251507759094e-06, 6.511807441711426e-06, 6.748363375663757e-06, 6.984919309616089e-06, 7.22147524356842e-06, 7.458031177520752e-06, 7.694587111473083e-06, 7.931143045425415e-06, 8.167698979377747e-06, 8.404254913330078e-06]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 5.0, 6.0, 10.0, 10.0, 18.0, 23.0, 32.0, 41.0, 63.0, 84.0, 176.0, 281.0, 493.0, 997.0, 2003.0, 4871.0, 12487.0, 35574.0, 106091.0, 274824.0, 349724.0, 169476.0, 58118.0, 19929.0, 7235.0, 2953.0, 1341.0, 687.0, 321.0, 220.0, 140.0, 88.0, 63.0, 54.0, 42.0, 18.0, 24.0, 9.0, 11.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0033721923828125, -0.0032736659049987793, -0.0031751394271850586, -0.003076612949371338, -0.002978086471557617, -0.0028795599937438965, -0.0027810335159301758, -0.002682507038116455, -0.0025839805603027344, -0.0024854540824890137, -0.002386927604675293, -0.0022884011268615723, -0.0021898746490478516, -0.002091348171234131, -0.00199282169342041, -0.0018942952156066895, -0.0017957687377929688, -0.001697242259979248, -0.0015987157821655273, -0.0015001893043518066, -0.001401662826538086, -0.0013031363487243652, -0.0012046098709106445, -0.0011060833930969238, -0.0010075569152832031, -0.0009090304374694824, -0.0008105039596557617, -0.000711977481842041, -0.0006134510040283203, -0.0005149245262145996, -0.0004163980484008789, -0.0003178715705871582, -0.0002193450927734375, -0.0001208186149597168, -2.2292137145996094e-05, 7.623434066772461e-05, 0.0001747608184814453, 0.000273287296295166, 0.0003718137741088867, 0.0004703402519226074, 0.0005688667297363281, 0.0006673932075500488, 0.0007659196853637695, 0.0008644461631774902, 0.0009629726409912109, 0.0010614991188049316, 0.0011600255966186523, 0.001258552074432373, 0.0013570785522460938, 0.0014556050300598145, 0.0015541315078735352, 0.0016526579856872559, 0.0017511844635009766, 0.0018497109413146973, 0.001948237419128418, 0.0020467638969421387, 0.0021452903747558594, 0.00224381685256958, 0.0023423433303833008, 0.0024408698081970215, 0.002539396286010742, 0.002637922763824463, 0.0027364492416381836, 0.0028349757194519043, 0.002933502197265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 5.0, 5.0, 10.0, 10.0, 10.0, 14.0, 9.0, 23.0, 18.0, 20.0, 28.0, 27.0, 44.0, 35.0, 45.0, 43.0, 52.0, 48.0, 53.0, 50.0, 62.0, 51.0, 48.0, 47.0, 48.0, 26.0, 29.0, 26.0, 23.0, 32.0, 16.0, 8.0, 8.0, 6.0, 4.0, 5.0, 7.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0007476806640625, -0.0007212907075881958, -0.0006949007511138916, -0.0006685107946395874, -0.0006421208381652832, -0.000615730881690979, -0.0005893409252166748, -0.0005629509687423706, -0.0005365610122680664, -0.0005101710557937622, -0.000483781099319458, -0.0004573911428451538, -0.0004310011863708496, -0.0004046112298965454, -0.0003782212734222412, -0.000351831316947937, -0.0003254413604736328, -0.0002990514039993286, -0.0002726614475250244, -0.0002462714910507202, -0.00021988153457641602, -0.00019349157810211182, -0.00016710162162780762, -0.00014071166515350342, -0.00011432170867919922, -8.793175220489502e-05, -6.154179573059082e-05, -3.515183925628662e-05, -8.761882781982422e-06, 1.7628073692321777e-05, 4.4018030166625977e-05, 7.040798664093018e-05, 9.679794311523438e-05, 0.00012318789958953857, 0.00014957785606384277, 0.00017596781253814697, 0.00020235776901245117, 0.00022874772548675537, 0.00025513768196105957, 0.00028152763843536377, 0.00030791759490966797, 0.00033430755138397217, 0.00036069750785827637, 0.00038708746433258057, 0.00041347742080688477, 0.00043986737728118896, 0.00046625733375549316, 0.0004926472902297974, 0.0005190372467041016, 0.0005454272031784058, 0.00057181715965271, 0.0005982071161270142, 0.0006245970726013184, 0.0006509870290756226, 0.0006773769855499268, 0.000703766942024231, 0.0007301568984985352, 0.0007565468549728394, 0.0007829368114471436, 0.0008093267679214478, 0.000835716724395752, 0.0008621066808700562, 0.0008884966373443604, 0.0009148865938186646, 0.0009412765502929688]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 14.0, 34.0, 61.0, 124.0, 245.0, 224.0, 165.0, 90.0, 29.0, 12.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7300755977630615, -0.7148867249488831, -0.6996978521347046, -0.6845089793205261, -0.6693201065063477, -0.6541312336921692, -0.6389423608779907, -0.6237534880638123, -0.6085646152496338, -0.5933757424354553, -0.5781868696212769, -0.5629979968070984, -0.5478091239929199, -0.5326202511787415, -0.517431378364563, -0.5022425055503845, -0.48705363273620605, -0.4718647599220276, -0.4566758871078491, -0.44148701429367065, -0.4262981414794922, -0.4111092686653137, -0.39592039585113525, -0.3807315230369568, -0.36554262042045593, -0.35035374760627747, -0.335164874792099, -0.31997600197792053, -0.30478712916374207, -0.2895982563495636, -0.27440938353538513, -0.25922051072120667, -0.244031623005867, -0.22884275019168854, -0.21365387737751007, -0.1984650045633316, -0.18327613174915314, -0.16808724403381348, -0.152898371219635, -0.13770949840545654, -0.12252063304185867, -0.1073317602276802, -0.09214288741350174, -0.07695400714874268, -0.06176513805985451, -0.04657626152038574, -0.031387388706207275, -0.01619851589202881, -0.0010096430778503418, 0.0141792306676507, 0.02936810441315174, 0.04455697908997536, 0.059745851904153824, 0.07493472844362259, 0.09012360125780106, 0.10531247407197952, 0.12050134688615799, 0.13569022715091705, 0.15087909996509552, 0.166067972779274, 0.18125684559345245, 0.19644571840763092, 0.2116345912218094, 0.22682346403598785, 0.24201233685016632]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 11.0, 8.0, 7.0, 12.0, 22.0, 18.0, 35.0, 35.0, 40.0, 65.0, 57.0, 45.0, 60.0, 57.0, 57.0, 54.0, 67.0, 55.0, 49.0, 46.0, 41.0, 41.0, 29.0, 28.0, 22.0, 15.0, 7.0, 11.0, 1.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1315542310476303, -0.12619411945343018, -0.12083400785923004, -0.11547389626502991, -0.11011378467082977, -0.10475367307662964, -0.09939355403184891, -0.09403344243764877, -0.08867333084344864, -0.0833132192492485, -0.07795310765504837, -0.07259298861026764, -0.0672328770160675, -0.06187276914715767, -0.056512653827667236, -0.0511525422334671, -0.04579243063926697, -0.040432319045066833, -0.0350722074508667, -0.029712092131376266, -0.024351980537176132, -0.018991868942975998, -0.013631753623485565, -0.008271642029285431, -0.0029115304350852966, 0.0024485820904374123, 0.007808694615960121, 0.013168808072805405, 0.01852891966700554, 0.023889031261205673, 0.029249146580696106, 0.03460925817489624, 0.039969369769096375, 0.04532948136329651, 0.05068959295749664, 0.056049708276987076, 0.06140981987118721, 0.06676992774009705, 0.07213004678487778, 0.07749015837907791, 0.08285026997327805, 0.08821038156747818, 0.09357049316167831, 0.09893061220645905, 0.10429072380065918, 0.10965083539485931, 0.11501094698905945, 0.12037105858325958, 0.12573117017745972, 0.13109128177165985, 0.13645139336585999, 0.14181150496006012, 0.14717161655426025, 0.1525317281484604, 0.15789183974266052, 0.16325196623802185, 0.1686120629310608, 0.17397217452526093, 0.17933228611946106, 0.1846923977136612, 0.19005250930786133, 0.19541262090206146, 0.2007727324962616, 0.20613285899162292, 0.21149297058582306]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 3.0, 11.0, 10.0, 11.0, 28.0, 37.0, 59.0, 76.0, 141.0, 234.0, 438.0, 974.0, 2486.0, 7659.0, 33058.0, 312824.0, 619353.0, 54330.0, 11028.0, 3345.0, 1218.0, 542.0, 261.0, 149.0, 94.0, 59.0, 43.0, 27.0, 18.0, 7.0, 7.0, 5.0, 8.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2330322265625, -0.22658348083496094, -0.22013473510742188, -0.2136859893798828, -0.20723724365234375, -0.2007884979248047, -0.19433975219726562, -0.18789100646972656, -0.1814422607421875, -0.17499351501464844, -0.16854476928710938, -0.1620960235595703, -0.15564727783203125, -0.1491985321044922, -0.14274978637695312, -0.13630104064941406, -0.129852294921875, -0.12340354919433594, -0.11695480346679688, -0.11050605773925781, -0.10405731201171875, -0.09760856628417969, -0.09115982055664062, -0.08471107482910156, -0.0782623291015625, -0.07181358337402344, -0.06536483764648438, -0.05891609191894531, -0.05246734619140625, -0.04601860046386719, -0.039569854736328125, -0.03312110900878906, -0.02667236328125, -0.020223617553710938, -0.013774871826171875, -0.0073261260986328125, -0.00087738037109375, 0.0055713653564453125, 0.012020111083984375, 0.018468856811523438, 0.0249176025390625, 0.03136634826660156, 0.037815093994140625, 0.04426383972167969, 0.05071258544921875, 0.05716133117675781, 0.06361007690429688, 0.07005882263183594, 0.076507568359375, 0.08295631408691406, 0.08940505981445312, 0.09585380554199219, 0.10230255126953125, 0.10875129699707031, 0.11520004272460938, 0.12164878845214844, 0.1280975341796875, 0.13454627990722656, 0.14099502563476562, 0.1474437713623047, 0.15389251708984375, 0.1603412628173828, 0.16679000854492188, 0.17323875427246094, 0.1796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 6.0, 4.0, 7.0, 10.0, 11.0, 14.0, 22.0, 21.0, 36.0, 42.0, 59.0, 54.0, 52.0, 55.0, 75.0, 66.0, 69.0, 58.0, 52.0, 59.0, 49.0, 41.0, 38.0, 25.0, 30.0, 16.0, 10.0, 13.0, 5.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.328857421875, -0.3184661865234375, -0.308074951171875, -0.2976837158203125, -0.28729248046875, -0.2769012451171875, -0.266510009765625, -0.2561187744140625, -0.2457275390625, -0.2353363037109375, -0.224945068359375, -0.2145538330078125, -0.20416259765625, -0.1937713623046875, -0.183380126953125, -0.1729888916015625, -0.16259765625, -0.1522064208984375, -0.141815185546875, -0.1314239501953125, -0.12103271484375, -0.1106414794921875, -0.100250244140625, -0.0898590087890625, -0.0794677734375, -0.0690765380859375, -0.058685302734375, -0.0482940673828125, -0.03790283203125, -0.0275115966796875, -0.017120361328125, -0.0067291259765625, 0.003662109375, 0.0140533447265625, 0.024444580078125, 0.0348358154296875, 0.04522705078125, 0.0556182861328125, 0.066009521484375, 0.0764007568359375, 0.0867919921875, 0.0971832275390625, 0.107574462890625, 0.1179656982421875, 0.12835693359375, 0.1387481689453125, 0.149139404296875, 0.1595306396484375, 0.169921875, 0.1803131103515625, 0.190704345703125, 0.2010955810546875, 0.21148681640625, 0.2218780517578125, 0.232269287109375, 0.2426605224609375, 0.2530517578125, 0.2634429931640625, 0.273834228515625, 0.2842254638671875, 0.29461669921875, 0.3050079345703125, 0.315399169921875, 0.3257904052734375, 0.336181640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 6.0, 4.0, 8.0, 11.0, 13.0, 25.0, 38.0, 35.0, 51.0, 78.0, 105.0, 119.0, 195.0, 321.0, 581.0, 1782.0, 15319.0, 854611.0, 167445.0, 5371.0, 1083.0, 444.0, 254.0, 151.0, 127.0, 94.0, 60.0, 41.0, 39.0, 28.0, 28.0, 23.0, 15.0, 13.0, 5.0, 7.0, 7.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.398681640625, -0.3848381042480469, -0.37099456787109375, -0.3571510314941406, -0.3433074951171875, -0.3294639587402344, -0.31562042236328125, -0.3017768859863281, -0.287933349609375, -0.2740898132324219, -0.26024627685546875, -0.24640274047851562, -0.2325592041015625, -0.21871566772460938, -0.20487213134765625, -0.19102859497070312, -0.17718505859375, -0.16334152221679688, -0.14949798583984375, -0.13565444946289062, -0.1218109130859375, -0.10796737670898438, -0.09412384033203125, -0.08028030395507812, -0.066436767578125, -0.052593231201171875, -0.03874969482421875, -0.024906158447265625, -0.0110626220703125, 0.002780914306640625, 0.01662445068359375, 0.030467987060546875, 0.0443115234375, 0.058155059814453125, 0.07199859619140625, 0.08584213256835938, 0.0996856689453125, 0.11352920532226562, 0.12737274169921875, 0.14121627807617188, 0.155059814453125, 0.16890335083007812, 0.18274688720703125, 0.19659042358398438, 0.2104339599609375, 0.22427749633789062, 0.23812103271484375, 0.2519645690917969, 0.26580810546875, 0.2796516418457031, 0.29349517822265625, 0.3073387145996094, 0.3211822509765625, 0.3350257873535156, 0.34886932373046875, 0.3627128601074219, 0.376556396484375, 0.3903999328613281, 0.40424346923828125, 0.4180870056152344, 0.4319305419921875, 0.4457740783691406, 0.45961761474609375, 0.4734611511230469, 0.4873046875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 6.0, 9.0, 5.0, 13.0, 13.0, 19.0, 14.0, 16.0, 15.0, 14.0, 27.0, 38.0, 43.0, 55.0, 49.0, 49.0, 42.0, 51.0, 57.0, 49.0, 38.0, 53.0, 29.0, 38.0, 35.0, 25.0, 32.0, 28.0, 15.0, 17.0, 19.0, 13.0, 15.0, 8.0, 5.0, 9.0, 4.0, 8.0, 3.0, 3.0, 3.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.277099609375, -0.26732635498046875, -0.2575531005859375, -0.24777984619140625, -0.238006591796875, -0.22823333740234375, -0.2184600830078125, -0.20868682861328125, -0.19891357421875, -0.18914031982421875, -0.1793670654296875, -0.16959381103515625, -0.159820556640625, -0.15004730224609375, -0.1402740478515625, -0.13050079345703125, -0.1207275390625, -0.11095428466796875, -0.1011810302734375, -0.09140777587890625, -0.081634521484375, -0.07186126708984375, -0.0620880126953125, -0.05231475830078125, -0.04254150390625, -0.03276824951171875, -0.0229949951171875, -0.01322174072265625, -0.003448486328125, 0.00632476806640625, 0.0160980224609375, 0.02587127685546875, 0.03564453125, 0.04541778564453125, 0.0551910400390625, 0.06496429443359375, 0.074737548828125, 0.08451080322265625, 0.0942840576171875, 0.10405731201171875, 0.11383056640625, 0.12360382080078125, 0.1333770751953125, 0.14315032958984375, 0.152923583984375, 0.16269683837890625, 0.1724700927734375, 0.18224334716796875, 0.1920166015625, 0.20178985595703125, 0.2115631103515625, 0.22133636474609375, 0.231109619140625, 0.24088287353515625, 0.2506561279296875, 0.26042938232421875, 0.27020263671875, 0.27997589111328125, 0.2897491455078125, 0.29952239990234375, 0.309295654296875, 0.31906890869140625, 0.3288421630859375, 0.33861541748046875, 0.348388671875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 16.0, 9.0, 14.0, 17.0, 34.0, 51.0, 110.0, 271.0, 772.0, 2927.0, 18237.0, 847851.0, 165757.0, 9673.0, 1858.0, 473.0, 208.0, 71.0, 37.0, 41.0, 32.0, 13.0, 16.0, 6.0, 9.0, 6.0, 5.0, 5.0, 1.0, 4.0, 6.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11004638671875, -0.1060953140258789, -0.10214424133300781, -0.09819316864013672, -0.09424209594726562, -0.09029102325439453, -0.08633995056152344, -0.08238887786865234, -0.07843780517578125, -0.07448673248291016, -0.07053565979003906, -0.06658458709716797, -0.06263351440429688, -0.05868244171142578, -0.05473136901855469, -0.050780296325683594, -0.0468292236328125, -0.042878150939941406, -0.03892707824707031, -0.03497600555419922, -0.031024932861328125, -0.02707386016845703, -0.023122787475585938, -0.019171714782714844, -0.01522064208984375, -0.011269569396972656, -0.0073184967041015625, -0.0033674240112304688, 0.000583648681640625, 0.004534721374511719, 0.008485794067382812, 0.012436866760253906, 0.016387939453125, 0.020339012145996094, 0.024290084838867188, 0.02824115753173828, 0.032192230224609375, 0.03614330291748047, 0.04009437561035156, 0.044045448303222656, 0.04799652099609375, 0.051947593688964844, 0.05589866638183594, 0.05984973907470703, 0.06380081176757812, 0.06775188446044922, 0.07170295715332031, 0.0756540298461914, 0.0796051025390625, 0.0835561752319336, 0.08750724792480469, 0.09145832061767578, 0.09540939331054688, 0.09936046600341797, 0.10331153869628906, 0.10726261138916016, 0.11121368408203125, 0.11516475677490234, 0.11911582946777344, 0.12306690216064453, 0.12701797485351562, 0.13096904754638672, 0.1349201202392578, 0.1388711929321289, 0.142822265625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 5.0, 5.0, 16.0, 8.0, 5.0, 7.0, 17.0, 26.0, 42.0, 59.0, 130.0, 188.0, 209.0, 120.0, 55.0, 31.0, 19.0, 17.0, 13.0, 11.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0728836059570312e-05, -1.039169728755951e-05, -1.0054558515548706e-05, -9.717419743537903e-06, -9.3802809715271e-06, -9.043142199516296e-06, -8.706003427505493e-06, -8.36886465549469e-06, -8.031725883483887e-06, -7.694587111473083e-06, -7.35744833946228e-06, -7.020309567451477e-06, -6.683170795440674e-06, -6.346032023429871e-06, -6.008893251419067e-06, -5.671754479408264e-06, -5.334615707397461e-06, -4.997476935386658e-06, -4.6603381633758545e-06, -4.323199391365051e-06, -3.986060619354248e-06, -3.648921847343445e-06, -3.3117830753326416e-06, -2.9746443033218384e-06, -2.637505531311035e-06, -2.300366759300232e-06, -1.9632279872894287e-06, -1.6260892152786255e-06, -1.2889504432678223e-06, -9.51811671257019e-07, -6.146728992462158e-07, -2.775341272354126e-07, 5.960464477539063e-08, 3.9674341678619385e-07, 7.338821887969971e-07, 1.0710209608078003e-06, 1.4081597328186035e-06, 1.7452985048294067e-06, 2.08243727684021e-06, 2.419576048851013e-06, 2.7567148208618164e-06, 3.0938535928726196e-06, 3.430992364883423e-06, 3.768131136894226e-06, 4.105269908905029e-06, 4.4424086809158325e-06, 4.779547452926636e-06, 5.116686224937439e-06, 5.453824996948242e-06, 5.790963768959045e-06, 6.128102540969849e-06, 6.465241312980652e-06, 6.802380084991455e-06, 7.139518857002258e-06, 7.4766576290130615e-06, 7.813796401023865e-06, 8.150935173034668e-06, 8.488073945045471e-06, 8.825212717056274e-06, 9.162351489067078e-06, 9.499490261077881e-06, 9.836629033088684e-06, 1.0173767805099487e-05, 1.051090657711029e-05, 1.0848045349121094e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 8.0, 14.0, 10.0, 21.0, 70.0, 94.0, 221.0, 659.0, 2819.0, 30765.0, 984696.0, 25609.0, 2533.0, 592.0, 224.0, 107.0, 33.0, 28.0, 13.0, 15.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.2349853515625, -0.22816848754882812, -0.22135162353515625, -0.21453475952148438, -0.2077178955078125, -0.20090103149414062, -0.19408416748046875, -0.18726730346679688, -0.180450439453125, -0.17363357543945312, -0.16681671142578125, -0.15999984741210938, -0.1531829833984375, -0.14636611938476562, -0.13954925537109375, -0.13273239135742188, -0.12591552734375, -0.11909866333007812, -0.11228179931640625, -0.10546493530273438, -0.0986480712890625, -0.09183120727539062, -0.08501434326171875, -0.07819747924804688, -0.071380615234375, -0.06456375122070312, -0.05774688720703125, -0.050930023193359375, -0.0441131591796875, -0.037296295166015625, -0.03047943115234375, -0.023662567138671875, -0.016845703125, -0.010028839111328125, -0.00321197509765625, 0.003604888916015625, 0.0104217529296875, 0.017238616943359375, 0.02405548095703125, 0.030872344970703125, 0.037689208984375, 0.044506072998046875, 0.05132293701171875, 0.058139801025390625, 0.0649566650390625, 0.07177352905273438, 0.07859039306640625, 0.08540725708007812, 0.09222412109375, 0.09904098510742188, 0.10585784912109375, 0.11267471313476562, 0.1194915771484375, 0.12630844116210938, 0.13312530517578125, 0.13994216918945312, 0.146759033203125, 0.15357589721679688, 0.16039276123046875, 0.16720962524414062, 0.1740264892578125, 0.18084335327148438, 0.18766021728515625, 0.19447708129882812, 0.2012939453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 7.0, 4.0, 10.0, 10.0, 14.0, 14.0, 39.0, 65.0, 168.0, 412.0, 122.0, 54.0, 24.0, 16.0, 14.0, 9.0, 3.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06524658203125, -0.06316757202148438, -0.06108856201171875, -0.059009552001953125, -0.0569305419921875, -0.054851531982421875, -0.05277252197265625, -0.050693511962890625, -0.048614501953125, -0.046535491943359375, -0.04445648193359375, -0.042377471923828125, -0.0402984619140625, -0.038219451904296875, -0.03614044189453125, -0.034061431884765625, -0.031982421875, -0.029903411865234375, -0.02782440185546875, -0.025745391845703125, -0.0236663818359375, -0.021587371826171875, -0.01950836181640625, -0.017429351806640625, -0.015350341796875, -0.013271331787109375, -0.01119232177734375, -0.009113311767578125, -0.0070343017578125, -0.004955291748046875, -0.00287628173828125, -0.000797271728515625, 0.00128173828125, 0.003360748291015625, 0.00543975830078125, 0.007518768310546875, 0.0095977783203125, 0.011676788330078125, 0.01375579833984375, 0.015834808349609375, 0.017913818359375, 0.019992828369140625, 0.02207183837890625, 0.024150848388671875, 0.0262298583984375, 0.028308868408203125, 0.03038787841796875, 0.032466888427734375, 0.0345458984375, 0.036624908447265625, 0.03870391845703125, 0.040782928466796875, 0.0428619384765625, 0.044940948486328125, 0.04701995849609375, 0.049098968505859375, 0.051177978515625, 0.053256988525390625, 0.05533599853515625, 0.057415008544921875, 0.0594940185546875, 0.061573028564453125, 0.06365203857421875, 0.06573104858398438, 0.06781005859375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 6.0, 15.0, 21.0, 28.0, 33.0, 43.0, 90.0, 118.0, 102.0, 104.0, 117.0, 81.0, 81.0, 56.0, 37.0, 21.0, 13.0, 10.0, 6.0, 7.0, 0.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5503585338592529, -0.5363423228263855, -0.5223261117935181, -0.5083099603652954, -0.494293749332428, -0.48027753829956055, -0.4662613272666931, -0.45224514603614807, -0.438228964805603, -0.4242127537727356, -0.41019657254219055, -0.3961803615093231, -0.3821641802787781, -0.36814796924591064, -0.3541317582130432, -0.34011557698249817, -0.32609936594963074, -0.3120831549167633, -0.29806697368621826, -0.28405076265335083, -0.2700345814228058, -0.25601837038993835, -0.24200217425823212, -0.22798597812652588, -0.21396978199481964, -0.1999535858631134, -0.18593738973140717, -0.17192119359970093, -0.1579049825668335, -0.14388880133628845, -0.12987259030342102, -0.11585639417171478, -0.10184022784233093, -0.0878240317106247, -0.07380783557891846, -0.05979163199663162, -0.045775435864925385, -0.03175923973321915, -0.017743036150932312, -0.0037268400192260742, 0.010289356112480164, 0.02430555410683155, 0.03832175210118294, 0.052337951958179474, 0.06635414808988571, 0.08037034422159195, 0.09438654780387878, 0.10840274393558502, 0.12241894006729126, 0.1364351361989975, 0.15045133233070374, 0.16446754336357117, 0.1784837245941162, 0.19249993562698364, 0.20651613175868988, 0.22053232789039612, 0.23454852402210236, 0.2485647201538086, 0.262580931186676, 0.27659711241722107, 0.2906133234500885, 0.30462950468063354, 0.318645715713501, 0.3326619267463684, 0.34667810797691345]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 12.0, 12.0, 9.0, 15.0, 16.0, 20.0, 24.0, 32.0, 37.0, 58.0, 35.0, 55.0, 55.0, 41.0, 51.0, 56.0, 64.0, 54.0, 55.0, 52.0, 49.0, 40.0, 33.0, 31.0, 17.0, 23.0, 12.0, 16.0, 11.0, 7.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7299357652664185, -0.7077171802520752, -0.6854985356330872, -0.6632798910140991, -0.6410613059997559, -0.6188427209854126, -0.5966240763664246, -0.5744054317474365, -0.5521868467330933, -0.52996826171875, -0.507749617099762, -0.4855310022830963, -0.46331238746643066, -0.441093772649765, -0.41887515783309937, -0.3966565430164337, -0.37443792819976807, -0.3522193133831024, -0.33000069856643677, -0.3077820837497711, -0.28556346893310547, -0.2633448541164398, -0.24112623929977417, -0.21890762448310852, -0.19668900966644287, -0.17447039484977722, -0.15225178003311157, -0.13003316521644592, -0.10781455039978027, -0.08559593558311462, -0.06337732076644897, -0.041158705949783325, -0.018940091133117676, 0.0032785236835479736, 0.025497138500213623, 0.04771575331687927, 0.06993436813354492, 0.09215298295021057, 0.11437159776687622, 0.13659021258354187, 0.15880882740020752, 0.18102744221687317, 0.20324605703353882, 0.22546467185020447, 0.24768328666687012, 0.26990190148353577, 0.2921205163002014, 0.31433913111686707, 0.3365577459335327, 0.35877636075019836, 0.380994975566864, 0.40321359038352966, 0.4254322052001953, 0.44765082001686096, 0.4698694348335266, 0.49208804965019226, 0.5143066644668579, 0.5365252494812012, 0.5587438941001892, 0.5809625387191772, 0.6031811237335205, 0.6253997087478638, 0.6476183533668518, 0.6698369979858398, 0.6920555830001831]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 1.0, 4.0, 6.0, 7.0, 4.0, 12.0, 15.0, 28.0, 23.0, 42.0, 44.0, 61.0, 67.0, 77.0, 99.0, 164.0, 257.0, 444.0, 831.0, 1938.0, 6701.0, 33676.0, 2722658.0, 1393390.0, 25195.0, 4903.0, 1713.0, 648.0, 401.0, 218.0, 142.0, 120.0, 92.0, 62.0, 51.0, 39.0, 30.0, 21.0, 30.0, 26.0, 11.0, 9.0, 3.0, 8.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.493408203125, -0.4774513244628906, -0.46149444580078125, -0.4455375671386719, -0.4295806884765625, -0.4136238098144531, -0.39766693115234375, -0.3817100524902344, -0.365753173828125, -0.3497962951660156, -0.33383941650390625, -0.3178825378417969, -0.3019256591796875, -0.2859687805175781, -0.27001190185546875, -0.2540550231933594, -0.23809814453125, -0.22214126586914062, -0.20618438720703125, -0.19022750854492188, -0.1742706298828125, -0.15831375122070312, -0.14235687255859375, -0.12639999389648438, -0.110443115234375, -0.09448623657226562, -0.07852935791015625, -0.06257247924804688, -0.0466156005859375, -0.030658721923828125, -0.01470184326171875, 0.001255035400390625, 0.0172119140625, 0.033168792724609375, 0.04912567138671875, 0.06508255004882812, 0.0810394287109375, 0.09699630737304688, 0.11295318603515625, 0.12891006469726562, 0.144866943359375, 0.16082382202148438, 0.17678070068359375, 0.19273757934570312, 0.2086944580078125, 0.22465133666992188, 0.24060821533203125, 0.2565650939941406, 0.27252197265625, 0.2884788513183594, 0.30443572998046875, 0.3203926086425781, 0.3363494873046875, 0.3523063659667969, 0.36826324462890625, 0.3842201232910156, 0.400177001953125, 0.4161338806152344, 0.43209075927734375, 0.4480476379394531, 0.4640045166015625, 0.4799613952636719, 0.49591827392578125, 0.5118751525878906, 0.52783203125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 12.0, 8.0, 17.0, 24.0, 37.0, 41.0, 57.0, 89.0, 93.0, 101.0, 83.0, 91.0, 82.0, 71.0, 49.0, 51.0, 39.0, 26.0, 20.0, 4.0, 6.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2154541015625, -0.20728111267089844, -0.19910812377929688, -0.1909351348876953, -0.18276214599609375, -0.1745891571044922, -0.16641616821289062, -0.15824317932128906, -0.1500701904296875, -0.14189720153808594, -0.13372421264648438, -0.1255512237548828, -0.11737823486328125, -0.10920524597167969, -0.10103225708007812, -0.09285926818847656, -0.084686279296875, -0.07651329040527344, -0.06834030151367188, -0.06016731262207031, -0.05199432373046875, -0.04382133483886719, -0.035648345947265625, -0.027475357055664062, -0.0193023681640625, -0.011129379272460938, -0.002956390380859375, 0.0052165985107421875, 0.01338958740234375, 0.021562576293945312, 0.029735565185546875, 0.03790855407714844, 0.04608154296875, 0.05425453186035156, 0.062427520751953125, 0.07060050964355469, 0.07877349853515625, 0.08694648742675781, 0.09511947631835938, 0.10329246520996094, 0.1114654541015625, 0.11963844299316406, 0.12781143188476562, 0.1359844207763672, 0.14415740966796875, 0.1523303985595703, 0.16050338745117188, 0.16867637634277344, 0.176849365234375, 0.18502235412597656, 0.19319534301757812, 0.2013683319091797, 0.20954132080078125, 0.2177143096923828, 0.22588729858398438, 0.23406028747558594, 0.2422332763671875, 0.25040626525878906, 0.2585792541503906, 0.2667522430419922, 0.27492523193359375, 0.2830982208251953, 0.2912712097167969, 0.29944419860839844, 0.3076171875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 7.0, 9.0, 14.0, 14.0, 30.0, 62.0, 156.0, 474.0, 2932.0, 134493.0, 4046513.0, 8203.0, 931.0, 253.0, 89.0, 41.0, 23.0, 13.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85986328125, -0.8227920532226562, -0.7857208251953125, -0.7486495971679688, -0.711578369140625, -0.6745071411132812, -0.6374359130859375, -0.6003646850585938, -0.56329345703125, -0.5262222290039062, -0.4891510009765625, -0.45207977294921875, -0.415008544921875, -0.37793731689453125, -0.3408660888671875, -0.30379486083984375, -0.2667236328125, -0.22965240478515625, -0.1925811767578125, -0.15550994873046875, -0.118438720703125, -0.08136749267578125, -0.0442962646484375, -0.00722503662109375, 0.02984619140625, 0.06691741943359375, 0.1039886474609375, 0.14105987548828125, 0.178131103515625, 0.21520233154296875, 0.2522735595703125, 0.28934478759765625, 0.326416015625, 0.36348724365234375, 0.4005584716796875, 0.43762969970703125, 0.474700927734375, 0.5117721557617188, 0.5488433837890625, 0.5859146118164062, 0.62298583984375, 0.6600570678710938, 0.6971282958984375, 0.7341995239257812, 0.771270751953125, 0.8083419799804688, 0.8454132080078125, 0.8824844360351562, 0.9195556640625, 0.9566268920898438, 0.9936981201171875, 1.0307693481445312, 1.067840576171875, 1.1049118041992188, 1.1419830322265625, 1.1790542602539062, 1.21612548828125, 1.2531967163085938, 1.2902679443359375, 1.3273391723632812, 1.364410400390625, 1.4014816284179688, 1.4385528564453125, 1.4756240844726562, 1.5126953125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 17.0, 12.0, 30.0, 46.0, 60.0, 146.0, 453.0, 1287.0, 1308.0, 416.0, 113.0, 71.0, 37.0, 19.0, 11.0, 10.0, 10.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1732177734375, -0.16840553283691406, -0.16359329223632812, -0.1587810516357422, -0.15396881103515625, -0.1491565704345703, -0.14434432983398438, -0.13953208923339844, -0.1347198486328125, -0.12990760803222656, -0.12509536743164062, -0.12028312683105469, -0.11547088623046875, -0.11065864562988281, -0.10584640502929688, -0.10103416442871094, -0.096221923828125, -0.09140968322753906, -0.08659744262695312, -0.08178520202636719, -0.07697296142578125, -0.07216072082519531, -0.06734848022460938, -0.06253623962402344, -0.0577239990234375, -0.05291175842285156, -0.048099517822265625, -0.04328727722167969, -0.03847503662109375, -0.03366279602050781, -0.028850555419921875, -0.024038314819335938, -0.01922607421875, -0.014413833618164062, -0.009601593017578125, -0.0047893524169921875, 2.288818359375e-05, 0.0048351287841796875, 0.009647369384765625, 0.014459609985351562, 0.0192718505859375, 0.024084091186523438, 0.028896331787109375, 0.03370857238769531, 0.03852081298828125, 0.04333305358886719, 0.048145294189453125, 0.05295753479003906, 0.057769775390625, 0.06258201599121094, 0.06739425659179688, 0.07220649719238281, 0.07701873779296875, 0.08183097839355469, 0.08664321899414062, 0.09145545959472656, 0.0962677001953125, 0.10107994079589844, 0.10589218139648438, 0.11070442199707031, 0.11551666259765625, 0.12032890319824219, 0.12514114379882812, 0.12995338439941406, 0.134765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 9.0, 11.0, 12.0, 23.0, 29.0, 38.0, 54.0, 55.0, 58.0, 93.0, 92.0, 90.0, 85.0, 91.0, 67.0, 44.0, 44.0, 26.0, 18.0, 18.0, 14.0, 8.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2212124913930893, -0.2131403088569641, -0.20506811141967773, -0.19699592888355255, -0.18892373144626617, -0.180851548910141, -0.17277935147285461, -0.16470716893672943, -0.15663498640060425, -0.14856280386447906, -0.1404906064271927, -0.1324184238910675, -0.12434622645378113, -0.11627404391765594, -0.10820185393095016, -0.10012966394424438, -0.09205746650695801, -0.08398527652025223, -0.07591308653354645, -0.06784090399742126, -0.059768710285425186, -0.051696520298719406, -0.043624334037303925, -0.035552144050598145, -0.027479954063892365, -0.019407764077186584, -0.011335575953125954, -0.003263387829065323, 0.004808802157640457, 0.012880992144346237, 0.02095317840576172, 0.0290253683924675, 0.03709757328033447, 0.04516976326704025, 0.05324195325374603, 0.061314139515161514, 0.06938633322715759, 0.07745851576328278, 0.08553070574998856, 0.09360289573669434, 0.10167508572340012, 0.1097472757101059, 0.11781946569681168, 0.12589165568351746, 0.13396383821964264, 0.14203603565692902, 0.1501082181930542, 0.15818041563034058, 0.16625259816646576, 0.17432478070259094, 0.18239697813987732, 0.1904691606760025, 0.19854135811328888, 0.20661354064941406, 0.21468573808670044, 0.22275792062282562, 0.2308301031589508, 0.238902285695076, 0.24697448313236237, 0.25504666566848755, 0.2631188631057739, 0.2711910605430603, 0.2792632281780243, 0.28733542561531067, 0.29540762305259705]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 9.0, 12.0, 14.0, 17.0, 19.0, 24.0, 44.0, 29.0, 57.0, 39.0, 53.0, 63.0, 55.0, 74.0, 56.0, 66.0, 43.0, 53.0, 44.0, 39.0, 36.0, 29.0, 37.0, 16.0, 17.0, 14.0, 13.0, 14.0, 2.0, 1.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15524552762508392, -0.14874964952468872, -0.14225377142429352, -0.13575789332389832, -0.1292620152235031, -0.12276613712310791, -0.11627025157213211, -0.10977437347173691, -0.1032784953713417, -0.0967826172709465, -0.0902867391705513, -0.0837908536195755, -0.0772949755191803, -0.0707990974187851, -0.06430321931838989, -0.05780734121799469, -0.05131146311759949, -0.044815585017204285, -0.03831970691680908, -0.03182382509112358, -0.02532794699072838, -0.018832068890333176, -0.012336187064647675, -0.005840308964252472, 0.0006555691361427307, 0.007151448167860508, 0.013647327199578285, 0.020143207162618637, 0.02663908526301384, 0.03313496336340904, 0.03963084518909454, 0.046126723289489746, 0.052622586488723755, 0.05911846458911896, 0.06561434268951416, 0.07211022078990936, 0.07860609889030457, 0.08510197699069977, 0.09159786254167557, 0.09809374064207077, 0.10458961874246597, 0.11108549684286118, 0.11758137494325638, 0.12407726049423218, 0.13057313859462738, 0.13706901669502258, 0.14356489479541779, 0.150060772895813, 0.1565566509962082, 0.1630525290966034, 0.1695484071969986, 0.1760442852973938, 0.182540163397789, 0.1890360414981842, 0.1955319344997406, 0.2020277976989746, 0.208523690700531, 0.2150195688009262, 0.2215154469013214, 0.2280113250017166, 0.23450720310211182, 0.24100308120250702, 0.24749895930290222, 0.2539948523044586, 0.2604907155036926]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 10.0, 5.0, 10.0, 19.0, 32.0, 41.0, 55.0, 135.0, 213.0, 410.0, 886.0, 2297.0, 6941.0, 28858.0, 181568.0, 678539.0, 118435.0, 21167.0, 5477.0, 1914.0, 706.0, 375.0, 175.0, 109.0, 75.0, 37.0, 24.0, 20.0, 8.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07415771484375, -0.07154655456542969, -0.06893539428710938, -0.06632423400878906, -0.06371307373046875, -0.06110191345214844, -0.058490753173828125, -0.05587959289550781, -0.0532684326171875, -0.05065727233886719, -0.048046112060546875, -0.04543495178222656, -0.04282379150390625, -0.04021263122558594, -0.037601470947265625, -0.03499031066894531, -0.032379150390625, -0.029767990112304688, -0.027156829833984375, -0.024545669555664062, -0.02193450927734375, -0.019323348999023438, -0.016712188720703125, -0.014101028442382812, -0.0114898681640625, -0.008878707885742188, -0.006267547607421875, -0.0036563873291015625, -0.00104522705078125, 0.0015659332275390625, 0.004177093505859375, 0.0067882537841796875, 0.0093994140625, 0.012010574340820312, 0.014621734619140625, 0.017232894897460938, 0.01984405517578125, 0.022455215454101562, 0.025066375732421875, 0.027677536010742188, 0.0302886962890625, 0.03289985656738281, 0.035511016845703125, 0.03812217712402344, 0.04073333740234375, 0.04334449768066406, 0.045955657958984375, 0.04856681823730469, 0.051177978515625, 0.05378913879394531, 0.056400299072265625, 0.05901145935058594, 0.06162261962890625, 0.06423377990722656, 0.06684494018554688, 0.06945610046386719, 0.0720672607421875, 0.07467842102050781, 0.07728958129882812, 0.07990074157714844, 0.08251190185546875, 0.08512306213378906, 0.08773422241210938, 0.09034538269042969, 0.09295654296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 4.0, 8.0, 13.0, 18.0, 21.0, 25.0, 45.0, 66.0, 57.0, 81.0, 81.0, 75.0, 87.0, 86.0, 68.0, 57.0, 58.0, 40.0, 33.0, 22.0, 22.0, 20.0, 10.0, 3.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.147705078125, -0.14245033264160156, -0.13719558715820312, -0.1319408416748047, -0.12668609619140625, -0.12143135070800781, -0.11617660522460938, -0.11092185974121094, -0.1056671142578125, -0.10041236877441406, -0.09515762329101562, -0.08990287780761719, -0.08464813232421875, -0.07939338684082031, -0.07413864135742188, -0.06888389587402344, -0.063629150390625, -0.05837440490722656, -0.053119659423828125, -0.04786491394042969, -0.04261016845703125, -0.03735542297363281, -0.032100677490234375, -0.026845932006835938, -0.0215911865234375, -0.016336441040039062, -0.011081695556640625, -0.0058269500732421875, -0.00057220458984375, 0.0046825408935546875, 0.009937286376953125, 0.015192031860351562, 0.02044677734375, 0.025701522827148438, 0.030956268310546875, 0.03621101379394531, 0.04146575927734375, 0.04672050476074219, 0.051975250244140625, 0.05722999572753906, 0.0624847412109375, 0.06773948669433594, 0.07299423217773438, 0.07824897766113281, 0.08350372314453125, 0.08875846862792969, 0.09401321411132812, 0.09926795959472656, 0.104522705078125, 0.10977745056152344, 0.11503219604492188, 0.12028694152832031, 0.12554168701171875, 0.1307964324951172, 0.13605117797851562, 0.14130592346191406, 0.1465606689453125, 0.15181541442871094, 0.15707015991210938, 0.1623249053955078, 0.16757965087890625, 0.1728343963623047, 0.17808914184570312, 0.18334388732910156, 0.1885986328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 10.0, 15.0, 25.0, 42.0, 43.0, 59.0, 87.0, 146.0, 186.0, 332.0, 461.0, 674.0, 1012.0, 1576.0, 2597.0, 4180.0, 6870.0, 11934.0, 21113.0, 40617.0, 85328.0, 194948.0, 307421.0, 193169.0, 84598.0, 40071.0, 21184.0, 11731.0, 6842.0, 4162.0, 2478.0, 1612.0, 1023.0, 693.0, 402.0, 291.0, 199.0, 153.0, 64.0, 59.0, 55.0, 19.0, 20.0, 21.0, 6.0, 3.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0246124267578125, -0.023830890655517578, -0.023049354553222656, -0.022267818450927734, -0.021486282348632812, -0.02070474624633789, -0.01992321014404297, -0.019141674041748047, -0.018360137939453125, -0.017578601837158203, -0.01679706573486328, -0.01601552963256836, -0.015233993530273438, -0.014452457427978516, -0.013670921325683594, -0.012889385223388672, -0.01210784912109375, -0.011326313018798828, -0.010544776916503906, -0.009763240814208984, -0.008981704711914062, -0.00820016860961914, -0.007418632507324219, -0.006637096405029297, -0.005855560302734375, -0.005074024200439453, -0.004292488098144531, -0.0035109519958496094, -0.0027294158935546875, -0.0019478797912597656, -0.0011663436889648438, -0.0003848075866699219, 0.000396728515625, 0.0011782646179199219, 0.0019598007202148438, 0.0027413368225097656, 0.0035228729248046875, 0.004304409027099609, 0.005085945129394531, 0.005867481231689453, 0.006649017333984375, 0.007430553436279297, 0.008212089538574219, 0.00899362564086914, 0.009775161743164062, 0.010556697845458984, 0.011338233947753906, 0.012119770050048828, 0.01290130615234375, 0.013682842254638672, 0.014464378356933594, 0.015245914459228516, 0.016027450561523438, 0.01680898666381836, 0.01759052276611328, 0.018372058868408203, 0.019153594970703125, 0.019935131072998047, 0.02071666717529297, 0.02149820327758789, 0.022279739379882812, 0.023061275482177734, 0.023842811584472656, 0.024624347686767578, 0.0254058837890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 9.0, 7.0, 12.0, 14.0, 21.0, 18.0, 21.0, 22.0, 31.0, 48.0, 37.0, 49.0, 58.0, 66.0, 66.0, 62.0, 70.0, 54.0, 51.0, 44.0, 39.0, 29.0, 36.0, 18.0, 30.0, 17.0, 10.0, 15.0, 8.0, 4.0, 10.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2261962890625, -0.2175769805908203, -0.20895767211914062, -0.20033836364746094, -0.19171905517578125, -0.18309974670410156, -0.17448043823242188, -0.1658611297607422, -0.1572418212890625, -0.1486225128173828, -0.14000320434570312, -0.13138389587402344, -0.12276458740234375, -0.11414527893066406, -0.10552597045898438, -0.09690666198730469, -0.088287353515625, -0.07966804504394531, -0.07104873657226562, -0.06242942810058594, -0.05381011962890625, -0.04519081115722656, -0.036571502685546875, -0.027952194213867188, -0.0193328857421875, -0.010713577270507812, -0.002094268798828125, 0.0065250396728515625, 0.01514434814453125, 0.023763656616210938, 0.032382965087890625, 0.04100227355957031, 0.04962158203125, 0.05824089050292969, 0.06686019897460938, 0.07547950744628906, 0.08409881591796875, 0.09271812438964844, 0.10133743286132812, 0.10995674133300781, 0.1185760498046875, 0.1271953582763672, 0.13581466674804688, 0.14443397521972656, 0.15305328369140625, 0.16167259216308594, 0.17029190063476562, 0.1789112091064453, 0.187530517578125, 0.1961498260498047, 0.20476913452148438, 0.21338844299316406, 0.22200775146484375, 0.23062705993652344, 0.23924636840820312, 0.2478656768798828, 0.2564849853515625, 0.2651042938232422, 0.2737236022949219, 0.28234291076660156, 0.29096221923828125, 0.29958152770996094, 0.3082008361816406, 0.3168201446533203, 0.325439453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 7.0, 4.0, 13.0, 27.0, 26.0, 36.0, 50.0, 68.0, 108.0, 182.0, 266.0, 441.0, 746.0, 1412.0, 2767.0, 5789.0, 13132.0, 33029.0, 86796.0, 220145.0, 348880.0, 202667.0, 79002.0, 29748.0, 12031.0, 5310.0, 2699.0, 1287.0, 718.0, 411.0, 265.0, 156.0, 93.0, 66.0, 47.0, 35.0, 28.0, 16.0, 10.0, 7.0, 7.0, 5.0, 6.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.0031681060791015625, -0.0030761361122131348, -0.002984166145324707, -0.0028921961784362793, -0.0028002262115478516, -0.002708256244659424, -0.002616286277770996, -0.0025243163108825684, -0.0024323463439941406, -0.002340376377105713, -0.002248406410217285, -0.0021564364433288574, -0.0020644664764404297, -0.001972496509552002, -0.0018805265426635742, -0.0017885565757751465, -0.0016965866088867188, -0.001604616641998291, -0.0015126466751098633, -0.0014206767082214355, -0.0013287067413330078, -0.00123673677444458, -0.0011447668075561523, -0.0010527968406677246, -0.0009608268737792969, -0.0008688569068908691, -0.0007768869400024414, -0.0006849169731140137, -0.0005929470062255859, -0.0005009770393371582, -0.00040900707244873047, -0.00031703710556030273, -0.000225067138671875, -0.00013309717178344727, -4.112720489501953e-05, 5.08427619934082e-05, 0.00014281272888183594, 0.00023478269577026367, 0.0003267526626586914, 0.00041872262954711914, 0.0005106925964355469, 0.0006026625633239746, 0.0006946325302124023, 0.0007866024971008301, 0.0008785724639892578, 0.0009705424308776855, 0.0010625123977661133, 0.001154482364654541, 0.0012464523315429688, 0.0013384222984313965, 0.0014303922653198242, 0.001522362232208252, 0.0016143321990966797, 0.0017063021659851074, 0.0017982721328735352, 0.0018902420997619629, 0.0019822120666503906, 0.0020741820335388184, 0.002166152000427246, 0.002258121967315674, 0.0023500919342041016, 0.0024420619010925293, 0.002534031867980957, 0.0026260018348693848, 0.0027179718017578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 4.0, 3.0, 5.0, 9.0, 4.0, 2.0, 3.0, 9.0, 17.0, 15.0, 20.0, 36.0, 24.0, 37.0, 56.0, 72.0, 82.0, 86.0, 77.0, 96.0, 57.0, 58.0, 47.0, 40.0, 33.0, 30.0, 15.0, 13.0, 13.0, 12.0, 8.0, 4.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.125999450683594e-06, -4.9443915486335754e-06, -4.762783646583557e-06, -4.581175744533539e-06, -4.3995678424835205e-06, -4.217959940433502e-06, -4.036352038383484e-06, -3.8547441363334656e-06, -3.6731362342834473e-06, -3.491528332233429e-06, -3.3099204301834106e-06, -3.1283125281333923e-06, -2.946704626083374e-06, -2.7650967240333557e-06, -2.5834888219833374e-06, -2.401880919933319e-06, -2.2202730178833008e-06, -2.0386651158332825e-06, -1.8570572137832642e-06, -1.6754493117332458e-06, -1.4938414096832275e-06, -1.3122335076332092e-06, -1.130625605583191e-06, -9.490177035331726e-07, -7.674098014831543e-07, -5.85801899433136e-07, -4.041939973831177e-07, -2.2258609533309937e-07, -4.0978193283081055e-08, 1.4062970876693726e-07, 3.2223761081695557e-07, 5.038455128669739e-07, 6.854534149169922e-07, 8.670613169670105e-07, 1.0486692190170288e-06, 1.2302771210670471e-06, 1.4118850231170654e-06, 1.5934929251670837e-06, 1.775100827217102e-06, 1.9567087292671204e-06, 2.1383166313171387e-06, 2.319924533367157e-06, 2.5015324354171753e-06, 2.6831403374671936e-06, 2.864748239517212e-06, 3.0463561415672302e-06, 3.2279640436172485e-06, 3.409571945667267e-06, 3.591179847717285e-06, 3.7727877497673035e-06, 3.954395651817322e-06, 4.13600355386734e-06, 4.317611455917358e-06, 4.499219357967377e-06, 4.680827260017395e-06, 4.862435162067413e-06, 5.044043064117432e-06, 5.22565096616745e-06, 5.407258868217468e-06, 5.5888667702674866e-06, 5.770474672317505e-06, 5.952082574367523e-06, 6.1336904764175415e-06, 6.31529837846756e-06, 6.496906280517578e-06]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 5.0, 1.0, 3.0, 7.0, 8.0, 16.0, 15.0, 16.0, 22.0, 34.0, 60.0, 97.0, 142.0, 202.0, 351.0, 554.0, 932.0, 1767.0, 3304.0, 6672.0, 14438.0, 33301.0, 82533.0, 201800.0, 322562.0, 219018.0, 92459.0, 36794.0, 16050.0, 7272.0, 3552.0, 1880.0, 1053.0, 633.0, 342.0, 230.0, 143.0, 81.0, 57.0, 36.0, 29.0, 18.0, 17.0, 15.0, 13.0, 9.0, 8.0, 7.0, 0.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00212860107421875, -0.002054065465927124, -0.001979529857635498, -0.001904994249343872, -0.001830458641052246, -0.0017559230327606201, -0.0016813874244689941, -0.0016068518161773682, -0.0015323162078857422, -0.0014577805995941162, -0.0013832449913024902, -0.0013087093830108643, -0.0012341737747192383, -0.0011596381664276123, -0.0010851025581359863, -0.0010105669498443604, -0.0009360313415527344, -0.0008614957332611084, -0.0007869601249694824, -0.0007124245166778564, -0.0006378889083862305, -0.0005633533000946045, -0.0004888176918029785, -0.00041428208351135254, -0.00033974647521972656, -0.0002652108669281006, -0.0001906752586364746, -0.00011613965034484863, -4.1604042053222656e-05, 3.293156623840332e-05, 0.0001074671745300293, 0.00018200278282165527, 0.00025653839111328125, 0.0003310739994049072, 0.0004056096076965332, 0.0004801452159881592, 0.0005546808242797852, 0.0006292164325714111, 0.0007037520408630371, 0.0007782876491546631, 0.0008528232574462891, 0.000927358865737915, 0.001001894474029541, 0.001076430082321167, 0.001150965690612793, 0.001225501298904419, 0.001300036907196045, 0.001374572515487671, 0.0014491081237792969, 0.0015236437320709229, 0.0015981793403625488, 0.0016727149486541748, 0.0017472505569458008, 0.0018217861652374268, 0.0018963217735290527, 0.0019708573818206787, 0.0020453929901123047, 0.0021199285984039307, 0.0021944642066955566, 0.0022689998149871826, 0.0023435354232788086, 0.0024180710315704346, 0.0024926066398620605, 0.0025671422481536865, 0.0026416778564453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 5.0, 5.0, 8.0, 6.0, 8.0, 9.0, 9.0, 9.0, 6.0, 15.0, 21.0, 22.0, 24.0, 29.0, 33.0, 46.0, 48.0, 58.0, 55.0, 54.0, 67.0, 52.0, 59.0, 41.0, 47.0, 44.0, 30.0, 40.0, 25.0, 22.0, 25.0, 10.0, 13.0, 7.0, 9.0, 9.0, 6.0, 2.0, 8.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0007700920104980469, -0.0007495582103729248, -0.0007290244102478027, -0.0007084906101226807, -0.0006879568099975586, -0.0006674230098724365, -0.0006468892097473145, -0.0006263554096221924, -0.0006058216094970703, -0.0005852878093719482, -0.0005647540092468262, -0.0005442202091217041, -0.000523686408996582, -0.00050315260887146, -0.0004826188087463379, -0.0004620850086212158, -0.00044155120849609375, -0.0004210174083709717, -0.0004004836082458496, -0.00037994980812072754, -0.00035941600799560547, -0.0003388822078704834, -0.00031834840774536133, -0.00029781460762023926, -0.0002772808074951172, -0.0002567470073699951, -0.00023621320724487305, -0.00021567940711975098, -0.0001951456069946289, -0.00017461180686950684, -0.00015407800674438477, -0.0001335442066192627, -0.00011301040649414062, -9.247660636901855e-05, -7.194280624389648e-05, -5.1409006118774414e-05, -3.0875205993652344e-05, -1.0341405868530273e-05, 1.0192394256591797e-05, 3.072619438171387e-05, 5.125999450683594e-05, 7.179379463195801e-05, 9.232759475708008e-05, 0.00011286139488220215, 0.00013339519500732422, 0.0001539289951324463, 0.00017446279525756836, 0.00019499659538269043, 0.0002155303955078125, 0.00023606419563293457, 0.00025659799575805664, 0.0002771317958831787, 0.0002976655960083008, 0.00031819939613342285, 0.0003387331962585449, 0.000359266996383667, 0.00037980079650878906, 0.00040033459663391113, 0.0004208683967590332, 0.0004414021968841553, 0.00046193599700927734, 0.0004824697971343994, 0.0005030035972595215, 0.0005235373973846436, 0.0005440711975097656]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 13.0, 28.0, 71.0, 139.0, 235.0, 233.0, 172.0, 72.0, 24.0, 13.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2637604773044586, -0.2517978847026825, -0.23983527719974518, -0.22787266969680786, -0.21591007709503174, -0.20394748449325562, -0.1919848769903183, -0.18002226948738098, -0.16805967688560486, -0.15609708428382874, -0.14413447678089142, -0.1321718692779541, -0.12020927667617798, -0.10824667662382126, -0.09628407657146454, -0.08432147651910782, -0.0723588764667511, -0.06039627641439438, -0.04843367636203766, -0.03647107630968094, -0.02450847625732422, -0.012545876204967499, -0.0005832761526107788, 0.011379323899745941, 0.02334192395210266, 0.03530452400445938, 0.0472671240568161, 0.05922972410917282, 0.07119232416152954, 0.08315492421388626, 0.09511752426624298, 0.1070801243185997, 0.11904269456863403, 0.13100528717041016, 0.14296789467334747, 0.1549305021762848, 0.1668930947780609, 0.17885568737983704, 0.19081829488277435, 0.20278090238571167, 0.2147434949874878, 0.22670608758926392, 0.23866869509220123, 0.25063130259513855, 0.2625938951969147, 0.2745564877986908, 0.2865191102027893, 0.29848170280456543, 0.31044429540634155, 0.3224068880081177, 0.3343694806098938, 0.3463321030139923, 0.35829469561576843, 0.37025728821754456, 0.38221991062164307, 0.3941825032234192, 0.4061450958251953, 0.41810768842697144, 0.43007028102874756, 0.44203290343284607, 0.4539954960346222, 0.4659580886363983, 0.4779207110404968, 0.48988330364227295, 0.5018458962440491]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 12.0, 13.0, 17.0, 27.0, 30.0, 47.0, 62.0, 62.0, 63.0, 82.0, 78.0, 79.0, 82.0, 61.0, 60.0, 48.0, 42.0, 44.0, 24.0, 20.0, 18.0, 11.0, 9.0, 2.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13385745882987976, -0.12910066545009613, -0.1243438869714737, -0.11958709359169006, -0.11483030766248703, -0.110073521733284, -0.10531673580408096, -0.10055994987487793, -0.0958031564950943, -0.09104637056589127, -0.08628958463668823, -0.0815327912569046, -0.07677600532770157, -0.07201921939849854, -0.0672624334692955, -0.06250564754009247, -0.057748861610889435, -0.0529920756816864, -0.04823528602719307, -0.043478500097990036, -0.038721710443496704, -0.03396492451429367, -0.029208138585090637, -0.024451348930597305, -0.019694563001394272, -0.01493777520954609, -0.010180988349020481, -0.005424201488494873, -0.0006674136966466904, 0.004089374095201492, 0.008846160024404526, 0.013602949678897858, 0.01835973560810089, 0.023116523399949074, 0.027873311191797256, 0.03263009712100029, 0.03738688677549362, 0.042143672704696655, 0.04690045863389969, 0.05165724828839302, 0.056414034217596054, 0.06117082014679909, 0.06592760980129242, 0.07068439573049545, 0.07544118165969849, 0.08019797503948212, 0.08495475351810455, 0.08971154689788818, 0.09446833282709122, 0.09922511875629425, 0.10398190468549728, 0.10873869061470032, 0.11349548399448395, 0.11825226992368698, 0.12300905585289001, 0.12776584923267365, 0.13252262771129608, 0.1372794210910797, 0.14203619956970215, 0.14679299294948578, 0.15154977142810822, 0.15630656480789185, 0.16106334328651428, 0.1658201366662979, 0.17057693004608154]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 11.0, 12.0, 23.0, 31.0, 48.0, 49.0, 107.0, 140.0, 253.0, 397.0, 665.0, 1020.0, 1723.0, 3196.0, 5962.0, 11536.0, 25154.0, 70031.0, 314942.0, 450108.0, 100288.0, 32601.0, 14240.0, 7011.0, 3818.0, 2113.0, 1178.0, 676.0, 415.0, 260.0, 181.0, 123.0, 78.0, 58.0, 38.0, 21.0, 14.0, 11.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1280517578125, -0.12406730651855469, -0.12008285522460938, -0.11609840393066406, -0.11211395263671875, -0.10812950134277344, -0.10414505004882812, -0.10016059875488281, -0.0961761474609375, -0.09219169616699219, -0.08820724487304688, -0.08422279357910156, -0.08023834228515625, -0.07625389099121094, -0.07226943969726562, -0.06828498840332031, -0.064300537109375, -0.06031608581542969, -0.056331634521484375, -0.05234718322753906, -0.04836273193359375, -0.04437828063964844, -0.040393829345703125, -0.03640937805175781, -0.0324249267578125, -0.028440475463867188, -0.024456024169921875, -0.020471572875976562, -0.01648712158203125, -0.012502670288085938, -0.008518218994140625, -0.0045337677001953125, -0.00054931640625, 0.0034351348876953125, 0.007419586181640625, 0.011404037475585938, 0.01538848876953125, 0.019372940063476562, 0.023357391357421875, 0.027341842651367188, 0.0313262939453125, 0.03531074523925781, 0.039295196533203125, 0.04327964782714844, 0.04726409912109375, 0.05124855041503906, 0.055233001708984375, 0.05921745300292969, 0.063201904296875, 0.06718635559082031, 0.07117080688476562, 0.07515525817871094, 0.07913970947265625, 0.08312416076660156, 0.08710861206054688, 0.09109306335449219, 0.0950775146484375, 0.09906196594238281, 0.10304641723632812, 0.10703086853027344, 0.11101531982421875, 0.11499977111816406, 0.11898422241210938, 0.12296867370605469, 0.126953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 2.0, 5.0, 9.0, 12.0, 20.0, 21.0, 20.0, 27.0, 25.0, 35.0, 30.0, 52.0, 62.0, 61.0, 54.0, 56.0, 40.0, 55.0, 57.0, 49.0, 46.0, 43.0, 29.0, 32.0, 32.0, 21.0, 17.0, 27.0, 15.0, 7.0, 7.0, 7.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.238525390625, -0.2309436798095703, -0.22336196899414062, -0.21578025817871094, -0.20819854736328125, -0.20061683654785156, -0.19303512573242188, -0.1854534149169922, -0.1778717041015625, -0.1702899932861328, -0.16270828247070312, -0.15512657165527344, -0.14754486083984375, -0.13996315002441406, -0.13238143920898438, -0.12479972839355469, -0.117218017578125, -0.10963630676269531, -0.10205459594726562, -0.09447288513183594, -0.08689117431640625, -0.07930946350097656, -0.07172775268554688, -0.06414604187011719, -0.0565643310546875, -0.04898262023925781, -0.041400909423828125, -0.03381919860839844, -0.02623748779296875, -0.018655776977539062, -0.011074066162109375, -0.0034923553466796875, 0.00408935546875, 0.011671066284179688, 0.019252777099609375, 0.026834487915039062, 0.03441619873046875, 0.04199790954589844, 0.049579620361328125, 0.05716133117675781, 0.0647430419921875, 0.07232475280761719, 0.07990646362304688, 0.08748817443847656, 0.09506988525390625, 0.10265159606933594, 0.11023330688476562, 0.11781501770019531, 0.125396728515625, 0.1329784393310547, 0.14056015014648438, 0.14814186096191406, 0.15572357177734375, 0.16330528259277344, 0.17088699340820312, 0.1784687042236328, 0.1860504150390625, 0.1936321258544922, 0.20121383666992188, 0.20879554748535156, 0.21637725830078125, 0.22395896911621094, 0.23154067993164062, 0.2391223907470703, 0.2467041015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 9.0, 6.0, 9.0, 10.0, 6.0, 15.0, 18.0, 26.0, 36.0, 42.0, 46.0, 72.0, 106.0, 195.0, 345.0, 786.0, 2189.0, 7574.0, 35537.0, 472381.0, 482262.0, 35521.0, 7599.0, 2078.0, 785.0, 317.0, 176.0, 109.0, 78.0, 49.0, 42.0, 30.0, 24.0, 25.0, 11.0, 15.0, 7.0, 7.0, 6.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2734375, -0.264892578125, -0.25634765625, -0.247802734375, -0.2392578125, -0.230712890625, -0.22216796875, -0.213623046875, -0.205078125, -0.196533203125, -0.18798828125, -0.179443359375, -0.1708984375, -0.162353515625, -0.15380859375, -0.145263671875, -0.13671875, -0.128173828125, -0.11962890625, -0.111083984375, -0.1025390625, -0.093994140625, -0.08544921875, -0.076904296875, -0.068359375, -0.059814453125, -0.05126953125, -0.042724609375, -0.0341796875, -0.025634765625, -0.01708984375, -0.008544921875, 0.0, 0.008544921875, 0.01708984375, 0.025634765625, 0.0341796875, 0.042724609375, 0.05126953125, 0.059814453125, 0.068359375, 0.076904296875, 0.08544921875, 0.093994140625, 0.1025390625, 0.111083984375, 0.11962890625, 0.128173828125, 0.13671875, 0.145263671875, 0.15380859375, 0.162353515625, 0.1708984375, 0.179443359375, 0.18798828125, 0.196533203125, 0.205078125, 0.213623046875, 0.22216796875, 0.230712890625, 0.2392578125, 0.247802734375, 0.25634765625, 0.264892578125, 0.2734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 5.0, 8.0, 16.0, 12.0, 15.0, 21.0, 24.0, 38.0, 35.0, 50.0, 58.0, 69.0, 72.0, 61.0, 75.0, 57.0, 45.0, 51.0, 51.0, 32.0, 33.0, 30.0, 22.0, 17.0, 21.0, 15.0, 11.0, 7.0, 7.0, 4.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2958984375, -0.28548431396484375, -0.2750701904296875, -0.26465606689453125, -0.254241943359375, -0.24382781982421875, -0.2334136962890625, -0.22299957275390625, -0.21258544921875, -0.20217132568359375, -0.1917572021484375, -0.18134307861328125, -0.170928955078125, -0.16051483154296875, -0.1501007080078125, -0.13968658447265625, -0.1292724609375, -0.11885833740234375, -0.1084442138671875, -0.09803009033203125, -0.087615966796875, -0.07720184326171875, -0.0667877197265625, -0.05637359619140625, -0.04595947265625, -0.03554534912109375, -0.0251312255859375, -0.01471710205078125, -0.004302978515625, 0.00611114501953125, 0.0165252685546875, 0.02693939208984375, 0.037353515625, 0.04776763916015625, 0.0581817626953125, 0.06859588623046875, 0.079010009765625, 0.08942413330078125, 0.0998382568359375, 0.11025238037109375, 0.12066650390625, 0.13108062744140625, 0.1414947509765625, 0.15190887451171875, 0.162322998046875, 0.17273712158203125, 0.1831512451171875, 0.19356536865234375, 0.2039794921875, 0.21439361572265625, 0.2248077392578125, 0.23522186279296875, 0.245635986328125, 0.25605010986328125, 0.2664642333984375, 0.27687835693359375, 0.28729248046875, 0.29770660400390625, 0.3081207275390625, 0.31853485107421875, 0.328948974609375, 0.33936309814453125, 0.3497772216796875, 0.36019134521484375, 0.37060546875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 2.0, 8.0, 12.0, 12.0, 19.0, 34.0, 85.0, 155.0, 399.0, 1093.0, 4311.0, 31180.0, 833712.0, 163435.0, 10730.0, 2156.0, 671.0, 275.0, 120.0, 52.0, 22.0, 23.0, 13.0, 6.0, 5.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07568359375, -0.07305240631103516, -0.07042121887207031, -0.06779003143310547, -0.06515884399414062, -0.06252765655517578, -0.05989646911621094, -0.057265281677246094, -0.05463409423828125, -0.052002906799316406, -0.04937171936035156, -0.04674053192138672, -0.044109344482421875, -0.04147815704345703, -0.03884696960449219, -0.036215782165527344, -0.0335845947265625, -0.030953407287597656, -0.028322219848632812, -0.02569103240966797, -0.023059844970703125, -0.02042865753173828, -0.017797470092773438, -0.015166282653808594, -0.01253509521484375, -0.009903907775878906, -0.0072727203369140625, -0.004641532897949219, -0.002010345458984375, 0.0006208419799804688, 0.0032520294189453125, 0.005883216857910156, 0.008514404296875, 0.011145591735839844, 0.013776779174804688, 0.01640796661376953, 0.019039154052734375, 0.02167034149169922, 0.024301528930664062, 0.026932716369628906, 0.02956390380859375, 0.032195091247558594, 0.03482627868652344, 0.03745746612548828, 0.040088653564453125, 0.04271984100341797, 0.04535102844238281, 0.047982215881347656, 0.0506134033203125, 0.053244590759277344, 0.05587577819824219, 0.05850696563720703, 0.061138153076171875, 0.06376934051513672, 0.06640052795410156, 0.0690317153930664, 0.07166290283203125, 0.0742940902709961, 0.07692527770996094, 0.07955646514892578, 0.08218765258789062, 0.08481884002685547, 0.08745002746582031, 0.09008121490478516, 0.09271240234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 0.0, 2.0, 9.0, 8.0, 7.0, 6.0, 13.0, 30.0, 25.0, 51.0, 57.0, 88.0, 98.0, 177.0, 136.0, 82.0, 67.0, 42.0, 21.0, 22.0, 18.0, 12.0, 10.0, 2.0, 6.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.059906005859375e-06, -8.830800652503967e-06, -8.60169529914856e-06, -8.372589945793152e-06, -8.143484592437744e-06, -7.914379239082336e-06, -7.685273885726929e-06, -7.456168532371521e-06, -7.227063179016113e-06, -6.9979578256607056e-06, -6.768852472305298e-06, -6.53974711894989e-06, -6.310641765594482e-06, -6.081536412239075e-06, -5.852431058883667e-06, -5.623325705528259e-06, -5.3942203521728516e-06, -5.165114998817444e-06, -4.936009645462036e-06, -4.706904292106628e-06, -4.477798938751221e-06, -4.248693585395813e-06, -4.019588232040405e-06, -3.7904828786849976e-06, -3.56137752532959e-06, -3.332272171974182e-06, -3.1031668186187744e-06, -2.8740614652633667e-06, -2.644956111907959e-06, -2.4158507585525513e-06, -2.1867454051971436e-06, -1.957640051841736e-06, -1.7285346984863281e-06, -1.4994293451309204e-06, -1.2703239917755127e-06, -1.041218638420105e-06, -8.121132850646973e-07, -5.830079317092896e-07, -3.5390257835388184e-07, -1.2479722499847412e-07, 1.043081283569336e-07, 3.334134817123413e-07, 5.62518835067749e-07, 7.916241884231567e-07, 1.0207295417785645e-06, 1.2498348951339722e-06, 1.4789402484893799e-06, 1.7080456018447876e-06, 1.9371509552001953e-06, 2.166256308555603e-06, 2.3953616619110107e-06, 2.6244670152664185e-06, 2.853572368621826e-06, 3.082677721977234e-06, 3.3117830753326416e-06, 3.5408884286880493e-06, 3.769993782043457e-06, 3.999099135398865e-06, 4.2282044887542725e-06, 4.45730984210968e-06, 4.686415195465088e-06, 4.915520548820496e-06, 5.144625902175903e-06, 5.373731255531311e-06, 5.602836608886719e-06]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 9.0, 9.0, 10.0, 22.0, 34.0, 42.0, 71.0, 117.0, 210.0, 510.0, 1292.0, 3891.0, 18010.0, 389368.0, 607164.0, 20975.0, 4280.0, 1424.0, 570.0, 231.0, 138.0, 63.0, 35.0, 26.0, 15.0, 13.0, 15.0, 8.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08843994140625, -0.08504390716552734, -0.08164787292480469, -0.07825183868408203, -0.07485580444335938, -0.07145977020263672, -0.06806373596191406, -0.0646677017211914, -0.06127166748046875, -0.057875633239746094, -0.05447959899902344, -0.05108356475830078, -0.047687530517578125, -0.04429149627685547, -0.04089546203613281, -0.037499427795410156, -0.0341033935546875, -0.030707359313964844, -0.027311325073242188, -0.02391529083251953, -0.020519256591796875, -0.01712322235107422, -0.013727188110351562, -0.010331153869628906, -0.00693511962890625, -0.0035390853881835938, -0.0001430511474609375, 0.0032529830932617188, 0.006649017333984375, 0.010045051574707031, 0.013441085815429688, 0.016837120056152344, 0.020233154296875, 0.023629188537597656, 0.027025222778320312, 0.03042125701904297, 0.033817291259765625, 0.03721332550048828, 0.04060935974121094, 0.044005393981933594, 0.04740142822265625, 0.050797462463378906, 0.05419349670410156, 0.05758953094482422, 0.060985565185546875, 0.06438159942626953, 0.06777763366699219, 0.07117366790771484, 0.0745697021484375, 0.07796573638916016, 0.08136177062988281, 0.08475780487060547, 0.08815383911132812, 0.09154987335205078, 0.09494590759277344, 0.0983419418334961, 0.10173797607421875, 0.1051340103149414, 0.10853004455566406, 0.11192607879638672, 0.11532211303710938, 0.11871814727783203, 0.12211418151855469, 0.12551021575927734, 0.12890625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 13.0, 20.0, 22.0, 36.0, 63.0, 106.0, 148.0, 210.0, 129.0, 82.0, 61.0, 32.0, 18.0, 12.0, 13.0, 4.0, 6.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.045440673828125, -0.04425477981567383, -0.043068885803222656, -0.041882991790771484, -0.04069709777832031, -0.03951120376586914, -0.03832530975341797, -0.0371394157409668, -0.035953521728515625, -0.03476762771606445, -0.03358173370361328, -0.03239583969116211, -0.031209945678710938, -0.030024051666259766, -0.028838157653808594, -0.027652263641357422, -0.02646636962890625, -0.025280475616455078, -0.024094581604003906, -0.022908687591552734, -0.021722793579101562, -0.02053689956665039, -0.01935100555419922, -0.018165111541748047, -0.016979217529296875, -0.015793323516845703, -0.014607429504394531, -0.01342153549194336, -0.012235641479492188, -0.011049747467041016, -0.009863853454589844, -0.008677959442138672, -0.0074920654296875, -0.006306171417236328, -0.005120277404785156, -0.003934383392333984, -0.0027484893798828125, -0.0015625953674316406, -0.00037670135498046875, 0.0008091926574707031, 0.001995086669921875, 0.003180980682373047, 0.004366874694824219, 0.005552768707275391, 0.0067386627197265625, 0.007924556732177734, 0.009110450744628906, 0.010296344757080078, 0.01148223876953125, 0.012668132781982422, 0.013854026794433594, 0.015039920806884766, 0.016225814819335938, 0.01741170883178711, 0.01859760284423828, 0.019783496856689453, 0.020969390869140625, 0.022155284881591797, 0.02334117889404297, 0.02452707290649414, 0.025712966918945312, 0.026898860931396484, 0.028084754943847656, 0.029270648956298828, 0.03045654296875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 42.0, 201.0, 423.0, 267.0, 51.0, 15.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4311898350715637, -0.38658493757247925, -0.3419800102710724, -0.2973750829696655, -0.25277018547058105, -0.2081652730703354, -0.16356036067008972, -0.11895543336868286, -0.07435053586959839, -0.029745623469352722, 0.014859288930892944, 0.05946420133113861, 0.10406911373138428, 0.14867402613162994, 0.1932789385318756, 0.23788386583328247, 0.28248876333236694, 0.3270936608314514, 0.3716985881328583, 0.41630351543426514, 0.4609084129333496, 0.5055133104324341, 0.5501182079315186, 0.5947231650352478, 0.6393280625343323, 0.6839329600334167, 0.728537917137146, 0.7731428146362305, 0.8177477121353149, 0.8623526096343994, 0.9069575071334839, 0.9515624642372131, 0.9961674213409424, 1.0407723188400269, 1.0853772163391113, 1.1299821138381958, 1.1745870113372803, 1.2191920280456543, 1.2637969255447388, 1.3084018230438232, 1.3530067205429077, 1.3976116180419922, 1.4422165155410767, 1.4868214130401611, 1.5314264297485352, 1.5760313272476196, 1.620636224746704, 1.6652411222457886, 1.709846019744873, 1.7544509172439575, 1.799055814743042, 1.8436607122421265, 1.888265609741211, 1.932870626449585, 1.9774755239486694, 2.022080421447754, 2.066685199737549, 2.111290216445923, 2.1558949947357178, 2.200500011444092, 2.2451047897338867, 2.2897098064422607, 2.3343145847320557, 2.3789196014404297, 2.4235246181488037]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 10.0, 7.0, 8.0, 15.0, 15.0, 16.0, 18.0, 23.0, 20.0, 26.0, 31.0, 35.0, 44.0, 36.0, 43.0, 40.0, 42.0, 49.0, 43.0, 27.0, 36.0, 39.0, 36.0, 43.0, 35.0, 42.0, 32.0, 26.0, 27.0, 22.0, 26.0, 17.0, 22.0, 8.0, 10.0, 9.0, 5.0, 3.0, 2.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38138970732688904, -0.3677147924900055, -0.35403984785079956, -0.340364933013916, -0.32669001817703247, -0.31301507353782654, -0.299340158700943, -0.28566521406173706, -0.2719902992248535, -0.25831538438796997, -0.24464043974876404, -0.2309655249118805, -0.21729059517383575, -0.20361566543579102, -0.18994075059890747, -0.17626582086086273, -0.162590891122818, -0.14891596138477325, -0.13524103164672852, -0.12156611680984497, -0.10789118707180023, -0.0942162573337555, -0.08054133504629135, -0.06686641275882721, -0.05319148302078247, -0.03951655700802803, -0.02584163099527359, -0.01216670498251915, 0.0015082210302352905, 0.01518315076828003, 0.02885807305574417, 0.04253299534320831, 0.056207895278930664, 0.0698828250169754, 0.08355774730443954, 0.09723266959190369, 0.11090759932994843, 0.12458252906799316, 0.1382574439048767, 0.15193237364292145, 0.1656073033809662, 0.17928223311901093, 0.19295716285705566, 0.2066320776939392, 0.22030700743198395, 0.2339819371700287, 0.24765685200691223, 0.26133179664611816, 0.2750067114830017, 0.28868162631988525, 0.3023565709590912, 0.31603148579597473, 0.32970643043518066, 0.3433813452720642, 0.35705626010894775, 0.3707311749458313, 0.38440611958503723, 0.3980810344219208, 0.4117559790611267, 0.42543089389801025, 0.4391058087348938, 0.45278075337409973, 0.4664556682109833, 0.4801306128501892, 0.49380552768707275]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 6.0, 7.0, 8.0, 8.0, 12.0, 24.0, 26.0, 45.0, 50.0, 88.0, 130.0, 148.0, 242.0, 495.0, 1071.0, 2640.0, 8351.0, 80577.0, 3857084.0, 221773.0, 14554.0, 4117.0, 1278.0, 633.0, 313.0, 193.0, 132.0, 60.0, 53.0, 49.0, 26.0, 19.0, 12.0, 13.0, 6.0, 9.0, 9.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.435546875, -0.4221916198730469, -0.40883636474609375, -0.3954811096191406, -0.3821258544921875, -0.3687705993652344, -0.35541534423828125, -0.3420600891113281, -0.328704833984375, -0.3153495788574219, -0.30199432373046875, -0.2886390686035156, -0.2752838134765625, -0.2619285583496094, -0.24857330322265625, -0.23521804809570312, -0.22186279296875, -0.20850753784179688, -0.19515228271484375, -0.18179702758789062, -0.1684417724609375, -0.15508651733398438, -0.14173126220703125, -0.12837600708007812, -0.115020751953125, -0.10166549682617188, -0.08831024169921875, -0.07495498657226562, -0.0615997314453125, -0.048244476318359375, -0.03488922119140625, -0.021533966064453125, -0.0081787109375, 0.005176544189453125, 0.01853179931640625, 0.031887054443359375, 0.0452423095703125, 0.058597564697265625, 0.07195281982421875, 0.08530807495117188, 0.098663330078125, 0.11201858520507812, 0.12537384033203125, 0.13872909545898438, 0.1520843505859375, 0.16543960571289062, 0.17879486083984375, 0.19215011596679688, 0.20550537109375, 0.21886062622070312, 0.23221588134765625, 0.24557113647460938, 0.2589263916015625, 0.2722816467285156, 0.28563690185546875, 0.2989921569824219, 0.312347412109375, 0.3257026672363281, 0.33905792236328125, 0.3524131774902344, 0.3657684326171875, 0.3791236877441406, 0.39247894287109375, 0.4058341979980469, 0.419189453125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 7.0, 14.0, 21.0, 36.0, 49.0, 67.0, 79.0, 84.0, 88.0, 101.0, 110.0, 80.0, 73.0, 47.0, 43.0, 30.0, 28.0, 27.0, 9.0, 8.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.276123046875, -0.2694683074951172, -0.2628135681152344, -0.25615882873535156, -0.24950408935546875, -0.24284934997558594, -0.23619461059570312, -0.2295398712158203, -0.2228851318359375, -0.2162303924560547, -0.20957565307617188, -0.20292091369628906, -0.19626617431640625, -0.18961143493652344, -0.18295669555664062, -0.1763019561767578, -0.169647216796875, -0.1629924774169922, -0.15633773803710938, -0.14968299865722656, -0.14302825927734375, -0.13637351989746094, -0.12971878051757812, -0.12306404113769531, -0.1164093017578125, -0.10975456237792969, -0.10309982299804688, -0.09644508361816406, -0.08979034423828125, -0.08313560485839844, -0.07648086547851562, -0.06982612609863281, -0.06317138671875, -0.05651664733886719, -0.049861907958984375, -0.04320716857910156, -0.03655242919921875, -0.029897689819335938, -0.023242950439453125, -0.016588211059570312, -0.0099334716796875, -0.0032787322998046875, 0.003376007080078125, 0.010030746459960938, 0.01668548583984375, 0.023340225219726562, 0.029994964599609375, 0.03664970397949219, 0.043304443359375, 0.04995918273925781, 0.056613922119140625, 0.06326866149902344, 0.06992340087890625, 0.07657814025878906, 0.08323287963867188, 0.08988761901855469, 0.0965423583984375, 0.10319709777832031, 0.10985183715820312, 0.11650657653808594, 0.12316131591796875, 0.12981605529785156, 0.13647079467773438, 0.1431255340576172, 0.1497802734375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 2.0, 4.0, 9.0, 12.0, 18.0, 39.0, 132.0, 559.0, 5689.0, 4161853.0, 24627.0, 998.0, 217.0, 55.0, 26.0, 16.0, 11.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5068359375, -1.4657440185546875, -1.424652099609375, -1.3835601806640625, -1.34246826171875, -1.3013763427734375, -1.260284423828125, -1.2191925048828125, -1.1781005859375, -1.1370086669921875, -1.095916748046875, -1.0548248291015625, -1.01373291015625, -0.9726409912109375, -0.931549072265625, -0.8904571533203125, -0.849365234375, -0.8082733154296875, -0.767181396484375, -0.7260894775390625, -0.68499755859375, -0.6439056396484375, -0.602813720703125, -0.5617218017578125, -0.5206298828125, -0.4795379638671875, -0.438446044921875, -0.3973541259765625, -0.35626220703125, -0.3151702880859375, -0.274078369140625, -0.2329864501953125, -0.19189453125, -0.1508026123046875, -0.109710693359375, -0.0686187744140625, -0.02752685546875, 0.0135650634765625, 0.054656982421875, 0.0957489013671875, 0.1368408203125, 0.1779327392578125, 0.219024658203125, 0.2601165771484375, 0.30120849609375, 0.3423004150390625, 0.383392333984375, 0.4244842529296875, 0.465576171875, 0.5066680908203125, 0.547760009765625, 0.5888519287109375, 0.62994384765625, 0.6710357666015625, 0.712127685546875, 0.7532196044921875, 0.7943115234375, 0.8354034423828125, 0.876495361328125, 0.9175872802734375, 0.95867919921875, 0.9997711181640625, 1.040863037109375, 1.0819549560546875, 1.123046875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 7.0, 9.0, 18.0, 60.0, 143.0, 839.0, 1982.0, 755.0, 165.0, 42.0, 22.0, 13.0, 7.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.162353515625, -0.15645408630371094, -0.15055465698242188, -0.1446552276611328, -0.13875579833984375, -0.1328563690185547, -0.12695693969726562, -0.12105751037597656, -0.1151580810546875, -0.10925865173339844, -0.10335922241210938, -0.09745979309082031, -0.09156036376953125, -0.08566093444824219, -0.07976150512695312, -0.07386207580566406, -0.067962646484375, -0.06206321716308594, -0.056163787841796875, -0.05026435852050781, -0.04436492919921875, -0.03846549987792969, -0.032566070556640625, -0.026666641235351562, -0.0207672119140625, -0.014867782592773438, -0.008968353271484375, -0.0030689239501953125, 0.00283050537109375, 0.008729934692382812, 0.014629364013671875, 0.020528793334960938, 0.02642822265625, 0.03232765197753906, 0.038227081298828125, 0.04412651062011719, 0.05002593994140625, 0.05592536926269531, 0.061824798583984375, 0.06772422790527344, 0.0736236572265625, 0.07952308654785156, 0.08542251586914062, 0.09132194519042969, 0.09722137451171875, 0.10312080383300781, 0.10902023315429688, 0.11491966247558594, 0.120819091796875, 0.12671852111816406, 0.13261795043945312, 0.1385173797607422, 0.14441680908203125, 0.1503162384033203, 0.15621566772460938, 0.16211509704589844, 0.1680145263671875, 0.17391395568847656, 0.17981338500976562, 0.1857128143310547, 0.19161224365234375, 0.1975116729736328, 0.20341110229492188, 0.20931053161621094, 0.2152099609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 3.0, 3.0, 7.0, 6.0, 4.0, 12.0, 14.0, 25.0, 21.0, 28.0, 47.0, 52.0, 67.0, 62.0, 85.0, 94.0, 101.0, 63.0, 65.0, 67.0, 51.0, 26.0, 29.0, 25.0, 13.0, 14.0, 10.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1069868803024292, -0.10128872096538544, -0.09559056162834167, -0.08989240229129791, -0.08419424295425415, -0.07849608361721039, -0.07279793173074722, -0.06709977239370346, -0.0614016130566597, -0.055703453719615936, -0.050005294382572174, -0.04430713877081871, -0.03860897943377495, -0.032910820096731186, -0.027212664484977722, -0.02151450514793396, -0.015816345810890198, -0.01011818740516901, -0.004420028999447823, 0.0012781284749507904, 0.006976287811994553, 0.012674447149038315, 0.01837260276079178, 0.02407076209783554, 0.029768921434879303, 0.035467080771923065, 0.04116524010896683, 0.04686339572072029, 0.05256155505776405, 0.058259714394807816, 0.06395787000656128, 0.06965602934360504, 0.0753541886806488, 0.08105234801769257, 0.08675050735473633, 0.09244866669178009, 0.09814682602882385, 0.10384498536586761, 0.10954313725233078, 0.11524129658937454, 0.1209394559264183, 0.12663760781288147, 0.13233576714992523, 0.138033926486969, 0.14373208582401276, 0.14943024516105652, 0.15512840449810028, 0.16082656383514404, 0.1665247231721878, 0.17222288250923157, 0.17792104184627533, 0.1836192011833191, 0.18931736052036285, 0.19501551985740662, 0.20071366429328918, 0.20641183853149414, 0.2121099829673767, 0.21780814230442047, 0.22350630164146423, 0.229204460978508, 0.23490262031555176, 0.24060077965259552, 0.24629893898963928, 0.25199708342552185, 0.2576952576637268]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 3.0, 5.0, 9.0, 9.0, 7.0, 13.0, 17.0, 14.0, 22.0, 20.0, 23.0, 17.0, 24.0, 32.0, 35.0, 38.0, 37.0, 28.0, 46.0, 42.0, 49.0, 41.0, 36.0, 44.0, 41.0, 32.0, 48.0, 41.0, 32.0, 35.0, 19.0, 20.0, 18.0, 16.0, 14.0, 17.0, 9.0, 11.0, 7.0, 4.0, 7.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10701067745685577, -0.10366680473089218, -0.10032292455434799, -0.0969790518283844, -0.09363517165184021, -0.09029129892587662, -0.08694742619991302, -0.08360354602336884, -0.08025967329740524, -0.07691580057144165, -0.07357192039489746, -0.07022804766893387, -0.06688417494297028, -0.06354029476642609, -0.060196422040462494, -0.0568525455892086, -0.05350866913795471, -0.05016479268670082, -0.04682091623544693, -0.04347704350948334, -0.040133167058229446, -0.036789290606975555, -0.03344541788101196, -0.030101541429758072, -0.02675766497850418, -0.02341378852725029, -0.020069913938641548, -0.016726039350032806, -0.013382162898778915, -0.010038286447525024, -0.006694411858916283, -0.003350537270307541, -6.660819053649902e-06, 0.0033372147008776665, 0.006681090220808983, 0.0100249657407403, 0.013368841260671616, 0.016712717711925507, 0.02005659230053425, 0.02340046688914299, 0.02674434334039688, 0.030088219791650772, 0.03343209624290466, 0.036775968968868256, 0.04011984542012215, 0.04346372187137604, 0.04680759459733963, 0.05015147104859352, 0.05349534749984741, 0.0568392239511013, 0.060183100402355194, 0.06352697312831879, 0.06687085330486298, 0.07021472603082657, 0.07355859875679016, 0.07690247893333435, 0.08024635165929794, 0.08359022438526154, 0.08693410456180573, 0.09027797728776932, 0.09362185001373291, 0.0969657301902771, 0.10030960291624069, 0.10365347564220428, 0.10699735581874847]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 7.0, 16.0, 15.0, 28.0, 30.0, 36.0, 56.0, 81.0, 119.0, 198.0, 321.0, 526.0, 1120.0, 2625.0, 7226.0, 24989.0, 112395.0, 552118.0, 275950.0, 50083.0, 12855.0, 4180.0, 1694.0, 726.0, 387.0, 242.0, 185.0, 90.0, 70.0, 43.0, 40.0, 30.0, 17.0, 13.0, 11.0, 8.0, 4.0, 4.0, 3.0, 7.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040130615234375, -0.03850889205932617, -0.036887168884277344, -0.035265445709228516, -0.03364372253417969, -0.03202199935913086, -0.03040027618408203, -0.028778553009033203, -0.027156829833984375, -0.025535106658935547, -0.02391338348388672, -0.02229166030883789, -0.020669937133789062, -0.019048213958740234, -0.017426490783691406, -0.015804767608642578, -0.01418304443359375, -0.012561321258544922, -0.010939598083496094, -0.009317874908447266, -0.0076961517333984375, -0.006074428558349609, -0.004452705383300781, -0.002830982208251953, -0.001209259033203125, 0.0004124641418457031, 0.0020341873168945312, 0.0036559104919433594, 0.0052776336669921875, 0.006899356842041016, 0.008521080017089844, 0.010142803192138672, 0.0117645263671875, 0.013386249542236328, 0.015007972717285156, 0.016629695892333984, 0.018251419067382812, 0.01987314224243164, 0.02149486541748047, 0.023116588592529297, 0.024738311767578125, 0.026360034942626953, 0.02798175811767578, 0.02960348129272461, 0.031225204467773438, 0.032846927642822266, 0.034468650817871094, 0.03609037399291992, 0.03771209716796875, 0.03933382034301758, 0.040955543518066406, 0.042577266693115234, 0.04419898986816406, 0.04582071304321289, 0.04744243621826172, 0.04906415939331055, 0.050685882568359375, 0.0523076057434082, 0.05392932891845703, 0.05555105209350586, 0.05717277526855469, 0.058794498443603516, 0.060416221618652344, 0.06203794479370117, 0.06365966796875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 2.0, 5.0, 7.0, 7.0, 10.0, 15.0, 12.0, 16.0, 17.0, 24.0, 25.0, 31.0, 41.0, 32.0, 55.0, 47.0, 56.0, 55.0, 53.0, 45.0, 45.0, 55.0, 56.0, 46.0, 44.0, 37.0, 29.0, 21.0, 22.0, 17.0, 14.0, 19.0, 13.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.09942626953125, -0.09679698944091797, -0.09416770935058594, -0.0915384292602539, -0.08890914916992188, -0.08627986907958984, -0.08365058898925781, -0.08102130889892578, -0.07839202880859375, -0.07576274871826172, -0.07313346862792969, -0.07050418853759766, -0.06787490844726562, -0.0652456283569336, -0.06261634826660156, -0.05998706817626953, -0.0573577880859375, -0.05472850799560547, -0.05209922790527344, -0.049469947814941406, -0.046840667724609375, -0.044211387634277344, -0.04158210754394531, -0.03895282745361328, -0.03632354736328125, -0.03369426727294922, -0.031064987182617188, -0.028435707092285156, -0.025806427001953125, -0.023177146911621094, -0.020547866821289062, -0.01791858673095703, -0.015289306640625, -0.012660026550292969, -0.010030746459960938, -0.007401466369628906, -0.004772186279296875, -0.0021429061889648438, 0.0004863739013671875, 0.0031156539916992188, 0.00574493408203125, 0.008374214172363281, 0.011003494262695312, 0.013632774353027344, 0.016262054443359375, 0.018891334533691406, 0.021520614624023438, 0.02414989471435547, 0.0267791748046875, 0.02940845489501953, 0.03203773498535156, 0.034667015075683594, 0.037296295166015625, 0.039925575256347656, 0.04255485534667969, 0.04518413543701172, 0.04781341552734375, 0.05044269561767578, 0.05307197570800781, 0.055701255798339844, 0.058330535888671875, 0.060959815979003906, 0.06358909606933594, 0.06621837615966797, 0.06884765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 15.0, 15.0, 30.0, 38.0, 40.0, 60.0, 85.0, 133.0, 196.0, 291.0, 366.0, 529.0, 778.0, 1089.0, 1650.0, 2344.0, 3476.0, 5230.0, 7943.0, 12104.0, 19079.0, 30944.0, 53646.0, 97642.0, 171334.0, 221981.0, 173201.0, 100309.0, 55600.0, 31766.0, 19278.0, 12363.0, 8089.0, 5338.0, 3554.0, 2476.0, 1636.0, 1219.0, 793.0, 536.0, 415.0, 272.0, 200.0, 138.0, 101.0, 68.0, 41.0, 36.0, 33.0, 19.0, 14.0, 7.0, 9.0, 2.0, 6.0, 5.0], "bins": [-0.0181732177734375, -0.017631053924560547, -0.017088890075683594, -0.01654672622680664, -0.016004562377929688, -0.015462398529052734, -0.014920234680175781, -0.014378070831298828, -0.013835906982421875, -0.013293743133544922, -0.012751579284667969, -0.012209415435791016, -0.011667251586914062, -0.01112508773803711, -0.010582923889160156, -0.010040760040283203, -0.00949859619140625, -0.008956432342529297, -0.008414268493652344, -0.00787210464477539, -0.0073299407958984375, -0.006787776947021484, -0.006245613098144531, -0.005703449249267578, -0.005161285400390625, -0.004619121551513672, -0.004076957702636719, -0.0035347938537597656, -0.0029926300048828125, -0.0024504661560058594, -0.0019083023071289062, -0.0013661384582519531, -0.000823974609375, -0.0002818107604980469, 0.00026035308837890625, 0.0008025169372558594, 0.0013446807861328125, 0.0018868446350097656, 0.0024290084838867188, 0.002971172332763672, 0.003513336181640625, 0.004055500030517578, 0.004597663879394531, 0.005139827728271484, 0.0056819915771484375, 0.006224155426025391, 0.006766319274902344, 0.007308483123779297, 0.00785064697265625, 0.008392810821533203, 0.008934974670410156, 0.00947713851928711, 0.010019302368164062, 0.010561466217041016, 0.011103630065917969, 0.011645793914794922, 0.012187957763671875, 0.012730121612548828, 0.013272285461425781, 0.013814449310302734, 0.014356613159179688, 0.01489877700805664, 0.015440940856933594, 0.015983104705810547, 0.0165252685546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 2.0, 0.0, 12.0, 9.0, 4.0, 8.0, 13.0, 13.0, 21.0, 15.0, 17.0, 19.0, 24.0, 17.0, 30.0, 33.0, 46.0, 37.0, 45.0, 34.0, 45.0, 66.0, 47.0, 45.0, 40.0, 47.0, 46.0, 46.0, 34.0, 30.0, 16.0, 31.0, 15.0, 16.0, 19.0, 12.0, 7.0, 11.0, 8.0, 7.0, 2.0, 2.0, 5.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2186279296875, -0.21216201782226562, -0.20569610595703125, -0.19923019409179688, -0.1927642822265625, -0.18629837036132812, -0.17983245849609375, -0.17336654663085938, -0.166900634765625, -0.16043472290039062, -0.15396881103515625, -0.14750289916992188, -0.1410369873046875, -0.13457107543945312, -0.12810516357421875, -0.12163925170898438, -0.11517333984375, -0.10870742797851562, -0.10224151611328125, -0.09577560424804688, -0.0893096923828125, -0.08284378051757812, -0.07637786865234375, -0.06991195678710938, -0.063446044921875, -0.056980133056640625, -0.05051422119140625, -0.044048309326171875, -0.0375823974609375, -0.031116485595703125, -0.02465057373046875, -0.018184661865234375, -0.01171875, -0.005252838134765625, 0.00121307373046875, 0.007678985595703125, 0.0141448974609375, 0.020610809326171875, 0.02707672119140625, 0.033542633056640625, 0.040008544921875, 0.046474456787109375, 0.05294036865234375, 0.059406280517578125, 0.0658721923828125, 0.07233810424804688, 0.07880401611328125, 0.08526992797851562, 0.09173583984375, 0.09820175170898438, 0.10466766357421875, 0.11113357543945312, 0.1175994873046875, 0.12406539916992188, 0.13053131103515625, 0.13699722290039062, 0.143463134765625, 0.14992904663085938, 0.15639495849609375, 0.16286087036132812, 0.1693267822265625, 0.17579269409179688, 0.18225860595703125, 0.18872451782226562, 0.1951904296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 6.0, 5.0, 9.0, 23.0, 26.0, 32.0, 34.0, 44.0, 94.0, 130.0, 203.0, 340.0, 590.0, 1002.0, 1750.0, 3246.0, 7112.0, 21780.0, 103001.0, 437577.0, 365864.0, 75482.0, 17213.0, 6142.0, 2882.0, 1573.0, 917.0, 568.0, 311.0, 183.0, 118.0, 86.0, 54.0, 36.0, 22.0, 18.0, 20.0, 15.0, 13.0, 7.0, 3.0, 5.0, 3.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0048675537109375, -0.004710078239440918, -0.004552602767944336, -0.004395127296447754, -0.004237651824951172, -0.00408017635345459, -0.003922700881958008, -0.0037652254104614258, -0.0036077499389648438, -0.0034502744674682617, -0.0032927989959716797, -0.0031353235244750977, -0.0029778480529785156, -0.0028203725814819336, -0.0026628971099853516, -0.0025054216384887695, -0.0023479461669921875, -0.0021904706954956055, -0.0020329952239990234, -0.0018755197525024414, -0.0017180442810058594, -0.0015605688095092773, -0.0014030933380126953, -0.0012456178665161133, -0.0010881423950195312, -0.0009306669235229492, -0.0007731914520263672, -0.0006157159805297852, -0.0004582405090332031, -0.0003007650375366211, -0.00014328956604003906, 1.4185905456542969e-05, 0.000171661376953125, 0.00032913684844970703, 0.00048661231994628906, 0.0006440877914428711, 0.0008015632629394531, 0.0009590387344360352, 0.0011165142059326172, 0.0012739896774291992, 0.0014314651489257812, 0.0015889406204223633, 0.0017464160919189453, 0.0019038915634155273, 0.0020613670349121094, 0.0022188425064086914, 0.0023763179779052734, 0.0025337934494018555, 0.0026912689208984375, 0.0028487443923950195, 0.0030062198638916016, 0.0031636953353881836, 0.0033211708068847656, 0.0034786462783813477, 0.0036361217498779297, 0.0037935972213745117, 0.003951072692871094, 0.004108548164367676, 0.004266023635864258, 0.00442349910736084, 0.004580974578857422, 0.004738450050354004, 0.004895925521850586, 0.005053400993347168, 0.00521087646484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 10.0, 13.0, 13.0, 24.0, 39.0, 48.0, 60.0, 84.0, 130.0, 97.0, 110.0, 113.0, 67.0, 62.0, 43.0, 20.0, 16.0, 15.0, 17.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.106231689453125e-06, -7.82497227191925e-06, -7.543712854385376e-06, -7.2624534368515015e-06, -6.981194019317627e-06, -6.6999346017837524e-06, -6.418675184249878e-06, -6.137415766716003e-06, -5.856156349182129e-06, -5.574896931648254e-06, -5.29363751411438e-06, -5.012378096580505e-06, -4.731118679046631e-06, -4.449859261512756e-06, -4.168599843978882e-06, -3.887340426445007e-06, -3.606081008911133e-06, -3.3248215913772583e-06, -3.043562173843384e-06, -2.7623027563095093e-06, -2.4810433387756348e-06, -2.1997839212417603e-06, -1.9185245037078857e-06, -1.6372650861740112e-06, -1.3560056686401367e-06, -1.0747462511062622e-06, -7.934868335723877e-07, -5.122274160385132e-07, -2.3096799850463867e-07, 5.029141902923584e-08, 3.3155083656311035e-07, 6.128102540969849e-07, 8.940696716308594e-07, 1.1753290891647339e-06, 1.4565885066986084e-06, 1.737847924232483e-06, 2.0191073417663574e-06, 2.300366759300232e-06, 2.5816261768341064e-06, 2.862885594367981e-06, 3.1441450119018555e-06, 3.42540442943573e-06, 3.7066638469696045e-06, 3.987923264503479e-06, 4.2691826820373535e-06, 4.550442099571228e-06, 4.8317015171051025e-06, 5.112960934638977e-06, 5.3942203521728516e-06, 5.675479769706726e-06, 5.956739187240601e-06, 6.237998604774475e-06, 6.51925802230835e-06, 6.800517439842224e-06, 7.081776857376099e-06, 7.363036274909973e-06, 7.644295692443848e-06, 7.925555109977722e-06, 8.206814527511597e-06, 8.488073945045471e-06, 8.769333362579346e-06, 9.05059278011322e-06, 9.331852197647095e-06, 9.61311161518097e-06, 9.894371032714844e-06]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 14.0, 10.0, 15.0, 13.0, 22.0, 32.0, 53.0, 92.0, 119.0, 182.0, 245.0, 383.0, 622.0, 1017.0, 1864.0, 3696.0, 7620.0, 16699.0, 39016.0, 88946.0, 181714.0, 264728.0, 221454.0, 120273.0, 54712.0, 23458.0, 10692.0, 4929.0, 2477.0, 1356.0, 757.0, 470.0, 303.0, 180.0, 120.0, 79.0, 59.0, 45.0, 28.0, 21.0, 8.0, 13.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.0023250579833984375, -0.002256035804748535, -0.002187013626098633, -0.0021179914474487305, -0.002048969268798828, -0.0019799470901489258, -0.0019109249114990234, -0.001841902732849121, -0.0017728805541992188, -0.0017038583755493164, -0.001634836196899414, -0.0015658140182495117, -0.0014967918395996094, -0.001427769660949707, -0.0013587474822998047, -0.0012897253036499023, -0.001220703125, -0.0011516809463500977, -0.0010826587677001953, -0.001013636589050293, -0.0009446144104003906, -0.0008755922317504883, -0.0008065700531005859, -0.0007375478744506836, -0.0006685256958007812, -0.0005995035171508789, -0.0005304813385009766, -0.0004614591598510742, -0.0003924369812011719, -0.00032341480255126953, -0.0002543926239013672, -0.00018537044525146484, -0.0001163482666015625, -4.7326087951660156e-05, 2.1696090698242188e-05, 9.071826934814453e-05, 0.00015974044799804688, 0.00022876262664794922, 0.00029778480529785156, 0.0003668069839477539, 0.00043582916259765625, 0.0005048513412475586, 0.0005738735198974609, 0.0006428956985473633, 0.0007119178771972656, 0.000780940055847168, 0.0008499622344970703, 0.0009189844131469727, 0.000988006591796875, 0.0010570287704467773, 0.0011260509490966797, 0.001195073127746582, 0.0012640953063964844, 0.0013331174850463867, 0.001402139663696289, 0.0014711618423461914, 0.0015401840209960938, 0.001609206199645996, 0.0016782283782958984, 0.0017472505569458008, 0.0018162727355957031, 0.0018852949142456055, 0.001954317092895508, 0.00202333927154541, 0.0020923614501953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 12.0, 18.0, 15.0, 21.0, 13.0, 24.0, 31.0, 41.0, 36.0, 43.0, 62.0, 60.0, 59.0, 61.0, 65.0, 63.0, 61.0, 34.0, 47.0, 56.0, 32.0, 29.0, 23.0, 21.0, 14.0, 14.0, 4.0, 9.0, 9.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0010080337524414062, -0.0009795725345611572, -0.0009511113166809082, -0.0009226500988006592, -0.0008941888809204102, -0.0008657276630401611, -0.0008372664451599121, -0.0008088052272796631, -0.0007803440093994141, -0.000751882791519165, -0.000723421573638916, -0.000694960355758667, -0.000666499137878418, -0.0006380379199981689, -0.0006095767021179199, -0.0005811154842376709, -0.0005526542663574219, -0.0005241930484771729, -0.0004957318305969238, -0.0004672706127166748, -0.0004388093948364258, -0.00041034817695617676, -0.00038188695907592773, -0.0003534257411956787, -0.0003249645233154297, -0.00029650330543518066, -0.00026804208755493164, -0.00023958086967468262, -0.0002111196517944336, -0.00018265843391418457, -0.00015419721603393555, -0.00012573599815368652, -9.72747802734375e-05, -6.881356239318848e-05, -4.035234451293945e-05, -1.189112663269043e-05, 1.6570091247558594e-05, 4.503130912780762e-05, 7.349252700805664e-05, 0.00010195374488830566, 0.0001304149627685547, 0.0001588761806488037, 0.00018733739852905273, 0.00021579861640930176, 0.0002442598342895508, 0.0002727210521697998, 0.00030118227005004883, 0.00032964348793029785, 0.0003581047058105469, 0.0003865659236907959, 0.0004150271415710449, 0.00044348835945129395, 0.00047194957733154297, 0.000500410795211792, 0.000528872013092041, 0.00055733323097229, 0.0005857944488525391, 0.0006142556667327881, 0.0006427168846130371, 0.0006711781024932861, 0.0006996393203735352, 0.0007281005382537842, 0.0007565617561340332, 0.0007850229740142822, 0.0008134841918945312]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 10.0, 11.0, 16.0, 28.0, 33.0, 43.0, 44.0, 52.0, 81.0, 78.0, 88.0, 98.0, 80.0, 62.0, 64.0, 44.0, 42.0, 34.0, 19.0, 13.0, 13.0, 11.0, 6.0, 6.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09447029232978821, -0.09121314436197281, -0.08795599639415741, -0.08469884842634201, -0.08144170045852661, -0.07818455249071121, -0.07492740452289581, -0.07167025655508041, -0.06841310858726501, -0.06515596061944962, -0.061898812651634216, -0.05864166468381882, -0.05538451671600342, -0.05212736874818802, -0.04887022078037262, -0.04561307281255722, -0.04235592484474182, -0.03909877687692642, -0.03584162890911102, -0.032584480941295624, -0.029327332973480225, -0.026070185005664825, -0.022813037037849426, -0.019555889070034027, -0.016298741102218628, -0.013041593134403229, -0.00978444516658783, -0.00652729719877243, -0.0032701492309570312, -1.300126314163208e-05, 0.003244146704673767, 0.006501294672489166, 0.009758450090885162, 0.013015598058700562, 0.01627274602651596, 0.01952989399433136, 0.02278704196214676, 0.026044189929962158, 0.029301337897777557, 0.03255848586559296, 0.035815633833408356, 0.039072781801223755, 0.042329929769039154, 0.04558707773685455, 0.04884422570466995, 0.05210137367248535, 0.05535852164030075, 0.05861566960811615, 0.06187281757593155, 0.06512996554374695, 0.06838711351156235, 0.07164426147937775, 0.07490140944719315, 0.07815855741500854, 0.08141570538282394, 0.08467285335063934, 0.08793000131845474, 0.09118714928627014, 0.09444429725408554, 0.09770144522190094, 0.10095859318971634, 0.10421574115753174, 0.10747288912534714, 0.11073003709316254, 0.11398718506097794]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 7.0, 12.0, 8.0, 13.0, 22.0, 19.0, 22.0, 29.0, 32.0, 43.0, 47.0, 52.0, 48.0, 60.0, 72.0, 51.0, 58.0, 59.0, 55.0, 61.0, 49.0, 34.0, 31.0, 21.0, 21.0, 19.0, 16.0, 10.0, 6.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.10945501923561096, -0.10658486932516098, -0.103714719414711, -0.10084456950426102, -0.09797441959381104, -0.09510426968336105, -0.09223411977291107, -0.08936397731304169, -0.08649381995201111, -0.08362367004156113, -0.08075352013111115, -0.07788337022066116, -0.07501322031021118, -0.0721430703997612, -0.06927292048931122, -0.06640277802944183, -0.06353262811899185, -0.06066247820854187, -0.05779232829809189, -0.05492217838764191, -0.052052028477191925, -0.04918187856674194, -0.04631173238158226, -0.04344158247113228, -0.0405714325606823, -0.037701282650232315, -0.03483113273978233, -0.03196098655462265, -0.02909083478152752, -0.026220684871077538, -0.023350536823272705, -0.020480386912822723, -0.01761024445295334, -0.014740094542503357, -0.01186994556337595, -0.008999796584248543, -0.006129646673798561, -0.0032594967633485794, -0.00038934871554374695, 0.0024808011949062347, 0.005350951105356216, 0.008221101015806198, 0.011091249994933605, 0.013961398974061012, 0.016831548884510994, 0.019701698794960976, 0.022571846842765808, 0.02544199675321579, 0.02831214666366577, 0.031182296574115753, 0.034052446484565735, 0.03692259639501572, 0.0397927463054657, 0.04266289621591568, 0.04553304240107536, 0.048403192311525345, 0.05127334222197533, 0.05414349213242531, 0.05701364204287529, 0.05988378822803497, 0.06275393813848495, 0.06562408804893494, 0.06849423795938492, 0.0713643878698349, 0.07423453778028488]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 6.0, 19.0, 22.0, 22.0, 38.0, 59.0, 93.0, 153.0, 253.0, 465.0, 1012.0, 2106.0, 5131.0, 13736.0, 39461.0, 124006.0, 392705.0, 322263.0, 96511.0, 31245.0, 11182.0, 4302.0, 1888.0, 839.0, 413.0, 248.0, 138.0, 80.0, 42.0, 30.0, 30.0, 22.0, 7.0, 13.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1414794921875, -0.1365833282470703, -0.13168716430664062, -0.12679100036621094, -0.12189483642578125, -0.11699867248535156, -0.11210250854492188, -0.10720634460449219, -0.1023101806640625, -0.09741401672363281, -0.09251785278320312, -0.08762168884277344, -0.08272552490234375, -0.07782936096191406, -0.07293319702148438, -0.06803703308105469, -0.063140869140625, -0.05824470520019531, -0.053348541259765625, -0.04845237731933594, -0.04355621337890625, -0.03866004943847656, -0.033763885498046875, -0.028867721557617188, -0.0239715576171875, -0.019075393676757812, -0.014179229736328125, -0.009283065795898438, -0.00438690185546875, 0.0005092620849609375, 0.005405426025390625, 0.010301589965820312, 0.01519775390625, 0.020093917846679688, 0.024990081787109375, 0.029886245727539062, 0.03478240966796875, 0.03967857360839844, 0.044574737548828125, 0.04947090148925781, 0.0543670654296875, 0.05926322937011719, 0.06415939331054688, 0.06905555725097656, 0.07395172119140625, 0.07884788513183594, 0.08374404907226562, 0.08864021301269531, 0.093536376953125, 0.09843254089355469, 0.10332870483398438, 0.10822486877441406, 0.11312103271484375, 0.11801719665527344, 0.12291336059570312, 0.1278095245361328, 0.1327056884765625, 0.1376018524169922, 0.14249801635742188, 0.14739418029785156, 0.15229034423828125, 0.15718650817871094, 0.16208267211914062, 0.1669788360595703, 0.171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 6.0, 15.0, 18.0, 16.0, 23.0, 21.0, 29.0, 31.0, 45.0, 53.0, 48.0, 71.0, 79.0, 70.0, 66.0, 66.0, 60.0, 58.0, 41.0, 40.0, 33.0, 30.0, 18.0, 22.0, 14.0, 6.0, 7.0, 5.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.145751953125, -0.1402740478515625, -0.134796142578125, -0.1293182373046875, -0.12384033203125, -0.1183624267578125, -0.112884521484375, -0.1074066162109375, -0.1019287109375, -0.0964508056640625, -0.090972900390625, -0.0854949951171875, -0.08001708984375, -0.0745391845703125, -0.069061279296875, -0.0635833740234375, -0.05810546875, -0.0526275634765625, -0.047149658203125, -0.0416717529296875, -0.03619384765625, -0.0307159423828125, -0.025238037109375, -0.0197601318359375, -0.0142822265625, -0.0088043212890625, -0.003326416015625, 0.0021514892578125, 0.00762939453125, 0.0131072998046875, 0.018585205078125, 0.0240631103515625, 0.029541015625, 0.0350189208984375, 0.040496826171875, 0.0459747314453125, 0.05145263671875, 0.0569305419921875, 0.062408447265625, 0.0678863525390625, 0.0733642578125, 0.0788421630859375, 0.084320068359375, 0.0897979736328125, 0.09527587890625, 0.1007537841796875, 0.106231689453125, 0.1117095947265625, 0.1171875, 0.1226654052734375, 0.128143310546875, 0.1336212158203125, 0.13909912109375, 0.1445770263671875, 0.150054931640625, 0.1555328369140625, 0.1610107421875, 0.1664886474609375, 0.171966552734375, 0.1774444580078125, 0.18292236328125, 0.1884002685546875, 0.193878173828125, 0.1993560791015625, 0.204833984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 10.0, 16.0, 15.0, 10.0, 33.0, 44.0, 58.0, 94.0, 129.0, 214.0, 295.0, 520.0, 900.0, 1663.0, 3397.0, 7139.0, 17865.0, 53310.0, 192362.0, 482666.0, 199204.0, 55277.0, 18438.0, 7355.0, 3400.0, 1692.0, 965.0, 559.0, 285.0, 201.0, 147.0, 83.0, 51.0, 45.0, 35.0, 20.0, 14.0, 9.0, 7.0, 5.0, 6.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1456298828125, -0.14069557189941406, -0.13576126098632812, -0.1308269500732422, -0.12589263916015625, -0.12095832824707031, -0.11602401733398438, -0.11108970642089844, -0.1061553955078125, -0.10122108459472656, -0.09628677368164062, -0.09135246276855469, -0.08641815185546875, -0.08148384094238281, -0.07654953002929688, -0.07161521911621094, -0.066680908203125, -0.06174659729003906, -0.056812286376953125, -0.05187797546386719, -0.04694366455078125, -0.04200935363769531, -0.037075042724609375, -0.03214073181152344, -0.0272064208984375, -0.022272109985351562, -0.017337799072265625, -0.012403488159179688, -0.00746917724609375, -0.0025348663330078125, 0.002399444580078125, 0.0073337554931640625, 0.01226806640625, 0.017202377319335938, 0.022136688232421875, 0.027070999145507812, 0.03200531005859375, 0.03693962097167969, 0.041873931884765625, 0.04680824279785156, 0.0517425537109375, 0.05667686462402344, 0.061611175537109375, 0.06654548645019531, 0.07147979736328125, 0.07641410827636719, 0.08134841918945312, 0.08628273010253906, 0.091217041015625, 0.09615135192871094, 0.10108566284179688, 0.10601997375488281, 0.11095428466796875, 0.11588859558105469, 0.12082290649414062, 0.12575721740722656, 0.1306915283203125, 0.13562583923339844, 0.14056015014648438, 0.1454944610595703, 0.15042877197265625, 0.1553630828857422, 0.16029739379882812, 0.16523170471191406, 0.170166015625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 8.0, 10.0, 7.0, 21.0, 11.0, 20.0, 27.0, 32.0, 47.0, 42.0, 73.0, 54.0, 65.0, 77.0, 73.0, 73.0, 74.0, 68.0, 54.0, 30.0, 24.0, 23.0, 14.0, 14.0, 20.0, 12.0, 6.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2191162109375, -0.21310997009277344, -0.20710372924804688, -0.2010974884033203, -0.19509124755859375, -0.1890850067138672, -0.18307876586914062, -0.17707252502441406, -0.1710662841796875, -0.16506004333496094, -0.15905380249023438, -0.1530475616455078, -0.14704132080078125, -0.1410350799560547, -0.13502883911132812, -0.12902259826660156, -0.123016357421875, -0.11701011657714844, -0.11100387573242188, -0.10499763488769531, -0.09899139404296875, -0.09298515319824219, -0.08697891235351562, -0.08097267150878906, -0.0749664306640625, -0.06896018981933594, -0.06295394897460938, -0.05694770812988281, -0.05094146728515625, -0.04493522644042969, -0.038928985595703125, -0.03292274475097656, -0.02691650390625, -0.020910263061523438, -0.014904022216796875, -0.008897781372070312, -0.00289154052734375, 0.0031147003173828125, 0.009120941162109375, 0.015127182006835938, 0.0211334228515625, 0.027139663696289062, 0.033145904541015625, 0.03915214538574219, 0.04515838623046875, 0.05116462707519531, 0.057170867919921875, 0.06317710876464844, 0.069183349609375, 0.07518959045410156, 0.08119583129882812, 0.08720207214355469, 0.09320831298828125, 0.09921455383300781, 0.10522079467773438, 0.11122703552246094, 0.1172332763671875, 0.12323951721191406, 0.12924575805664062, 0.1352519989013672, 0.14125823974609375, 0.1472644805908203, 0.15327072143554688, 0.15927696228027344, 0.165283203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 5.0, 9.0, 7.0, 10.0, 13.0, 18.0, 39.0, 33.0, 46.0, 58.0, 72.0, 97.0, 143.0, 201.0, 300.0, 454.0, 817.0, 1792.0, 3695.0, 8623.0, 22865.0, 72825.0, 451274.0, 378130.0, 68770.0, 22216.0, 8450.0, 3604.0, 1630.0, 841.0, 481.0, 283.0, 192.0, 127.0, 79.0, 71.0, 62.0, 40.0, 30.0, 48.0, 23.0, 15.0, 15.0, 8.0, 7.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 5.0, 0.0, 1.0, 4.0], "bins": [-0.025848388671875, -0.025040149688720703, -0.024231910705566406, -0.02342367172241211, -0.022615432739257812, -0.021807193756103516, -0.02099895477294922, -0.020190715789794922, -0.019382476806640625, -0.018574237823486328, -0.01776599884033203, -0.016957759857177734, -0.016149520874023438, -0.01534128189086914, -0.014533042907714844, -0.013724803924560547, -0.01291656494140625, -0.012108325958251953, -0.011300086975097656, -0.01049184799194336, -0.009683609008789062, -0.008875370025634766, -0.008067131042480469, -0.007258892059326172, -0.006450653076171875, -0.005642414093017578, -0.004834175109863281, -0.004025936126708984, -0.0032176971435546875, -0.0024094581604003906, -0.0016012191772460938, -0.0007929801940917969, 1.52587890625e-05, 0.0008234977722167969, 0.0016317367553710938, 0.0024399757385253906, 0.0032482147216796875, 0.004056453704833984, 0.004864692687988281, 0.005672931671142578, 0.006481170654296875, 0.007289409637451172, 0.008097648620605469, 0.008905887603759766, 0.009714126586914062, 0.01052236557006836, 0.011330604553222656, 0.012138843536376953, 0.01294708251953125, 0.013755321502685547, 0.014563560485839844, 0.01537179946899414, 0.016180038452148438, 0.016988277435302734, 0.01779651641845703, 0.018604755401611328, 0.019412994384765625, 0.020221233367919922, 0.02102947235107422, 0.021837711334228516, 0.022645950317382812, 0.02345418930053711, 0.024262428283691406, 0.025070667266845703, 0.02587890625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 3.0, 2.0, 6.0, 12.0, 13.0, 19.0, 11.0, 46.0, 46.0, 46.0, 83.0, 91.0, 201.0, 115.0, 88.0, 51.0, 45.0, 30.0, 20.0, 22.0, 8.0, 8.0, 7.0, 6.0, 3.0, 4.0, 0.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.092952728271484e-06, -6.888061761856079e-06, -6.683170795440674e-06, -6.4782798290252686e-06, -6.273388862609863e-06, -6.068497896194458e-06, -5.863606929779053e-06, -5.6587159633636475e-06, -5.453824996948242e-06, -5.248934030532837e-06, -5.044043064117432e-06, -4.839152097702026e-06, -4.634261131286621e-06, -4.429370164871216e-06, -4.2244791984558105e-06, -4.019588232040405e-06, -3.814697265625e-06, -3.6098062992095947e-06, -3.4049153327941895e-06, -3.200024366378784e-06, -2.995133399963379e-06, -2.7902424335479736e-06, -2.5853514671325684e-06, -2.380460500717163e-06, -2.175569534301758e-06, -1.9706785678863525e-06, -1.7657876014709473e-06, -1.560896635055542e-06, -1.3560056686401367e-06, -1.1511147022247314e-06, -9.462237358093262e-07, -7.413327693939209e-07, -5.364418029785156e-07, -3.3155083656311035e-07, -1.2665987014770508e-07, 7.82310962677002e-08, 2.8312206268310547e-07, 4.880130290985107e-07, 6.92903995513916e-07, 8.977949619293213e-07, 1.1026859283447266e-06, 1.3075768947601318e-06, 1.5124678611755371e-06, 1.7173588275909424e-06, 1.9222497940063477e-06, 2.127140760421753e-06, 2.332031726837158e-06, 2.5369226932525635e-06, 2.7418136596679688e-06, 2.946704626083374e-06, 3.1515955924987793e-06, 3.3564865589141846e-06, 3.56137752532959e-06, 3.766268491744995e-06, 3.9711594581604e-06, 4.176050424575806e-06, 4.380941390991211e-06, 4.585832357406616e-06, 4.7907233238220215e-06, 4.995614290237427e-06, 5.200505256652832e-06, 5.405396223068237e-06, 5.610287189483643e-06, 5.815178155899048e-06, 6.020069122314453e-06]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 5.0, 9.0, 15.0, 11.0, 14.0, 19.0, 28.0, 16.0, 33.0, 50.0, 55.0, 85.0, 146.0, 184.0, 306.0, 543.0, 1144.0, 2891.0, 10707.0, 85501.0, 861756.0, 69914.0, 9810.0, 2715.0, 1030.0, 541.0, 319.0, 217.0, 135.0, 84.0, 77.0, 43.0, 36.0, 14.0, 16.0, 15.0, 14.0, 12.0, 7.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0791015625, -0.07666492462158203, -0.07422828674316406, -0.0717916488647461, -0.06935501098632812, -0.06691837310791016, -0.06448173522949219, -0.06204509735107422, -0.05960845947265625, -0.05717182159423828, -0.05473518371582031, -0.052298545837402344, -0.049861907958984375, -0.047425270080566406, -0.04498863220214844, -0.04255199432373047, -0.0401153564453125, -0.03767871856689453, -0.03524208068847656, -0.032805442810058594, -0.030368804931640625, -0.027932167053222656, -0.025495529174804688, -0.02305889129638672, -0.02062225341796875, -0.01818561553955078, -0.015748977661132812, -0.013312339782714844, -0.010875701904296875, -0.008439064025878906, -0.0060024261474609375, -0.0035657882690429688, -0.001129150390625, 0.0013074874877929688, 0.0037441253662109375, 0.006180763244628906, 0.008617401123046875, 0.011054039001464844, 0.013490676879882812, 0.01592731475830078, 0.01836395263671875, 0.02080059051513672, 0.023237228393554688, 0.025673866271972656, 0.028110504150390625, 0.030547142028808594, 0.03298377990722656, 0.03542041778564453, 0.0378570556640625, 0.04029369354248047, 0.04273033142089844, 0.045166969299316406, 0.047603607177734375, 0.050040245056152344, 0.05247688293457031, 0.05491352081298828, 0.05735015869140625, 0.05978679656982422, 0.06222343444824219, 0.06466007232666016, 0.06709671020507812, 0.0695333480834961, 0.07196998596191406, 0.07440662384033203, 0.07684326171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 12.0, 18.0, 22.0, 35.0, 76.0, 235.0, 355.0, 143.0, 46.0, 29.0, 18.0, 9.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03961181640625, -0.0381011962890625, -0.036590576171875, -0.0350799560546875, -0.0335693359375, -0.0320587158203125, -0.030548095703125, -0.0290374755859375, -0.02752685546875, -0.0260162353515625, -0.024505615234375, -0.0229949951171875, -0.021484375, -0.0199737548828125, -0.018463134765625, -0.0169525146484375, -0.01544189453125, -0.0139312744140625, -0.012420654296875, -0.0109100341796875, -0.0093994140625, -0.0078887939453125, -0.006378173828125, -0.0048675537109375, -0.00335693359375, -0.0018463134765625, -0.000335693359375, 0.0011749267578125, 0.002685546875, 0.0041961669921875, 0.005706787109375, 0.0072174072265625, 0.00872802734375, 0.0102386474609375, 0.011749267578125, 0.0132598876953125, 0.0147705078125, 0.0162811279296875, 0.017791748046875, 0.0193023681640625, 0.02081298828125, 0.0223236083984375, 0.023834228515625, 0.0253448486328125, 0.02685546875, 0.0283660888671875, 0.029876708984375, 0.0313873291015625, 0.03289794921875, 0.0344085693359375, 0.035919189453125, 0.0374298095703125, 0.0389404296875, 0.0404510498046875, 0.041961669921875, 0.0434722900390625, 0.04498291015625, 0.0464935302734375, 0.048004150390625, 0.0495147705078125, 0.051025390625, 0.0525360107421875, 0.054046630859375, 0.0555572509765625, 0.05706787109375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 8.0, 14.0, 24.0, 38.0, 37.0, 67.0, 112.0, 126.0, 143.0, 133.0, 80.0, 65.0, 48.0, 35.0, 29.0, 12.0, 10.0, 8.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.28596094250679016, -0.27690771222114563, -0.2678544819355011, -0.25880125164985657, -0.24974802136421204, -0.2406947910785675, -0.23164156079292297, -0.22258833050727844, -0.2135351002216339, -0.20448186993598938, -0.19542863965034485, -0.18637540936470032, -0.1773221790790558, -0.16826894879341125, -0.15921571850776672, -0.1501624882221222, -0.14110924303531647, -0.13205601274967194, -0.1230027824640274, -0.11394955217838287, -0.10489632189273834, -0.09584309160709381, -0.08678985387086868, -0.07773662358522415, -0.06868339329957962, -0.05963016301393509, -0.05057693272829056, -0.04152369871735573, -0.0324704684317112, -0.023417238146066666, -0.014364004135131836, -0.005310773849487305, 0.0037424564361572266, 0.012795687653124332, 0.02184891887009144, 0.03090215101838112, 0.03995538130402565, 0.04900861158967018, 0.05806184560060501, 0.06711507588624954, 0.07616830617189407, 0.0852215364575386, 0.09427476674318314, 0.10332800447940826, 0.1123812347650528, 0.12143446505069733, 0.13048769533634186, 0.1395409256219864, 0.14859415590763092, 0.15764738619327545, 0.16670061647891998, 0.17575384676456451, 0.18480707705020905, 0.19386030733585358, 0.2029135525226593, 0.21196678280830383, 0.22102001309394836, 0.2300732433795929, 0.23912647366523743, 0.24817970395088196, 0.2572329342365265, 0.266286164522171, 0.27533939480781555, 0.2843926250934601, 0.2934458553791046]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 4.0, 4.0, 10.0, 9.0, 7.0, 13.0, 13.0, 19.0, 39.0, 22.0, 27.0, 33.0, 28.0, 38.0, 42.0, 39.0, 49.0, 38.0, 39.0, 45.0, 45.0, 43.0, 48.0, 51.0, 44.0, 31.0, 30.0, 23.0, 30.0, 22.0, 15.0, 11.0, 18.0, 18.0, 7.0, 7.0, 14.0, 10.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.20424164831638336, -0.1978919953107834, -0.19154232740402222, -0.18519267439842224, -0.17884302139282227, -0.1724933534860611, -0.16614370048046112, -0.15979403257369995, -0.15344437956809998, -0.1470947265625, -0.14074505865573883, -0.13439540565013885, -0.12804573774337769, -0.12169608473777771, -0.11534643173217773, -0.10899677127599716, -0.10264711081981659, -0.09629745036363602, -0.08994778990745544, -0.08359813690185547, -0.0772484764456749, -0.07089881598949432, -0.06454916298389435, -0.058199502527713776, -0.0518498420715332, -0.04550018161535263, -0.03915052488446236, -0.03280086815357208, -0.02645120769739151, -0.020101547241210938, -0.013751890510320663, -0.007402233779430389, -0.001052558422088623, 0.0052971001714468, 0.011646758764982224, 0.017996417358517647, 0.02434607595205307, 0.030695736408233643, 0.03704539313912392, 0.04339504987001419, 0.04974471032619476, 0.056094370782375336, 0.06244402751326561, 0.06879368424415588, 0.07514334470033646, 0.08149300515651703, 0.087842658162117, 0.09419231861829758, 0.10054197907447815, 0.10689163953065872, 0.1132412999868393, 0.11959095299243927, 0.12594062089920044, 0.13229027390480042, 0.1386399269104004, 0.14498957991600037, 0.15133924782276154, 0.1576889008283615, 0.16403856873512268, 0.17038822174072266, 0.17673787474632263, 0.1830875426530838, 0.18943719565868378, 0.19578686356544495, 0.20213651657104492]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 6.0, 6.0, 3.0, 12.0, 12.0, 12.0, 21.0, 13.0, 25.0, 24.0, 32.0, 47.0, 46.0, 64.0, 79.0, 112.0, 138.0, 160.0, 217.0, 276.0, 322.0, 482.0, 688.0, 1045377.0, 589.0, 362.0, 286.0, 244.0, 208.0, 135.0, 129.0, 81.0, 88.0, 42.0, 48.0, 45.0, 42.0, 31.0, 23.0, 19.0, 16.0, 10.0, 8.0, 7.0, 10.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.3409731984138489, -0.3307224214076996, -0.3204716145992279, -0.3102208375930786, -0.2999700605869293, -0.28971928358078003, -0.27946847677230835, -0.26921769976615906, -0.25896692276000977, -0.24871613085269928, -0.23846535384655, -0.2282145619392395, -0.2179637849330902, -0.20771299302577972, -0.19746220111846924, -0.18721142411231995, -0.17696061730384827, -0.16670982539653778, -0.1564590483903885, -0.146208256483078, -0.1359574794769287, -0.12570668756961823, -0.11545589566230774, -0.10520511120557785, -0.09495432674884796, -0.08470354229211807, -0.07445275783538818, -0.0642019659280777, -0.05395118147134781, -0.04370039701461792, -0.03344960883259773, -0.023198820650577545, -0.012948036193847656, -0.002697249874472618, 0.00755353644490242, 0.017804322764277458, 0.028055109083652496, 0.038305893540382385, 0.04855668172240257, 0.05880746990442276, 0.06905825436115265, 0.07930903881788254, 0.08955982327461243, 0.09981061518192291, 0.1100613996386528, 0.12031218409538269, 0.13056297600269318, 0.14081376791000366, 0.15106454491615295, 0.16131533682346344, 0.17156611382961273, 0.18181690573692322, 0.1920676827430725, 0.202318474650383, 0.21256926655769348, 0.22282004356384277, 0.23307083547115326, 0.24332162737846375, 0.25357240438461304, 0.26382318139076233, 0.274073988199234, 0.2843247652053833, 0.2945755422115326, 0.3048263490200043, 0.31507712602615356]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 1.0, 2.0, 8.0, 8.0, 9.0, 5.0, 3.0, 5.0, 12.0, 5.0, 10.0, 20.0, 45.0, 89.0, 189.0, 461.0, 1350.0, 4549.0, 51442240.0, 16060.0, 3753.0, 1548.0, 507.0, 227.0, 94.0, 49.0, 30.0, 13.0, 10.0, 6.0, 5.0, 11.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-5.0078125, -4.868133544921875, -4.72845458984375, -4.588775634765625, -4.4490966796875, -4.309417724609375, -4.16973876953125, -4.030059814453125, -3.890380859375, -3.750701904296875, -3.61102294921875, -3.471343994140625, -3.3316650390625, -3.191986083984375, -3.05230712890625, -2.912628173828125, -2.77294921875, -2.633270263671875, -2.49359130859375, -2.353912353515625, -2.2142333984375, -2.074554443359375, -1.93487548828125, -1.795196533203125, -1.655517578125, -1.515838623046875, -1.37615966796875, -1.236480712890625, -1.0968017578125, -0.957122802734375, -0.81744384765625, -0.677764892578125, -0.5380859375, -0.398406982421875, -0.25872802734375, -0.119049072265625, 0.0206298828125, 0.160308837890625, 0.29998779296875, 0.439666748046875, 0.579345703125, 0.719024658203125, 0.85870361328125, 0.998382568359375, 1.1380615234375, 1.277740478515625, 1.41741943359375, 1.557098388671875, 1.69677734375, 1.836456298828125, 1.97613525390625, 2.115814208984375, 2.2554931640625, 2.395172119140625, 2.53485107421875, 2.674530029296875, 2.814208984375, 2.953887939453125, 3.09356689453125, 3.233245849609375, 3.3729248046875, 3.512603759765625, 3.65228271484375, 3.791961669921875, 3.931640625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 10.0, 12.0, 22.0, 34.0, 57.0, 71.0, 124.0, 178.0, 278.0, 401.0, 648.0, 967.0, 1530.0, 2340.0, 3590.0, 5670.0, 8294.0, 13257.0, 20602.0, 31808.0, 50445.0, 81232.0, 135990.0, 235898.0, 404451.0, 2452779.0, 1858005.0, 398500.0, 232543.0, 133339.0, 79848.0, 49642.0, 31401.0, 20495.0, 13048.0, 8279.0, 5422.0, 3593.0, 2375.0, 1455.0, 962.0, 619.0, 432.0, 263.0, 172.0, 117.0, 87.0, 53.0, 32.0, 25.0, 16.0, 9.0, 9.0, 1.0, 2.0, 1.0, 4.0, 3.0], "bins": [-0.2509765625, -0.24312973022460938, -0.23528289794921875, -0.22743606567382812, -0.2195892333984375, -0.21174240112304688, -0.20389556884765625, -0.19604873657226562, -0.188201904296875, -0.18035507202148438, -0.17250823974609375, -0.16466140747070312, -0.1568145751953125, -0.14896774291992188, -0.14112091064453125, -0.13327407836914062, -0.12542724609375, -0.11758041381835938, -0.10973358154296875, -0.10188674926757812, -0.0940399169921875, -0.08619308471679688, -0.07834625244140625, -0.07049942016601562, -0.062652587890625, -0.054805755615234375, -0.04695892333984375, -0.039112091064453125, -0.0312652587890625, -0.023418426513671875, -0.01557159423828125, -0.007724761962890625, 0.0001220703125, 0.007968902587890625, 0.01581573486328125, 0.023662567138671875, 0.0315093994140625, 0.039356231689453125, 0.04720306396484375, 0.055049896240234375, 0.062896728515625, 0.07074356079101562, 0.07859039306640625, 0.08643722534179688, 0.0942840576171875, 0.10213088989257812, 0.10997772216796875, 0.11782455444335938, 0.12567138671875, 0.13351821899414062, 0.14136505126953125, 0.14921188354492188, 0.1570587158203125, 0.16490554809570312, 0.17275238037109375, 0.18059921264648438, 0.188446044921875, 0.19629287719726562, 0.20413970947265625, 0.21198654174804688, 0.2198333740234375, 0.22768020629882812, 0.23552703857421875, 0.24337387084960938, 0.251220703125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 3.0, 8.0, 7.0, 5.0, 8.0, 5.0, 15.0, 15.0, 12.0, 16.0, 27.0, 15.0, 21.0, 20.0, 24.0, 22.0, 26.0, 27.0, 49.0, 39.0, 41.0, 38.0, 250.0, 853.0, 41.0, 43.0, 36.0, 44.0, 30.0, 44.0, 26.0, 29.0, 16.0, 18.0, 23.0, 19.0, 18.0, 19.0, 17.0, 10.0, 12.0, 8.0, 7.0, 8.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-1.9716796875, -1.910491943359375, -1.84930419921875, -1.788116455078125, -1.7269287109375, -1.665740966796875, -1.60455322265625, -1.543365478515625, -1.482177734375, -1.420989990234375, -1.35980224609375, -1.298614501953125, -1.2374267578125, -1.176239013671875, -1.11505126953125, -1.053863525390625, -0.99267578125, -0.931488037109375, -0.87030029296875, -0.809112548828125, -0.7479248046875, -0.686737060546875, -0.62554931640625, -0.564361572265625, -0.503173828125, -0.441986083984375, -0.38079833984375, -0.319610595703125, -0.2584228515625, -0.197235107421875, -0.13604736328125, -0.074859619140625, -0.013671875, 0.047515869140625, 0.10870361328125, 0.169891357421875, 0.2310791015625, 0.292266845703125, 0.35345458984375, 0.414642333984375, 0.475830078125, 0.537017822265625, 0.59820556640625, 0.659393310546875, 0.7205810546875, 0.781768798828125, 0.84295654296875, 0.904144287109375, 0.96533203125, 1.026519775390625, 1.08770751953125, 1.148895263671875, 1.2100830078125, 1.271270751953125, 1.33245849609375, 1.393646240234375, 1.454833984375, 1.516021728515625, 1.57720947265625, 1.638397216796875, 1.6995849609375, 1.760772705078125, 1.82196044921875, 1.883148193359375, 1.9443359375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 8.0, 17.0, 29.0, 40.0, 50.0, 74.0, 119.0, 186.0, 305.0, 446.0, 685.0, 1072.0, 1487.0, 2155.0, 3266.0, 4863.0, 7301.0, 10858.0, 16801.0, 25679.0, 40737.0, 65926.0, 111268.0, 191459.0, 325359.0, 502724.0, 3673890.0, 500598.0, 322482.0, 191037.0, 109946.0, 65123.0, 40414.0, 25698.0, 16558.0, 10925.0, 7255.0, 4764.0, 3243.0, 2103.0, 1479.0, 1001.0, 689.0, 462.0, 270.0, 187.0, 132.0, 87.0, 59.0, 46.0, 36.0, 12.0, 15.0, 6.0, 2.0, 1.0], "bins": [-0.250732421875, -0.24346351623535156, -0.23619461059570312, -0.2289257049560547, -0.22165679931640625, -0.2143878936767578, -0.20711898803710938, -0.19985008239746094, -0.1925811767578125, -0.18531227111816406, -0.17804336547851562, -0.1707744598388672, -0.16350555419921875, -0.1562366485595703, -0.14896774291992188, -0.14169883728027344, -0.134429931640625, -0.12716102600097656, -0.11989212036132812, -0.11262321472167969, -0.10535430908203125, -0.09808540344238281, -0.09081649780273438, -0.08354759216308594, -0.0762786865234375, -0.06900978088378906, -0.061740875244140625, -0.05447196960449219, -0.04720306396484375, -0.03993415832519531, -0.032665252685546875, -0.025396347045898438, -0.01812744140625, -0.010858535766601562, -0.003589630126953125, 0.0036792755126953125, 0.01094818115234375, 0.018217086791992188, 0.025485992431640625, 0.03275489807128906, 0.0400238037109375, 0.04729270935058594, 0.054561614990234375, 0.06183052062988281, 0.06909942626953125, 0.07636833190917969, 0.08363723754882812, 0.09090614318847656, 0.098175048828125, 0.10544395446777344, 0.11271286010742188, 0.11998176574707031, 0.12725067138671875, 0.1345195770263672, 0.14178848266601562, 0.14905738830566406, 0.1563262939453125, 0.16359519958496094, 0.17086410522460938, 0.1781330108642578, 0.18540191650390625, 0.1926708221435547, 0.19993972778320312, 0.20720863342285156, 0.2144775390625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 4.0, 15.0, 9.0, 12.0, 13.0, 16.0, 21.0, 19.0, 31.0, 24.0, 32.0, 28.0, 30.0, 29.0, 38.0, 42.0, 41.0, 119.0, 887.0, 146.0, 56.0, 33.0, 39.0, 38.0, 34.0, 37.0, 26.0, 27.0, 28.0, 27.0, 23.0, 16.0, 6.0, 15.0, 11.0, 9.0, 9.0, 8.0, 2.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2744140625, -1.232818603515625, -1.19122314453125, -1.149627685546875, -1.1080322265625, -1.066436767578125, -1.02484130859375, -0.983245849609375, -0.941650390625, -0.900054931640625, -0.85845947265625, -0.816864013671875, -0.7752685546875, -0.733673095703125, -0.69207763671875, -0.650482177734375, -0.60888671875, -0.567291259765625, -0.52569580078125, -0.484100341796875, -0.4425048828125, -0.400909423828125, -0.35931396484375, -0.317718505859375, -0.276123046875, -0.234527587890625, -0.19293212890625, -0.151336669921875, -0.1097412109375, -0.068145751953125, -0.02655029296875, 0.015045166015625, 0.056640625, 0.098236083984375, 0.13983154296875, 0.181427001953125, 0.2230224609375, 0.264617919921875, 0.30621337890625, 0.347808837890625, 0.389404296875, 0.430999755859375, 0.47259521484375, 0.514190673828125, 0.5557861328125, 0.597381591796875, 0.63897705078125, 0.680572509765625, 0.72216796875, 0.763763427734375, 0.80535888671875, 0.846954345703125, 0.8885498046875, 0.930145263671875, 0.97174072265625, 1.013336181640625, 1.054931640625, 1.096527099609375, 1.13812255859375, 1.179718017578125, 1.2213134765625, 1.262908935546875, 1.30450439453125, 1.346099853515625, 1.3876953125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 7.0, 15.0, 13.0, 24.0, 40.0, 49.0, 67.0, 113.0, 143.0, 202.0, 310.0, 453.0, 751.0, 1176.0, 2007.0, 3262.0, 5887.0, 10420.0, 18879.0, 35295.0, 70014.0, 156448.0, 395040.0, 2608640.0, 2293670.0, 386992.0, 153232.0, 69926.0, 34786.0, 18817.0, 10326.0, 5905.0, 3376.0, 1911.0, 1128.0, 710.0, 439.0, 296.0, 202.0, 130.0, 99.0, 76.0, 57.0, 37.0, 20.0, 11.0, 10.0, 8.0, 6.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 3.0], "bins": [-0.41455078125, -0.4015922546386719, -0.38863372802734375, -0.3756752014160156, -0.3627166748046875, -0.3497581481933594, -0.33679962158203125, -0.3238410949707031, -0.310882568359375, -0.2979240417480469, -0.28496551513671875, -0.2720069885253906, -0.2590484619140625, -0.24608993530273438, -0.23313140869140625, -0.22017288208007812, -0.20721435546875, -0.19425582885742188, -0.18129730224609375, -0.16833877563476562, -0.1553802490234375, -0.14242172241210938, -0.12946319580078125, -0.11650466918945312, -0.103546142578125, -0.09058761596679688, -0.07762908935546875, -0.06467056274414062, -0.0517120361328125, -0.038753509521484375, -0.02579498291015625, -0.012836456298828125, 0.0001220703125, 0.013080596923828125, 0.02603912353515625, 0.038997650146484375, 0.0519561767578125, 0.06491470336914062, 0.07787322998046875, 0.09083175659179688, 0.103790283203125, 0.11674880981445312, 0.12970733642578125, 0.14266586303710938, 0.1556243896484375, 0.16858291625976562, 0.18154144287109375, 0.19449996948242188, 0.20745849609375, 0.22041702270507812, 0.23337554931640625, 0.24633407592773438, 0.2592926025390625, 0.2722511291503906, 0.28520965576171875, 0.2981681823730469, 0.311126708984375, 0.3240852355957031, 0.33704376220703125, 0.3500022888183594, 0.3629608154296875, 0.3759193420410156, 0.38887786865234375, 0.4018363952636719, 0.414794921875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 11.0, 13.0, 13.0, 8.0, 13.0, 21.0, 17.0, 24.0, 34.0, 32.0, 35.0, 43.0, 33.0, 50.0, 44.0, 109.0, 603.0, 453.0, 60.0, 53.0, 45.0, 50.0, 34.0, 27.0, 34.0, 25.0, 16.0, 15.0, 24.0, 8.0, 12.0, 15.0, 7.0, 9.0, 9.0, 9.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0390625, -1.0065460205078125, -0.974029541015625, -0.9415130615234375, -0.90899658203125, -0.8764801025390625, -0.843963623046875, -0.8114471435546875, -0.7789306640625, -0.7464141845703125, -0.713897705078125, -0.6813812255859375, -0.64886474609375, -0.6163482666015625, -0.583831787109375, -0.5513153076171875, -0.518798828125, -0.4862823486328125, -0.453765869140625, -0.4212493896484375, -0.38873291015625, -0.3562164306640625, -0.323699951171875, -0.2911834716796875, -0.2586669921875, -0.2261505126953125, -0.193634033203125, -0.1611175537109375, -0.12860107421875, -0.0960845947265625, -0.063568115234375, -0.0310516357421875, 0.00146484375, 0.0339813232421875, 0.066497802734375, 0.0990142822265625, 0.13153076171875, 0.1640472412109375, 0.196563720703125, 0.2290802001953125, 0.2615966796875, 0.2941131591796875, 0.326629638671875, 0.3591461181640625, 0.39166259765625, 0.4241790771484375, 0.456695556640625, 0.4892120361328125, 0.521728515625, 0.5542449951171875, 0.586761474609375, 0.6192779541015625, 0.65179443359375, 0.6843109130859375, 0.716827392578125, 0.7493438720703125, 0.7818603515625, 0.8143768310546875, 0.846893310546875, 0.8794097900390625, 0.91192626953125, 0.9444427490234375, 0.976959228515625, 1.0094757080078125, 1.0419921875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 9.0, 6.0, 22.0, 37.0, 72.0, 139.0, 250.0, 260.0, 123.0, 45.0, 24.0, 13.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.409177303314209, -5.300930500030518, -5.192684173583984, -5.084437370300293, -4.976190567016602, -4.86794376373291, -4.759697437286377, -4.6514506340026855, -4.543204307556152, -4.434957504272461, -4.326711177825928, -4.218464374542236, -4.110217571258545, -4.001971244812012, -3.8937244415283203, -3.785477638244629, -3.6772308349609375, -3.568984270095825, -3.460737466812134, -3.3524909019470215, -3.24424409866333, -3.1359975337982178, -3.0277509689331055, -2.919504165649414, -2.8112576007843018, -2.7030110359191895, -2.594764232635498, -2.4865176677703857, -2.3782711029052734, -2.270024299621582, -2.1617777347564697, -2.0535311698913574, -1.945284128189087, -1.837037444114685, -1.7287907600402832, -1.620544195175171, -1.512297511100769, -1.4040508270263672, -1.2958042621612549, -1.187557578086853, -1.0793108940124512, -0.9710642099380493, -0.8628175854682922, -0.7545709609985352, -0.6463242769241333, -0.5380775928497314, -0.42983096837997437, -0.3215843439102173, -0.21333765983581543, -0.10509100556373596, 0.003155648708343506, 0.11140230298042297, 0.21964895725250244, 0.3278956413269043, 0.4361422657966614, 0.5443888902664185, 0.6526355743408203, 0.7608822584152222, 0.8691288828849792, 0.9773755073547363, 1.0856221914291382, 1.19386887550354, 1.3021154403686523, 1.4103621244430542, 1.518608808517456]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 5.0, 5.0, 6.0, 6.0, 11.0, 12.0, 9.0, 15.0, 20.0, 21.0, 20.0, 29.0, 35.0, 36.0, 32.0, 31.0, 36.0, 39.0, 50.0, 40.0, 44.0, 48.0, 33.0, 32.0, 44.0, 45.0, 45.0, 37.0, 24.0, 28.0, 23.0, 22.0, 22.0, 18.0, 9.0, 15.0, 14.0, 14.0, 9.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3610608577728271, -1.3172632455825806, -1.2734655141830444, -1.2296679019927979, -1.1858702898025513, -1.1420726776123047, -1.0982749462127686, -1.054477334022522, -1.0106797218322754, -0.966882050037384, -0.9230844378471375, -0.8792867660522461, -0.8354891538619995, -0.7916914820671082, -0.7478938102722168, -0.7040961980819702, -0.6602984666824341, -0.6165007948875427, -0.5727031826972961, -0.5289055109024048, -0.4851078689098358, -0.44131022691726685, -0.3975125551223755, -0.3537149131298065, -0.30991727113723755, -0.2661196291446686, -0.22232197225093842, -0.17852431535720825, -0.13472667336463928, -0.09092903137207031, -0.047131359577178955, -0.0033337175846099854, 0.040463924407958984, 0.08426157385110855, 0.12805922329425812, 0.17185688018798828, 0.21565452218055725, 0.2594521641731262, 0.3032498359680176, 0.34704747796058655, 0.3908451199531555, 0.4346427619457245, 0.47844040393829346, 0.5222380757331848, 0.5660357475280762, 0.6098333597183228, 0.6536310315132141, 0.6974287033081055, 0.741226315498352, 0.7850239872932434, 0.82882159948349, 0.8726192712783813, 0.9164168834686279, 0.9602145552635193, 1.0040122270584106, 1.0478098392486572, 1.0916075706481934, 1.13540518283844, 1.179202914237976, 1.2230005264282227, 1.2667981386184692, 1.3105957508087158, 1.354393482208252, 1.3981910943984985, 1.4419887065887451]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 10.0, 15.0, 8.0, 15.0, 21.0, 47.0, 96.0, 159.0, 236.0, 392.0, 692.0, 1129.0, 2030.0, 3649.0, 6925.0, 13467.0, 27552.0, 67617.0, 462355.0, 3231138.0, 272673.0, 54348.0, 23992.0, 11953.0, 6131.0, 3185.0, 1806.0, 957.0, 591.0, 391.0, 230.0, 157.0, 113.0, 74.0, 34.0, 33.0, 22.0, 12.0, 11.0, 7.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0648193359375, -0.06236457824707031, -0.059909820556640625, -0.05745506286621094, -0.05500030517578125, -0.05254554748535156, -0.050090789794921875, -0.04763603210449219, -0.0451812744140625, -0.04272651672363281, -0.040271759033203125, -0.03781700134277344, -0.03536224365234375, -0.03290748596191406, -0.030452728271484375, -0.027997970581054688, -0.025543212890625, -0.023088455200195312, -0.020633697509765625, -0.018178939819335938, -0.01572418212890625, -0.013269424438476562, -0.010814666748046875, -0.008359909057617188, -0.0059051513671875, -0.0034503936767578125, -0.000995635986328125, 0.0014591217041015625, 0.00391387939453125, 0.0063686370849609375, 0.008823394775390625, 0.011278152465820312, 0.01373291015625, 0.016187667846679688, 0.018642425537109375, 0.021097183227539062, 0.02355194091796875, 0.026006698608398438, 0.028461456298828125, 0.030916213989257812, 0.0333709716796875, 0.03582572937011719, 0.038280487060546875, 0.04073524475097656, 0.04319000244140625, 0.04564476013183594, 0.048099517822265625, 0.05055427551269531, 0.053009033203125, 0.05546379089355469, 0.057918548583984375, 0.06037330627441406, 0.06282806396484375, 0.06528282165527344, 0.06773757934570312, 0.07019233703613281, 0.0726470947265625, 0.07510185241699219, 0.07755661010742188, 0.08001136779785156, 0.08246612548828125, 0.08492088317871094, 0.08737564086914062, 0.08983039855957031, 0.09228515625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 4.0, 11.0, 19.0, 16.0, 17.0, 24.0, 28.0, 36.0, 53.0, 51.0, 50.0, 62.0, 81.0, 74.0, 74.0, 56.0, 54.0, 54.0, 47.0, 47.0, 32.0, 19.0, 16.0, 15.0, 10.0, 6.0, 10.0, 7.0, 3.0, 7.0, 0.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03009033203125, -0.028993606567382812, -0.027896881103515625, -0.026800155639648438, -0.02570343017578125, -0.024606704711914062, -0.023509979248046875, -0.022413253784179688, -0.0213165283203125, -0.020219802856445312, -0.019123077392578125, -0.018026351928710938, -0.01692962646484375, -0.015832901000976562, -0.014736175537109375, -0.013639450073242188, -0.012542724609375, -0.011445999145507812, -0.010349273681640625, -0.009252548217773438, -0.00815582275390625, -0.0070590972900390625, -0.005962371826171875, -0.0048656463623046875, -0.0037689208984375, -0.0026721954345703125, -0.001575469970703125, -0.0004787445068359375, 0.00061798095703125, 0.0017147064208984375, 0.002811431884765625, 0.0039081573486328125, 0.0050048828125, 0.0061016082763671875, 0.007198333740234375, 0.008295059204101562, 0.00939178466796875, 0.010488510131835938, 0.011585235595703125, 0.012681961059570312, 0.0137786865234375, 0.014875411987304688, 0.015972137451171875, 0.017068862915039062, 0.01816558837890625, 0.019262313842773438, 0.020359039306640625, 0.021455764770507812, 0.022552490234375, 0.023649215698242188, 0.024745941162109375, 0.025842666625976562, 0.02693939208984375, 0.028036117553710938, 0.029132843017578125, 0.030229568481445312, 0.0313262939453125, 0.03242301940917969, 0.033519744873046875, 0.03461647033691406, 0.03571319580078125, 0.03680992126464844, 0.037906646728515625, 0.03900337219238281, 0.04010009765625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 5.0, 6.0, 15.0, 21.0, 24.0, 36.0, 49.0, 91.0, 130.0, 182.0, 325.0, 525.0, 934.0, 1767.0, 3507.0, 7688.0, 18821.0, 59279.0, 382661.0, 3451607.0, 197212.0, 42145.0, 14624.0, 6161.0, 2929.0, 1504.0, 760.0, 461.0, 315.0, 172.0, 99.0, 50.0, 66.0, 32.0, 17.0, 17.0, 15.0, 11.0, 8.0, 5.0, 1.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07147216796875, -0.06945133209228516, -0.06743049621582031, -0.06540966033935547, -0.06338882446289062, -0.06136798858642578, -0.05934715270996094, -0.057326316833496094, -0.05530548095703125, -0.053284645080566406, -0.05126380920410156, -0.04924297332763672, -0.047222137451171875, -0.04520130157470703, -0.04318046569824219, -0.041159629821777344, -0.0391387939453125, -0.037117958068847656, -0.03509712219238281, -0.03307628631591797, -0.031055450439453125, -0.02903461456298828, -0.027013778686523438, -0.024992942810058594, -0.02297210693359375, -0.020951271057128906, -0.018930435180664062, -0.01690959930419922, -0.014888763427734375, -0.012867927551269531, -0.010847091674804688, -0.008826255798339844, -0.006805419921875, -0.004784584045410156, -0.0027637481689453125, -0.0007429122924804688, 0.001277923583984375, 0.0032987594604492188, 0.0053195953369140625, 0.007340431213378906, 0.00936126708984375, 0.011382102966308594, 0.013402938842773438, 0.015423774719238281, 0.017444610595703125, 0.01946544647216797, 0.021486282348632812, 0.023507118225097656, 0.0255279541015625, 0.027548789978027344, 0.029569625854492188, 0.03159046173095703, 0.033611297607421875, 0.03563213348388672, 0.03765296936035156, 0.039673805236816406, 0.04169464111328125, 0.043715476989746094, 0.04573631286621094, 0.04775714874267578, 0.049777984619140625, 0.05179882049560547, 0.05381965637207031, 0.055840492248535156, 0.057861328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 7.0, 6.0, 7.0, 12.0, 14.0, 12.0, 19.0, 15.0, 33.0, 41.0, 51.0, 98.0, 143.0, 338.0, 1098.0, 1270.0, 415.0, 150.0, 79.0, 78.0, 41.0, 41.0, 26.0, 11.0, 15.0, 13.0, 4.0, 6.0, 10.0, 2.0, 11.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0654296875, -0.06356334686279297, -0.06169700622558594, -0.059830665588378906, -0.057964324951171875, -0.056097984313964844, -0.05423164367675781, -0.05236530303955078, -0.05049896240234375, -0.04863262176513672, -0.04676628112792969, -0.044899940490722656, -0.043033599853515625, -0.041167259216308594, -0.03930091857910156, -0.03743457794189453, -0.0355682373046875, -0.03370189666748047, -0.03183555603027344, -0.029969215393066406, -0.028102874755859375, -0.026236534118652344, -0.024370193481445312, -0.02250385284423828, -0.02063751220703125, -0.01877117156982422, -0.016904830932617188, -0.015038490295410156, -0.013172149658203125, -0.011305809020996094, -0.009439468383789062, -0.007573127746582031, -0.005706787109375, -0.0038404464721679688, -0.0019741058349609375, -0.00010776519775390625, 0.001758575439453125, 0.0036249160766601562, 0.0054912567138671875, 0.007357597351074219, 0.00922393798828125, 0.011090278625488281, 0.012956619262695312, 0.014822959899902344, 0.016689300537109375, 0.018555641174316406, 0.020421981811523438, 0.02228832244873047, 0.0241546630859375, 0.02602100372314453, 0.027887344360351562, 0.029753684997558594, 0.031620025634765625, 0.033486366271972656, 0.03535270690917969, 0.03721904754638672, 0.03908538818359375, 0.04095172882080078, 0.04281806945800781, 0.044684410095214844, 0.046550750732421875, 0.048417091369628906, 0.05028343200683594, 0.05214977264404297, 0.05401611328125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 16.0, 39.0, 154.0, 402.0, 285.0, 86.0, 16.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4441463351249695, -0.43014997243881226, -0.41615357995033264, -0.402157187461853, -0.3881608247756958, -0.3741644620895386, -0.36016806960105896, -0.34617167711257935, -0.3321753144264221, -0.3181789517402649, -0.3041825592517853, -0.29018616676330566, -0.27618980407714844, -0.2621934413909912, -0.2481970489025116, -0.23420067131519318, -0.22020429372787476, -0.20620791614055634, -0.19221153855323792, -0.1782151609659195, -0.16421878337860107, -0.15022240579128265, -0.13622602820396423, -0.12222965061664581, -0.10823327302932739, -0.09423689544200897, -0.08024051785469055, -0.06624414026737213, -0.05224776268005371, -0.03825138509273529, -0.02425500750541687, -0.01025862991809845, 0.0037377476692199707, 0.01773412525653839, 0.03173050284385681, 0.04572688043117523, 0.05972325801849365, 0.07371963560581207, 0.0877160131931305, 0.10171239078044891, 0.11570876836776733, 0.12970514595508575, 0.14370152354240417, 0.1576979011297226, 0.17169427871704102, 0.18569065630435944, 0.19968703389167786, 0.21368341147899628, 0.2276797890663147, 0.24167616665363312, 0.25567254424095154, 0.26966893672943115, 0.2836652994155884, 0.2976616621017456, 0.3116580545902252, 0.32565444707870483, 0.33965080976486206, 0.3536471724510193, 0.3676435649394989, 0.3816399574279785, 0.39563632011413574, 0.40963268280029297, 0.4236290752887726, 0.4376254677772522, 0.4516218304634094]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 8.0, 10.0, 8.0, 16.0, 17.0, 24.0, 27.0, 35.0, 35.0, 40.0, 56.0, 67.0, 53.0, 51.0, 57.0, 76.0, 69.0, 68.0, 53.0, 51.0, 37.0, 37.0, 23.0, 22.0, 15.0, 15.0, 16.0, 12.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1354028582572937, -0.13110730051994324, -0.12681174278259277, -0.1225161999464035, -0.11822064220905304, -0.11392508447170258, -0.10962953418493271, -0.10533398389816284, -0.10103842616081238, -0.09674286842346191, -0.09244731813669205, -0.08815176784992218, -0.08385621011257172, -0.07956065237522125, -0.07526510208845139, -0.07096955180168152, -0.06667399406433105, -0.06237844005227089, -0.058082886040210724, -0.05378733202815056, -0.04949177801609039, -0.04519622400403023, -0.04090066999197006, -0.0366051159799099, -0.03230956196784973, -0.028014007955789566, -0.0237184539437294, -0.019422899931669235, -0.01512734591960907, -0.010831791907548904, -0.006536237895488739, -0.0022406838834285736, 0.002054870128631592, 0.006350424140691757, 0.010645978152751923, 0.014941532164812088, 0.019237086176872253, 0.02353264018893242, 0.027828194200992584, 0.03212374821305275, 0.036419302225112915, 0.04071485623717308, 0.045010410249233246, 0.04930596426129341, 0.05360151827335358, 0.05789707228541374, 0.06219262629747391, 0.06648817658424377, 0.07078373432159424, 0.0750792920589447, 0.07937484234571457, 0.08367039263248444, 0.0879659503698349, 0.09226150810718536, 0.09655705839395523, 0.1008526086807251, 0.10514816641807556, 0.10944372415542603, 0.11373927444219589, 0.11803482472896576, 0.12233038246631622, 0.1266259402036667, 0.13092148303985596, 0.13521704077720642, 0.13951259851455688]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 4.0, 0.0, 4.0, 5.0, 5.0, 13.0, 18.0, 22.0, 24.0, 33.0, 54.0, 74.0, 114.0, 207.0, 291.0, 468.0, 778.0, 1365.0, 2467.0, 4897.0, 10013.0, 23516.0, 64778.0, 248816.0, 490829.0, 128300.0, 40336.0, 15678.0, 7218.0, 3446.0, 1938.0, 1123.0, 622.0, 359.0, 258.0, 147.0, 103.0, 77.0, 47.0, 31.0, 31.0, 20.0, 4.0, 9.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0748291015625, -0.07258033752441406, -0.07033157348632812, -0.06808280944824219, -0.06583404541015625, -0.06358528137207031, -0.061336517333984375, -0.05908775329589844, -0.0568389892578125, -0.05459022521972656, -0.052341461181640625, -0.05009269714355469, -0.04784393310546875, -0.04559516906738281, -0.043346405029296875, -0.04109764099121094, -0.038848876953125, -0.03660011291503906, -0.034351348876953125, -0.03210258483886719, -0.02985382080078125, -0.027605056762695312, -0.025356292724609375, -0.023107528686523438, -0.0208587646484375, -0.018610000610351562, -0.016361236572265625, -0.014112472534179688, -0.01186370849609375, -0.009614944458007812, -0.007366180419921875, -0.0051174163818359375, -0.00286865234375, -0.0006198883056640625, 0.001628875732421875, 0.0038776397705078125, 0.00612640380859375, 0.008375167846679688, 0.010623931884765625, 0.012872695922851562, 0.0151214599609375, 0.017370223999023438, 0.019618988037109375, 0.021867752075195312, 0.02411651611328125, 0.026365280151367188, 0.028614044189453125, 0.030862808227539062, 0.033111572265625, 0.03536033630371094, 0.037609100341796875, 0.03985786437988281, 0.04210662841796875, 0.04435539245605469, 0.046604156494140625, 0.04885292053222656, 0.0511016845703125, 0.05335044860839844, 0.055599212646484375, 0.05784797668457031, 0.06009674072265625, 0.06234550476074219, 0.06459426879882812, 0.06684303283691406, 0.069091796875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 2.0, 10.0, 14.0, 10.0, 16.0, 18.0, 28.0, 34.0, 26.0, 54.0, 43.0, 62.0, 65.0, 58.0, 72.0, 72.0, 62.0, 52.0, 55.0, 39.0, 42.0, 32.0, 37.0, 16.0, 14.0, 20.0, 8.0, 8.0, 5.0, 3.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029266357421875, -0.028245925903320312, -0.027225494384765625, -0.026205062866210938, -0.02518463134765625, -0.024164199829101562, -0.023143768310546875, -0.022123336791992188, -0.0211029052734375, -0.020082473754882812, -0.019062042236328125, -0.018041610717773438, -0.01702117919921875, -0.016000747680664062, -0.014980316162109375, -0.013959884643554688, -0.012939453125, -0.011919021606445312, -0.010898590087890625, -0.009878158569335938, -0.00885772705078125, -0.007837295532226562, -0.006816864013671875, -0.0057964324951171875, -0.0047760009765625, -0.0037555694580078125, -0.002735137939453125, -0.0017147064208984375, -0.00069427490234375, 0.0003261566162109375, 0.001346588134765625, 0.0023670196533203125, 0.003387451171875, 0.0044078826904296875, 0.005428314208984375, 0.0064487457275390625, 0.00746917724609375, 0.008489608764648438, 0.009510040283203125, 0.010530471801757812, 0.0115509033203125, 0.012571334838867188, 0.013591766357421875, 0.014612197875976562, 0.01563262939453125, 0.016653060913085938, 0.017673492431640625, 0.018693923950195312, 0.01971435546875, 0.020734786987304688, 0.021755218505859375, 0.022775650024414062, 0.02379608154296875, 0.024816513061523438, 0.025836944580078125, 0.026857376098632812, 0.0278778076171875, 0.028898239135742188, 0.029918670654296875, 0.030939102172851562, 0.03195953369140625, 0.03297996520996094, 0.034000396728515625, 0.03502082824707031, 0.036041259765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 8.0, 8.0, 7.0, 10.0, 14.0, 24.0, 35.0, 40.0, 60.0, 107.0, 186.0, 452.0, 998.0, 2316.0, 5369.0, 13411.0, 34677.0, 103129.0, 412657.0, 339486.0, 85801.0, 29667.0, 11635.0, 4764.0, 1936.0, 849.0, 386.0, 198.0, 100.0, 67.0, 32.0, 26.0, 26.0, 18.0, 11.0, 11.0, 7.0, 6.0, 6.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.065673828125, -0.06340312957763672, -0.06113243103027344, -0.058861732482910156, -0.056591033935546875, -0.054320335388183594, -0.05204963684082031, -0.04977893829345703, -0.04750823974609375, -0.04523754119873047, -0.04296684265136719, -0.040696144104003906, -0.038425445556640625, -0.036154747009277344, -0.03388404846191406, -0.03161334991455078, -0.0293426513671875, -0.02707195281982422, -0.024801254272460938, -0.022530555725097656, -0.020259857177734375, -0.017989158630371094, -0.015718460083007812, -0.013447761535644531, -0.01117706298828125, -0.008906364440917969, -0.0066356658935546875, -0.004364967346191406, -0.002094268798828125, 0.00017642974853515625, 0.0024471282958984375, 0.004717826843261719, 0.006988525390625, 0.009259223937988281, 0.011529922485351562, 0.013800621032714844, 0.016071319580078125, 0.018342018127441406, 0.020612716674804688, 0.02288341522216797, 0.02515411376953125, 0.02742481231689453, 0.029695510864257812, 0.031966209411621094, 0.034236907958984375, 0.036507606506347656, 0.03877830505371094, 0.04104900360107422, 0.0433197021484375, 0.04559040069580078, 0.04786109924316406, 0.050131797790527344, 0.052402496337890625, 0.054673194885253906, 0.05694389343261719, 0.05921459197998047, 0.06148529052734375, 0.06375598907470703, 0.06602668762207031, 0.0682973861694336, 0.07056808471679688, 0.07283878326416016, 0.07510948181152344, 0.07738018035888672, 0.07965087890625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 8.0, 4.0, 9.0, 8.0, 12.0, 11.0, 12.0, 11.0, 29.0, 22.0, 28.0, 16.0, 25.0, 37.0, 34.0, 36.0, 39.0, 44.0, 35.0, 48.0, 54.0, 50.0, 43.0, 38.0, 33.0, 33.0, 39.0, 29.0, 26.0, 24.0, 28.0, 20.0, 27.0, 20.0, 15.0, 22.0, 8.0, 5.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058746337890625, -0.05666399002075195, -0.054581642150878906, -0.05249929428100586, -0.05041694641113281, -0.048334598541259766, -0.04625225067138672, -0.04416990280151367, -0.042087554931640625, -0.04000520706176758, -0.03792285919189453, -0.035840511322021484, -0.03375816345214844, -0.03167581558227539, -0.029593467712402344, -0.027511119842529297, -0.02542877197265625, -0.023346424102783203, -0.021264076232910156, -0.01918172836303711, -0.017099380493164062, -0.015017032623291016, -0.012934684753417969, -0.010852336883544922, -0.008769989013671875, -0.006687641143798828, -0.004605293273925781, -0.0025229454040527344, -0.0004405975341796875, 0.0016417503356933594, 0.0037240982055664062, 0.005806446075439453, 0.0078887939453125, 0.009971141815185547, 0.012053489685058594, 0.01413583755493164, 0.016218185424804688, 0.018300533294677734, 0.02038288116455078, 0.022465229034423828, 0.024547576904296875, 0.026629924774169922, 0.02871227264404297, 0.030794620513916016, 0.03287696838378906, 0.03495931625366211, 0.037041664123535156, 0.0391240119934082, 0.04120635986328125, 0.0432887077331543, 0.045371055603027344, 0.04745340347290039, 0.04953575134277344, 0.051618099212646484, 0.05370044708251953, 0.05578279495239258, 0.057865142822265625, 0.05994749069213867, 0.06202983856201172, 0.06411218643188477, 0.06619453430175781, 0.06827688217163086, 0.0703592300415039, 0.07244157791137695, 0.07452392578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 2.0, 3.0, 2.0, 3.0, 6.0, 12.0, 12.0, 16.0, 21.0, 37.0, 45.0, 71.0, 95.0, 138.0, 232.0, 404.0, 629.0, 1063.0, 2011.0, 3874.0, 7999.0, 19453.0, 61976.0, 356254.0, 472413.0, 80035.0, 22962.0, 9153.0, 4306.0, 2179.0, 1257.0, 698.0, 425.0, 250.0, 175.0, 104.0, 91.0, 53.0, 28.0, 20.0, 19.0, 12.0, 9.0, 6.0, 2.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01404571533203125, -0.013545632362365723, -0.013045549392700195, -0.012545466423034668, -0.01204538345336914, -0.011545300483703613, -0.011045217514038086, -0.010545134544372559, -0.010045051574707031, -0.009544968605041504, -0.009044885635375977, -0.00854480266571045, -0.008044719696044922, -0.0075446367263793945, -0.007044553756713867, -0.00654447078704834, -0.0060443878173828125, -0.005544304847717285, -0.005044221878051758, -0.0045441389083862305, -0.004044055938720703, -0.0035439729690551758, -0.0030438899993896484, -0.002543807029724121, -0.0020437240600585938, -0.0015436410903930664, -0.001043558120727539, -0.0005434751510620117, -4.3392181396484375e-05, 0.00045669078826904297, 0.0009567737579345703, 0.0014568567276000977, 0.001956939697265625, 0.0024570226669311523, 0.0029571056365966797, 0.003457188606262207, 0.003957271575927734, 0.004457354545593262, 0.004957437515258789, 0.005457520484924316, 0.005957603454589844, 0.006457686424255371, 0.0069577693939208984, 0.007457852363586426, 0.007957935333251953, 0.00845801830291748, 0.008958101272583008, 0.009458184242248535, 0.009958267211914062, 0.01045835018157959, 0.010958433151245117, 0.011458516120910645, 0.011958599090576172, 0.0124586820602417, 0.012958765029907227, 0.013458847999572754, 0.013958930969238281, 0.014459013938903809, 0.014959096908569336, 0.015459179878234863, 0.01595926284790039, 0.016459345817565918, 0.016959428787231445, 0.017459511756896973, 0.0179595947265625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 7.0, 3.0, 11.0, 5.0, 14.0, 16.0, 23.0, 44.0, 28.0, 66.0, 50.0, 72.0, 90.0, 45.0, 97.0, 50.0, 68.0, 43.0, 71.0, 70.0, 24.0, 38.0, 12.0, 22.0, 10.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2186508178710938e-06, -3.1245872378349304e-06, -3.030523657798767e-06, -2.9364600777626038e-06, -2.8423964977264404e-06, -2.748332917690277e-06, -2.6542693376541138e-06, -2.5602057576179504e-06, -2.466142177581787e-06, -2.3720785975456238e-06, -2.2780150175094604e-06, -2.183951437473297e-06, -2.089887857437134e-06, -1.9958242774009705e-06, -1.9017606973648071e-06, -1.8076971173286438e-06, -1.7136335372924805e-06, -1.6195699572563171e-06, -1.5255063772201538e-06, -1.4314427971839905e-06, -1.3373792171478271e-06, -1.2433156371116638e-06, -1.1492520570755005e-06, -1.0551884770393372e-06, -9.611248970031738e-07, -8.670613169670105e-07, -7.729977369308472e-07, -6.789341568946838e-07, -5.848705768585205e-07, -4.908069968223572e-07, -3.9674341678619385e-07, -3.026798367500305e-07, -2.086162567138672e-07, -1.1455267667770386e-07, -2.0489096641540527e-08, 7.35744833946228e-08, 1.6763806343078613e-07, 2.6170164346694946e-07, 3.557652235031128e-07, 4.498288035392761e-07, 5.438923835754395e-07, 6.379559636116028e-07, 7.320195436477661e-07, 8.260831236839294e-07, 9.201467037200928e-07, 1.014210283756256e-06, 1.1082738637924194e-06, 1.2023374438285828e-06, 1.296401023864746e-06, 1.3904646039009094e-06, 1.4845281839370728e-06, 1.578591763973236e-06, 1.6726553440093994e-06, 1.7667189240455627e-06, 1.860782504081726e-06, 1.9548460841178894e-06, 2.0489096641540527e-06, 2.142973244190216e-06, 2.2370368242263794e-06, 2.3311004042625427e-06, 2.425163984298706e-06, 2.5192275643348694e-06, 2.6132911443710327e-06, 2.707354724407196e-06, 2.8014183044433594e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 8.0, 8.0, 17.0, 34.0, 51.0, 97.0, 136.0, 254.0, 451.0, 932.0, 2110.0, 5767.0, 18909.0, 151621.0, 799089.0, 51112.0, 11091.0, 3774.0, 1503.0, 703.0, 388.0, 194.0, 118.0, 66.0, 50.0, 24.0, 15.0, 14.0, 4.0, 11.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047882080078125, -0.04669380187988281, -0.045505523681640625, -0.04431724548339844, -0.04312896728515625, -0.04194068908691406, -0.040752410888671875, -0.03956413269042969, -0.0383758544921875, -0.03718757629394531, -0.035999298095703125, -0.03481101989746094, -0.03362274169921875, -0.03243446350097656, -0.031246185302734375, -0.030057907104492188, -0.02886962890625, -0.027681350708007812, -0.026493072509765625, -0.025304794311523438, -0.02411651611328125, -0.022928237915039062, -0.021739959716796875, -0.020551681518554688, -0.0193634033203125, -0.018175125122070312, -0.016986846923828125, -0.015798568725585938, -0.01461029052734375, -0.013422012329101562, -0.012233734130859375, -0.011045455932617188, -0.009857177734375, -0.008668899536132812, -0.007480621337890625, -0.0062923431396484375, -0.00510406494140625, -0.0039157867431640625, -0.002727508544921875, -0.0015392303466796875, -0.0003509521484375, 0.0008373260498046875, 0.002025604248046875, 0.0032138824462890625, 0.00440216064453125, 0.0055904388427734375, 0.006778717041015625, 0.007966995239257812, 0.0091552734375, 0.010343551635742188, 0.011531829833984375, 0.012720108032226562, 0.01390838623046875, 0.015096664428710938, 0.016284942626953125, 0.017473220825195312, 0.0186614990234375, 0.019849777221679688, 0.021038055419921875, 0.022226333618164062, 0.02341461181640625, 0.024602890014648438, 0.025791168212890625, 0.026979446411132812, 0.028167724609375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 11.0, 8.0, 13.0, 6.0, 8.0, 16.0, 25.0, 43.0, 86.0, 140.0, 191.0, 154.0, 109.0, 52.0, 38.0, 24.0, 16.0, 15.0, 15.0, 8.0, 5.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041290283203125, -0.04025411605834961, -0.03921794891357422, -0.03818178176879883, -0.03714561462402344, -0.03610944747924805, -0.035073280334472656, -0.034037113189697266, -0.033000946044921875, -0.031964778900146484, -0.030928611755371094, -0.029892444610595703, -0.028856277465820312, -0.027820110321044922, -0.02678394317626953, -0.02574777603149414, -0.02471160888671875, -0.02367544174194336, -0.02263927459716797, -0.021603107452392578, -0.020566940307617188, -0.019530773162841797, -0.018494606018066406, -0.017458438873291016, -0.016422271728515625, -0.015386104583740234, -0.014349937438964844, -0.013313770294189453, -0.012277603149414062, -0.011241436004638672, -0.010205268859863281, -0.00916910171508789, -0.0081329345703125, -0.007096767425537109, -0.006060600280761719, -0.005024433135986328, -0.0039882659912109375, -0.002952098846435547, -0.0019159317016601562, -0.0008797645568847656, 0.000156402587890625, 0.0011925697326660156, 0.0022287368774414062, 0.003264904022216797, 0.0043010711669921875, 0.005337238311767578, 0.006373405456542969, 0.007409572601318359, 0.00844573974609375, 0.00948190689086914, 0.010518074035644531, 0.011554241180419922, 0.012590408325195312, 0.013626575469970703, 0.014662742614746094, 0.015698909759521484, 0.016735076904296875, 0.017771244049072266, 0.018807411193847656, 0.019843578338623047, 0.020879745483398438, 0.021915912628173828, 0.02295207977294922, 0.02398824691772461, 0.0250244140625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 11.0, 26.0, 55.0, 120.0, 267.0, 247.0, 144.0, 56.0, 29.0, 16.0, 10.0, 11.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7273724675178528, -0.7053150534629822, -0.6832576990127563, -0.6612002849578857, -0.6391429305076599, -0.6170855164527893, -0.5950281620025635, -0.5729707479476929, -0.5509133338928223, -0.5288559198379517, -0.5067985653877258, -0.4847411513328552, -0.4626837968826294, -0.4406263828277588, -0.41856899857521057, -0.39651161432266235, -0.3744542598724365, -0.3523968756198883, -0.3303394913673401, -0.3082820773124695, -0.28622472286224365, -0.26416730880737305, -0.24210992455482483, -0.2200525403022766, -0.1979951560497284, -0.17593777179718018, -0.15388038754463196, -0.13182298839092255, -0.10976560413837433, -0.08770821988582611, -0.0656508207321167, -0.04359343647956848, -0.021536052227020264, 0.0005213357508182526, 0.02257872372865677, 0.044636115431785583, 0.0666934996843338, 0.08875088393688202, 0.11080828309059143, 0.13286566734313965, 0.15492305159568787, 0.17698043584823608, 0.1990378201007843, 0.2210952192544937, 0.24315260350704193, 0.26520997285842896, 0.28726738691329956, 0.3093247711658478, 0.331382155418396, 0.3534395396709442, 0.37549692392349243, 0.39755433797836304, 0.41961169242858887, 0.4416691064834595, 0.4637264907360077, 0.4857838749885559, 0.5078412294387817, 0.5298986434936523, 0.5519559979438782, 0.5740134119987488, 0.5960707664489746, 0.6181281805038452, 0.6401855945587158, 0.6622429490089417, 0.6843003630638123]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 5.0, 9.0, 1.0, 2.0, 9.0, 4.0, 13.0, 9.0, 13.0, 18.0, 19.0, 24.0, 33.0, 34.0, 35.0, 41.0, 39.0, 41.0, 41.0, 55.0, 43.0, 60.0, 48.0, 43.0, 41.0, 47.0, 43.0, 40.0, 46.0, 26.0, 20.0, 15.0, 22.0, 14.0, 11.0, 11.0, 5.0, 9.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41310280561447144, -0.4009588658809662, -0.38881492614746094, -0.3766709864139557, -0.36452704668045044, -0.3523831367492676, -0.34023916721343994, -0.3280952572822571, -0.31595131754875183, -0.3038073778152466, -0.29166343808174133, -0.2795194983482361, -0.26737555861473083, -0.2552316188812256, -0.24308769404888153, -0.23094376921653748, -0.21879981458187103, -0.20665587484836578, -0.19451193511486053, -0.18236801028251648, -0.17022407054901123, -0.15808013081550598, -0.14593619108200073, -0.13379225134849548, -0.12164831906557083, -0.10950437933206558, -0.09736044704914093, -0.08521650731563568, -0.07307256758213043, -0.06092863529920578, -0.04878469556570053, -0.03664076328277588, -0.02449682354927063, -0.012352886609733105, -0.00020894967019557953, 0.01193498820066452, 0.02407892420887947, 0.03622286021709442, 0.04836679995059967, 0.06051073223352432, 0.07265467196702957, 0.08479861170053482, 0.09694254398345947, 0.10908648371696472, 0.12123042345046997, 0.13337436318397522, 0.14551830291748047, 0.15766222774982452, 0.16980616748332977, 0.18195010721683502, 0.19409404695034027, 0.20623797178268433, 0.21838191151618958, 0.23052585124969482, 0.24266979098320007, 0.2548137307167053, 0.26695767045021057, 0.2791016101837158, 0.29124554991722107, 0.3033894896507263, 0.31553342938423157, 0.3276773691177368, 0.3398212790489197, 0.3519652187824249, 0.3641091585159302]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 7.0, 7.0, 5.0, 9.0, 15.0, 13.0, 17.0, 26.0, 27.0, 42.0, 67.0, 113.0, 101.0, 188.0, 248.0, 372.0, 608.0, 1027.0, 1954.0, 4630.0, 16359.0, 232568.0, 3873885.0, 46572.0, 8587.0, 2930.0, 1498.0, 819.0, 501.0, 294.0, 213.0, 146.0, 106.0, 74.0, 70.0, 45.0, 32.0, 29.0, 14.0, 13.0, 7.0, 17.0, 3.0, 2.0, 5.0, 2.0, 6.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.1993408203125, -0.19296646118164062, -0.18659210205078125, -0.18021774291992188, -0.1738433837890625, -0.16746902465820312, -0.16109466552734375, -0.15472030639648438, -0.148345947265625, -0.14197158813476562, -0.13559722900390625, -0.12922286987304688, -0.1228485107421875, -0.11647415161132812, -0.11009979248046875, -0.10372543334960938, -0.09735107421875, -0.09097671508789062, -0.08460235595703125, -0.07822799682617188, -0.0718536376953125, -0.06547927856445312, -0.05910491943359375, -0.052730560302734375, -0.046356201171875, -0.039981842041015625, -0.03360748291015625, -0.027233123779296875, -0.0208587646484375, -0.014484405517578125, -0.00811004638671875, -0.001735687255859375, 0.004638671875, 0.011013031005859375, 0.01738739013671875, 0.023761749267578125, 0.0301361083984375, 0.036510467529296875, 0.04288482666015625, 0.049259185791015625, 0.055633544921875, 0.062007904052734375, 0.06838226318359375, 0.07475662231445312, 0.0811309814453125, 0.08750534057617188, 0.09387969970703125, 0.10025405883789062, 0.10662841796875, 0.11300277709960938, 0.11937713623046875, 0.12575149536132812, 0.1321258544921875, 0.13850021362304688, 0.14487457275390625, 0.15124893188476562, 0.157623291015625, 0.16399765014648438, 0.17037200927734375, 0.17674636840820312, 0.1831207275390625, 0.18949508666992188, 0.19586944580078125, 0.20224380493164062, 0.2086181640625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 1.0, 7.0, 8.0, 2.0, 8.0, 17.0, 12.0, 23.0, 23.0, 24.0, 39.0, 22.0, 49.0, 46.0, 40.0, 60.0, 57.0, 64.0, 63.0, 47.0, 50.0, 52.0, 32.0, 62.0, 39.0, 29.0, 15.0, 25.0, 16.0, 15.0, 12.0, 9.0, 7.0, 4.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0275726318359375, -0.02665257453918457, -0.02573251724243164, -0.02481245994567871, -0.02389240264892578, -0.02297234535217285, -0.022052288055419922, -0.021132230758666992, -0.020212173461914062, -0.019292116165161133, -0.018372058868408203, -0.017452001571655273, -0.016531944274902344, -0.015611886978149414, -0.014691829681396484, -0.013771772384643555, -0.012851715087890625, -0.011931657791137695, -0.011011600494384766, -0.010091543197631836, -0.009171485900878906, -0.008251428604125977, -0.007331371307373047, -0.006411314010620117, -0.0054912567138671875, -0.004571199417114258, -0.003651142120361328, -0.0027310848236083984, -0.0018110275268554688, -0.0008909702301025391, 2.9087066650390625e-05, 0.0009491443634033203, 0.00186920166015625, 0.0027892589569091797, 0.0037093162536621094, 0.004629373550415039, 0.005549430847167969, 0.0064694881439208984, 0.007389545440673828, 0.008309602737426758, 0.009229660034179688, 0.010149717330932617, 0.011069774627685547, 0.011989831924438477, 0.012909889221191406, 0.013829946517944336, 0.014750003814697266, 0.015670061111450195, 0.016590118408203125, 0.017510175704956055, 0.018430233001708984, 0.019350290298461914, 0.020270347595214844, 0.021190404891967773, 0.022110462188720703, 0.023030519485473633, 0.023950576782226562, 0.024870634078979492, 0.025790691375732422, 0.02671074867248535, 0.02763080596923828, 0.02855086326599121, 0.02947092056274414, 0.03039097785949707, 0.03131103515625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 5.0, 7.0, 17.0, 25.0, 40.0, 95.0, 184.0, 386.0, 902.0, 2279.0, 6687.0, 26702.0, 187229.0, 3248425.0, 647457.0, 56213.0, 11582.0, 3544.0, 1366.0, 614.0, 229.0, 125.0, 54.0, 29.0, 16.0, 10.0, 10.0, 6.0, 4.0, 5.0, 4.0, 4.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.107177734375, -0.10368824005126953, -0.10019874572753906, -0.0967092514038086, -0.09321975708007812, -0.08973026275634766, -0.08624076843261719, -0.08275127410888672, -0.07926177978515625, -0.07577228546142578, -0.07228279113769531, -0.06879329681396484, -0.06530380249023438, -0.061814308166503906, -0.05832481384277344, -0.05483531951904297, -0.0513458251953125, -0.04785633087158203, -0.04436683654785156, -0.040877342224121094, -0.037387847900390625, -0.033898353576660156, -0.030408859252929688, -0.02691936492919922, -0.02342987060546875, -0.01994037628173828, -0.016450881958007812, -0.012961387634277344, -0.009471893310546875, -0.005982398986816406, -0.0024929046630859375, 0.0009965896606445312, 0.004486083984375, 0.007975578308105469, 0.011465072631835938, 0.014954566955566406, 0.018444061279296875, 0.021933555603027344, 0.025423049926757812, 0.02891254425048828, 0.03240203857421875, 0.03589153289794922, 0.03938102722167969, 0.042870521545410156, 0.046360015869140625, 0.049849510192871094, 0.05333900451660156, 0.05682849884033203, 0.0603179931640625, 0.06380748748779297, 0.06729698181152344, 0.0707864761352539, 0.07427597045898438, 0.07776546478271484, 0.08125495910644531, 0.08474445343017578, 0.08823394775390625, 0.09172344207763672, 0.09521293640136719, 0.09870243072509766, 0.10219192504882812, 0.1056814193725586, 0.10917091369628906, 0.11266040802001953, 0.11614990234375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 9.0, 6.0, 12.0, 7.0, 14.0, 16.0, 27.0, 32.0, 47.0, 49.0, 66.0, 82.0, 146.0, 214.0, 372.0, 661.0, 763.0, 549.0, 334.0, 216.0, 103.0, 90.0, 67.0, 44.0, 41.0, 20.0, 17.0, 13.0, 9.0, 6.0, 7.0, 8.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.037841796875, -0.03663301467895508, -0.035424232482910156, -0.034215450286865234, -0.03300666809082031, -0.03179788589477539, -0.03058910369873047, -0.029380321502685547, -0.028171539306640625, -0.026962757110595703, -0.02575397491455078, -0.02454519271850586, -0.023336410522460938, -0.022127628326416016, -0.020918846130371094, -0.019710063934326172, -0.01850128173828125, -0.017292499542236328, -0.016083717346191406, -0.014874935150146484, -0.013666152954101562, -0.01245737075805664, -0.011248588562011719, -0.010039806365966797, -0.008831024169921875, -0.007622241973876953, -0.006413459777832031, -0.005204677581787109, -0.0039958953857421875, -0.0027871131896972656, -0.0015783309936523438, -0.0003695487976074219, 0.0008392333984375, 0.002048015594482422, 0.0032567977905273438, 0.004465579986572266, 0.0056743621826171875, 0.006883144378662109, 0.008091926574707031, 0.009300708770751953, 0.010509490966796875, 0.011718273162841797, 0.012927055358886719, 0.01413583755493164, 0.015344619750976562, 0.016553401947021484, 0.017762184143066406, 0.018970966339111328, 0.02017974853515625, 0.021388530731201172, 0.022597312927246094, 0.023806095123291016, 0.025014877319335938, 0.02622365951538086, 0.02743244171142578, 0.028641223907470703, 0.029850006103515625, 0.031058788299560547, 0.03226757049560547, 0.03347635269165039, 0.03468513488769531, 0.035893917083740234, 0.037102699279785156, 0.03831148147583008, 0.039520263671875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 12.0, 19.0, 34.0, 74.0, 128.0, 204.0, 209.0, 149.0, 84.0, 44.0, 15.0, 12.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3223196268081665, -0.3140208423137665, -0.30572205781936646, -0.29742327332496643, -0.2891244888305664, -0.2808257043361664, -0.27252691984176636, -0.26422810554504395, -0.2559293508529663, -0.24763056635856628, -0.23933178186416626, -0.23103299736976624, -0.2227342128753662, -0.2144354283809662, -0.20613662898540497, -0.19783784449100494, -0.18953904509544373, -0.1812402606010437, -0.17294147610664368, -0.16464269161224365, -0.15634390711784363, -0.1480451226234436, -0.13974632322788239, -0.13144753873348236, -0.12314875423908234, -0.11484996974468231, -0.10655118525028229, -0.09825239330530167, -0.08995360881090164, -0.08165482431650162, -0.073356032371521, -0.06505724787712097, -0.05675843358039856, -0.048459649085998535, -0.04016086086630821, -0.03186207264661789, -0.023563288152217865, -0.01526450365781784, -0.006965715438127518, 0.0013330727815628052, 0.00963185727596283, 0.017930643633008003, 0.026229429990053177, 0.0345282182097435, 0.042827002704143524, 0.05112578719854355, 0.05942457541823387, 0.0677233636379242, 0.07602214813232422, 0.08432093262672424, 0.09261971712112427, 0.10091850906610489, 0.10921729356050491, 0.11751607805490494, 0.12581486999988556, 0.13411365449428558, 0.1424124389886856, 0.15071122348308563, 0.15901000797748566, 0.16730879247188568, 0.1756075918674469, 0.18390637636184692, 0.19220516085624695, 0.20050394535064697, 0.208802729845047]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 9.0, 6.0, 10.0, 8.0, 12.0, 13.0, 18.0, 15.0, 16.0, 24.0, 28.0, 17.0, 21.0, 35.0, 30.0, 36.0, 35.0, 34.0, 38.0, 43.0, 37.0, 38.0, 33.0, 32.0, 28.0, 44.0, 34.0, 30.0, 35.0, 26.0, 28.0, 23.0, 29.0, 14.0, 14.0, 28.0, 18.0, 11.0, 11.0, 5.0, 8.0, 5.0, 8.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0], "bins": [-0.10288834571838379, -0.09980973601341248, -0.09673112630844116, -0.09365251660346985, -0.09057390689849854, -0.08749529719352722, -0.08441668748855591, -0.0813380777835846, -0.07825946807861328, -0.07518085837364197, -0.07210224866867065, -0.06902363896369934, -0.06594502925872803, -0.06286641955375671, -0.0597878098487854, -0.05670920014381409, -0.05363059043884277, -0.05055198073387146, -0.047473371028900146, -0.04439476132392883, -0.04131615161895752, -0.038237541913986206, -0.03515893220901489, -0.03208032250404358, -0.029001712799072266, -0.025923103094100952, -0.02284449338912964, -0.019765883684158325, -0.01668727397918701, -0.013608664274215698, -0.010530054569244385, -0.007451444864273071, -0.004372835159301758, -0.0012942254543304443, 0.0017843842506408691, 0.004862993955612183, 0.007941603660583496, 0.01102021336555481, 0.014098823070526123, 0.017177432775497437, 0.02025604248046875, 0.023334652185440063, 0.026413261890411377, 0.02949187159538269, 0.032570481300354004, 0.03564909100532532, 0.03872770071029663, 0.041806310415267944, 0.04488492012023926, 0.04796352982521057, 0.051042139530181885, 0.0541207492351532, 0.05719935894012451, 0.060277968645095825, 0.06335657835006714, 0.06643518805503845, 0.06951379776000977, 0.07259240746498108, 0.07567101716995239, 0.0787496268749237, 0.08182823657989502, 0.08490684628486633, 0.08798545598983765, 0.09106406569480896, 0.09414267539978027]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 6.0, 5.0, 9.0, 17.0, 26.0, 41.0, 66.0, 83.0, 149.0, 176.0, 290.0, 421.0, 631.0, 970.0, 1481.0, 2324.0, 3649.0, 5773.0, 9620.0, 15923.0, 27872.0, 51881.0, 103539.0, 216405.0, 285621.0, 154178.0, 74100.0, 38847.0, 21410.0, 12435.0, 7550.0, 4687.0, 2865.0, 1934.0, 1184.0, 778.0, 526.0, 327.0, 245.0, 165.0, 106.0, 77.0, 40.0, 35.0, 32.0, 19.0, 18.0, 6.0, 8.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.06182861328125, -0.060024261474609375, -0.05821990966796875, -0.056415557861328125, -0.0546112060546875, -0.052806854248046875, -0.05100250244140625, -0.049198150634765625, -0.047393798828125, -0.045589447021484375, -0.04378509521484375, -0.041980743408203125, -0.0401763916015625, -0.038372039794921875, -0.03656768798828125, -0.034763336181640625, -0.032958984375, -0.031154632568359375, -0.02935028076171875, -0.027545928955078125, -0.0257415771484375, -0.023937225341796875, -0.02213287353515625, -0.020328521728515625, -0.018524169921875, -0.016719818115234375, -0.01491546630859375, -0.013111114501953125, -0.0113067626953125, -0.009502410888671875, -0.00769805908203125, -0.005893707275390625, -0.00408935546875, -0.002285003662109375, -0.00048065185546875, 0.001323699951171875, 0.0031280517578125, 0.004932403564453125, 0.00673675537109375, 0.008541107177734375, 0.010345458984375, 0.012149810791015625, 0.01395416259765625, 0.015758514404296875, 0.0175628662109375, 0.019367218017578125, 0.02117156982421875, 0.022975921630859375, 0.0247802734375, 0.026584625244140625, 0.02838897705078125, 0.030193328857421875, 0.0319976806640625, 0.033802032470703125, 0.03560638427734375, 0.037410736083984375, 0.039215087890625, 0.041019439697265625, 0.04282379150390625, 0.044628143310546875, 0.0464324951171875, 0.048236846923828125, 0.05004119873046875, 0.051845550537109375, 0.05364990234375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 7.0, 10.0, 9.0, 13.0, 24.0, 15.0, 19.0, 20.0, 21.0, 30.0, 34.0, 44.0, 50.0, 46.0, 60.0, 54.0, 52.0, 40.0, 45.0, 38.0, 49.0, 44.0, 36.0, 38.0, 32.0, 35.0, 21.0, 22.0, 13.0, 8.0, 18.0, 8.0, 11.0, 4.0, 9.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.027496337890625, -0.0266878604888916, -0.025879383087158203, -0.025070905685424805, -0.024262428283691406, -0.023453950881958008, -0.02264547348022461, -0.02183699607849121, -0.021028518676757812, -0.020220041275024414, -0.019411563873291016, -0.018603086471557617, -0.01779460906982422, -0.01698613166809082, -0.016177654266357422, -0.015369176864624023, -0.014560699462890625, -0.013752222061157227, -0.012943744659423828, -0.01213526725769043, -0.011326789855957031, -0.010518312454223633, -0.009709835052490234, -0.008901357650756836, -0.008092880249023438, -0.007284402847290039, -0.006475925445556641, -0.005667448043823242, -0.004858970642089844, -0.004050493240356445, -0.003242015838623047, -0.0024335384368896484, -0.00162506103515625, -0.0008165836334228516, -8.106231689453125e-06, 0.0008003711700439453, 0.0016088485717773438, 0.002417325973510742, 0.0032258033752441406, 0.004034280776977539, 0.0048427581787109375, 0.005651235580444336, 0.006459712982177734, 0.007268190383911133, 0.008076667785644531, 0.00888514518737793, 0.009693622589111328, 0.010502099990844727, 0.011310577392578125, 0.012119054794311523, 0.012927532196044922, 0.01373600959777832, 0.014544486999511719, 0.015352964401245117, 0.016161441802978516, 0.016969919204711914, 0.017778396606445312, 0.01858687400817871, 0.01939535140991211, 0.020203828811645508, 0.021012306213378906, 0.021820783615112305, 0.022629261016845703, 0.0234377384185791, 0.0242462158203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 3.0, 11.0, 8.0, 11.0, 16.0, 14.0, 23.0, 12.0, 20.0, 25.0, 23.0, 26.0, 29.0, 28.0, 29.0, 67.0, 99.0, 593.0, 7830.0, 596531.0, 435911.0, 6248.0, 511.0, 133.0, 50.0, 42.0, 35.0, 30.0, 25.0, 35.0, 24.0, 20.0, 15.0, 13.0, 10.0, 6.0, 10.0, 11.0, 4.0, 6.0, 8.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.34130859375, -0.3306312561035156, -0.31995391845703125, -0.3092765808105469, -0.2985992431640625, -0.2879219055175781, -0.27724456787109375, -0.2665672302246094, -0.255889892578125, -0.24521255493164062, -0.23453521728515625, -0.22385787963867188, -0.2131805419921875, -0.20250320434570312, -0.19182586669921875, -0.18114852905273438, -0.17047119140625, -0.15979385375976562, -0.14911651611328125, -0.13843917846679688, -0.1277618408203125, -0.11708450317382812, -0.10640716552734375, -0.09572982788085938, -0.085052490234375, -0.07437515258789062, -0.06369781494140625, -0.053020477294921875, -0.0423431396484375, -0.031665802001953125, -0.02098846435546875, -0.010311126708984375, 0.0003662109375, 0.011043548583984375, 0.02172088623046875, 0.032398223876953125, 0.0430755615234375, 0.053752899169921875, 0.06443023681640625, 0.07510757446289062, 0.085784912109375, 0.09646224975585938, 0.10713958740234375, 0.11781692504882812, 0.1284942626953125, 0.13917160034179688, 0.14984893798828125, 0.16052627563476562, 0.17120361328125, 0.18188095092773438, 0.19255828857421875, 0.20323562622070312, 0.2139129638671875, 0.22459030151367188, 0.23526763916015625, 0.24594497680664062, 0.256622314453125, 0.2672996520996094, 0.27797698974609375, 0.2886543273925781, 0.2993316650390625, 0.3100090026855469, 0.32068634033203125, 0.3313636779785156, 0.342041015625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 12.0, 8.0, 17.0, 10.0, 16.0, 18.0, 19.0, 18.0, 27.0, 21.0, 25.0, 33.0, 28.0, 36.0, 34.0, 29.0, 36.0, 48.0, 42.0, 48.0, 52.0, 40.0, 44.0, 43.0, 40.0, 32.0, 26.0, 26.0, 31.0, 29.0, 19.0, 11.0, 12.0, 8.0, 9.0, 10.0, 10.0, 5.0, 8.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.054779052734375, -0.05305051803588867, -0.051321983337402344, -0.049593448638916016, -0.04786491394042969, -0.04613637924194336, -0.04440784454345703, -0.0426793098449707, -0.040950775146484375, -0.03922224044799805, -0.03749370574951172, -0.03576517105102539, -0.03403663635253906, -0.032308101654052734, -0.030579566955566406, -0.028851032257080078, -0.02712249755859375, -0.025393962860107422, -0.023665428161621094, -0.021936893463134766, -0.020208358764648438, -0.01847982406616211, -0.01675128936767578, -0.015022754669189453, -0.013294219970703125, -0.011565685272216797, -0.009837150573730469, -0.00810861587524414, -0.0063800811767578125, -0.004651546478271484, -0.0029230117797851562, -0.0011944770812988281, 0.0005340576171875, 0.002262592315673828, 0.003991127014160156, 0.005719661712646484, 0.0074481964111328125, 0.00917673110961914, 0.010905265808105469, 0.012633800506591797, 0.014362335205078125, 0.016090869903564453, 0.01781940460205078, 0.01954793930053711, 0.021276473999023438, 0.023005008697509766, 0.024733543395996094, 0.026462078094482422, 0.02819061279296875, 0.029919147491455078, 0.031647682189941406, 0.033376216888427734, 0.03510475158691406, 0.03683328628540039, 0.03856182098388672, 0.04029035568237305, 0.042018890380859375, 0.0437474250793457, 0.04547595977783203, 0.04720449447631836, 0.04893302917480469, 0.050661563873291016, 0.052390098571777344, 0.05411863327026367, 0.05584716796875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 8.0, 8.0, 9.0, 10.0, 12.0, 19.0, 22.0, 36.0, 43.0, 59.0, 105.0, 251.0, 494.0, 1471.0, 4418.0, 16975.0, 126084.0, 789912.0, 88826.0, 13791.0, 3711.0, 1212.0, 479.0, 257.0, 115.0, 79.0, 38.0, 30.0, 19.0, 12.0, 8.0, 8.0, 6.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07220458984375, -0.06966495513916016, -0.06712532043457031, -0.06458568572998047, -0.062046051025390625, -0.05950641632080078, -0.05696678161621094, -0.054427146911621094, -0.05188751220703125, -0.049347877502441406, -0.04680824279785156, -0.04426860809326172, -0.041728973388671875, -0.03918933868408203, -0.03664970397949219, -0.034110069274902344, -0.0315704345703125, -0.029030799865722656, -0.026491165161132812, -0.02395153045654297, -0.021411895751953125, -0.01887226104736328, -0.016332626342773438, -0.013792991638183594, -0.01125335693359375, -0.008713722229003906, -0.0061740875244140625, -0.0036344528198242188, -0.001094818115234375, 0.0014448165893554688, 0.0039844512939453125, 0.006524085998535156, 0.009063720703125, 0.011603355407714844, 0.014142990112304688, 0.01668262481689453, 0.019222259521484375, 0.02176189422607422, 0.024301528930664062, 0.026841163635253906, 0.02938079833984375, 0.031920433044433594, 0.03446006774902344, 0.03699970245361328, 0.039539337158203125, 0.04207897186279297, 0.04461860656738281, 0.047158241271972656, 0.0496978759765625, 0.052237510681152344, 0.05477714538574219, 0.05731678009033203, 0.059856414794921875, 0.06239604949951172, 0.06493568420410156, 0.0674753189086914, 0.07001495361328125, 0.0725545883178711, 0.07509422302246094, 0.07763385772705078, 0.08017349243164062, 0.08271312713623047, 0.08525276184082031, 0.08779239654541016, 0.09033203125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 10.0, 5.0, 11.0, 16.0, 30.0, 31.0, 42.0, 50.0, 90.0, 78.0, 136.0, 116.0, 91.0, 61.0, 50.0, 54.0, 30.0, 23.0, 14.0, 10.0, 8.0, 7.0, 5.0, 1.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0371208190917969e-05, -1.0102987289428711e-05, -9.834766387939453e-06, -9.566545486450195e-06, -9.298324584960938e-06, -9.03010368347168e-06, -8.761882781982422e-06, -8.493661880493164e-06, -8.225440979003906e-06, -7.957220077514648e-06, -7.68899917602539e-06, -7.420778274536133e-06, -7.152557373046875e-06, -6.884336471557617e-06, -6.616115570068359e-06, -6.3478946685791016e-06, -6.079673767089844e-06, -5.811452865600586e-06, -5.543231964111328e-06, -5.27501106262207e-06, -5.0067901611328125e-06, -4.738569259643555e-06, -4.470348358154297e-06, -4.202127456665039e-06, -3.933906555175781e-06, -3.6656856536865234e-06, -3.3974647521972656e-06, -3.129243850708008e-06, -2.86102294921875e-06, -2.592802047729492e-06, -2.3245811462402344e-06, -2.0563602447509766e-06, -1.7881393432617188e-06, -1.519918441772461e-06, -1.2516975402832031e-06, -9.834766387939453e-07, -7.152557373046875e-07, -4.470348358154297e-07, -1.7881393432617188e-07, 8.940696716308594e-08, 3.5762786865234375e-07, 6.258487701416016e-07, 8.940696716308594e-07, 1.1622905731201172e-06, 1.430511474609375e-06, 1.6987323760986328e-06, 1.9669532775878906e-06, 2.2351741790771484e-06, 2.5033950805664062e-06, 2.771615982055664e-06, 3.039836883544922e-06, 3.3080577850341797e-06, 3.5762786865234375e-06, 3.844499588012695e-06, 4.112720489501953e-06, 4.380941390991211e-06, 4.649162292480469e-06, 4.9173831939697266e-06, 5.185604095458984e-06, 5.453824996948242e-06, 5.7220458984375e-06, 5.990266799926758e-06, 6.258487701416016e-06, 6.5267086029052734e-06, 6.794929504394531e-06]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 9.0, 13.0, 10.0, 35.0, 41.0, 44.0, 97.0, 356.0, 4166.0, 962425.0, 80030.0, 968.0, 157.0, 65.0, 44.0, 31.0, 20.0, 17.0, 16.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.131103515625, -0.12722110748291016, -0.12333869934082031, -0.11945629119873047, -0.11557388305664062, -0.11169147491455078, -0.10780906677246094, -0.1039266586303711, -0.10004425048828125, -0.0961618423461914, -0.09227943420410156, -0.08839702606201172, -0.08451461791992188, -0.08063220977783203, -0.07674980163574219, -0.07286739349365234, -0.0689849853515625, -0.06510257720947266, -0.06122016906738281, -0.05733776092529297, -0.053455352783203125, -0.04957294464111328, -0.04569053649902344, -0.041808128356933594, -0.03792572021484375, -0.034043312072753906, -0.030160903930664062, -0.02627849578857422, -0.022396087646484375, -0.01851367950439453, -0.014631271362304688, -0.010748863220214844, -0.006866455078125, -0.0029840469360351562, 0.0008983612060546875, 0.004780769348144531, 0.008663177490234375, 0.012545585632324219, 0.016427993774414062, 0.020310401916503906, 0.02419281005859375, 0.028075218200683594, 0.03195762634277344, 0.03584003448486328, 0.039722442626953125, 0.04360485076904297, 0.04748725891113281, 0.051369667053222656, 0.0552520751953125, 0.059134483337402344, 0.06301689147949219, 0.06689929962158203, 0.07078170776367188, 0.07466411590576172, 0.07854652404785156, 0.0824289321899414, 0.08631134033203125, 0.0901937484741211, 0.09407615661621094, 0.09795856475830078, 0.10184097290039062, 0.10572338104248047, 0.10960578918457031, 0.11348819732666016, 0.11737060546875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 9.0, 8.0, 15.0, 35.0, 39.0, 40.0, 79.0, 109.0, 108.0, 114.0, 100.0, 90.0, 67.0, 56.0, 42.0, 24.0, 25.0, 17.0, 12.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0211944580078125, -0.020565032958984375, -0.01993560791015625, -0.019306182861328125, -0.0186767578125, -0.018047332763671875, -0.01741790771484375, -0.016788482666015625, -0.0161590576171875, -0.015529632568359375, -0.01490020751953125, -0.014270782470703125, -0.013641357421875, -0.013011932373046875, -0.01238250732421875, -0.011753082275390625, -0.0111236572265625, -0.010494232177734375, -0.00986480712890625, -0.009235382080078125, -0.00860595703125, -0.007976531982421875, -0.00734710693359375, -0.006717681884765625, -0.0060882568359375, -0.005458831787109375, -0.00482940673828125, -0.004199981689453125, -0.003570556640625, -0.002941131591796875, -0.00231170654296875, -0.001682281494140625, -0.0010528564453125, -0.000423431396484375, 0.00020599365234375, 0.000835418701171875, 0.00146484375, 0.002094268798828125, 0.00272369384765625, 0.003353118896484375, 0.0039825439453125, 0.004611968994140625, 0.00524139404296875, 0.005870819091796875, 0.006500244140625, 0.007129669189453125, 0.00775909423828125, 0.008388519287109375, 0.0090179443359375, 0.009647369384765625, 0.01027679443359375, 0.010906219482421875, 0.01153564453125, 0.012165069580078125, 0.01279449462890625, 0.013423919677734375, 0.0140533447265625, 0.014682769775390625, 0.01531219482421875, 0.015941619873046875, 0.016571044921875, 0.017200469970703125, 0.01782989501953125, 0.018459320068359375, 0.0190887451171875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [13.0, 82.0, 834.0, 88.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16815470159053802, -0.1013607308268547, -0.03456676006317139, 0.032227203249931335, 0.09902118146419525, 0.16581515967845917, 0.2326091080904007, 0.2994030714035034, 0.36619704961776733, 0.43299102783203125, 0.49978500604629517, 0.5665789842605591, 0.6333729028701782, 0.7001669406890869, 0.766960859298706, 0.83375483751297, 0.9005488157272339, 0.9673427939414978, 1.0341367721557617, 1.1009306907653809, 1.1677247285842896, 1.2345186471939087, 1.3013126850128174, 1.3681066036224365, 1.4349006414413452, 1.5016945600509644, 1.568488597869873, 1.6352825164794922, 1.7020765542984009, 1.76887047290802, 1.8356645107269287, 1.9024584293365479, 1.969252347946167, 2.036046266555786, 2.1028401851654053, 2.1696343421936035, 2.2364282608032227, 2.303222179412842, 2.370016098022461, 2.43681001663208, 2.5036041736602783, 2.5703980922698975, 2.6371920108795166, 2.703986167907715, 2.770780086517334, 2.837574005126953, 2.9043679237365723, 2.9711618423461914, 3.0379557609558105, 3.1047496795654297, 3.171543598175049, 3.238337755203247, 3.305131673812866, 3.3719255924224854, 3.4387195110321045, 3.5055136680603027, 3.572307586669922, 3.639101505279541, 3.70589542388916, 3.7726895809173584, 3.8394834995269775, 3.9062774181365967, 3.973071336746216, 4.039865493774414, 4.106659412384033]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 1.0, 3.0, 4.0, 5.0, 6.0, 8.0, 9.0, 13.0, 13.0, 7.0, 20.0, 23.0, 38.0, 20.0, 30.0, 41.0, 52.0, 51.0, 41.0, 40.0, 43.0, 45.0, 53.0, 50.0, 42.0, 40.0, 33.0, 37.0, 36.0, 30.0, 28.0, 31.0, 22.0, 18.0, 17.0, 13.0, 7.0, 8.0, 8.0, 4.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.2348107099533081, -0.22744937241077423, -0.22008804976940155, -0.21272671222686768, -0.205365389585495, -0.19800405204296112, -0.19064271450042725, -0.18328139185905457, -0.1759200543165207, -0.16855871677398682, -0.16119739413261414, -0.15383605659008026, -0.1464747190475464, -0.1391133964061737, -0.13175205886363983, -0.12439072877168655, -0.11702939867973328, -0.10966806858778, -0.10230673849582672, -0.09494540095329285, -0.08758407086133957, -0.08022274076938629, -0.07286140322685242, -0.06550007313489914, -0.05813874304294586, -0.050777412950992584, -0.04341607913374901, -0.03605474531650543, -0.028693415224552155, -0.021332085132598877, -0.013970751315355301, -0.006609417498111725, 0.0007519125938415527, 0.00811324454843998, 0.015474576503038406, 0.022835908457636833, 0.03019724041223526, 0.03755857050418854, 0.044919904321432114, 0.05228123813867569, 0.05964256823062897, 0.06700389832258224, 0.07436522841453552, 0.0817265659570694, 0.08908789604902267, 0.09644922614097595, 0.10381056368350983, 0.1111718937754631, 0.11853322386741638, 0.12589456140995026, 0.13325588405132294, 0.1406172215938568, 0.1479785442352295, 0.15533988177776337, 0.16270121932029724, 0.17006254196166992, 0.1774238795042038, 0.18478521704673767, 0.19214653968811035, 0.19950787723064423, 0.2068692147731781, 0.21423053741455078, 0.22159187495708466, 0.22895321249961853, 0.2363145351409912]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 6.0, 8.0, 11.0, 17.0, 12.0, 24.0, 29.0, 32.0, 33.0, 50.0, 75.0, 107.0, 188.0, 327.0, 737.0, 2204.0, 10765.0, 125933.0, 3978962.0, 63753.0, 7635.0, 1819.0, 654.0, 314.0, 181.0, 114.0, 68.0, 53.0, 33.0, 29.0, 29.0, 13.0, 17.0, 9.0, 10.0, 5.0, 4.0, 13.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.241943359375, -0.23447608947753906, -0.22700881958007812, -0.2195415496826172, -0.21207427978515625, -0.2046070098876953, -0.19713973999023438, -0.18967247009277344, -0.1822052001953125, -0.17473793029785156, -0.16727066040039062, -0.1598033905029297, -0.15233612060546875, -0.1448688507080078, -0.13740158081054688, -0.12993431091308594, -0.122467041015625, -0.11499977111816406, -0.10753250122070312, -0.10006523132324219, -0.09259796142578125, -0.08513069152832031, -0.07766342163085938, -0.07019615173339844, -0.0627288818359375, -0.05526161193847656, -0.047794342041015625, -0.04032707214355469, -0.03285980224609375, -0.025392532348632812, -0.017925262451171875, -0.010457992553710938, -0.00299072265625, 0.0044765472412109375, 0.011943817138671875, 0.019411087036132812, 0.02687835693359375, 0.03434562683105469, 0.041812896728515625, 0.04928016662597656, 0.0567474365234375, 0.06421470642089844, 0.07168197631835938, 0.07914924621582031, 0.08661651611328125, 0.09408378601074219, 0.10155105590820312, 0.10901832580566406, 0.116485595703125, 0.12395286560058594, 0.13142013549804688, 0.1388874053955078, 0.14635467529296875, 0.1538219451904297, 0.16128921508789062, 0.16875648498535156, 0.1762237548828125, 0.18369102478027344, 0.19115829467773438, 0.1986255645751953, 0.20609283447265625, 0.2135601043701172, 0.22102737426757812, 0.22849464416503906, 0.2359619140625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 9.0, 5.0, 9.0, 11.0, 9.0, 13.0, 15.0, 25.0, 20.0, 19.0, 32.0, 31.0, 35.0, 52.0, 53.0, 56.0, 54.0, 53.0, 68.0, 43.0, 47.0, 52.0, 49.0, 30.0, 31.0, 27.0, 26.0, 20.0, 20.0, 13.0, 15.0, 6.0, 11.0, 9.0, 6.0, 6.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0280303955078125, -0.027153730392456055, -0.02627706527709961, -0.025400400161743164, -0.02452373504638672, -0.023647069931030273, -0.022770404815673828, -0.021893739700317383, -0.021017074584960938, -0.020140409469604492, -0.019263744354248047, -0.0183870792388916, -0.017510414123535156, -0.01663374900817871, -0.015757083892822266, -0.01488041877746582, -0.014003753662109375, -0.01312708854675293, -0.012250423431396484, -0.011373758316040039, -0.010497093200683594, -0.009620428085327148, -0.008743762969970703, -0.007867097854614258, -0.0069904327392578125, -0.006113767623901367, -0.005237102508544922, -0.0043604373931884766, -0.0034837722778320312, -0.002607107162475586, -0.0017304420471191406, -0.0008537769317626953, 2.288818359375e-05, 0.0008995532989501953, 0.0017762184143066406, 0.002652883529663086, 0.0035295486450195312, 0.0044062137603759766, 0.005282878875732422, 0.006159543991088867, 0.0070362091064453125, 0.007912874221801758, 0.008789539337158203, 0.009666204452514648, 0.010542869567871094, 0.011419534683227539, 0.012296199798583984, 0.01317286491394043, 0.014049530029296875, 0.01492619514465332, 0.015802860260009766, 0.01667952537536621, 0.017556190490722656, 0.0184328556060791, 0.019309520721435547, 0.020186185836791992, 0.021062850952148438, 0.021939516067504883, 0.022816181182861328, 0.023692846298217773, 0.02456951141357422, 0.025446176528930664, 0.02632284164428711, 0.027199506759643555, 0.028076171875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 14.0, 13.0, 27.0, 33.0, 43.0, 77.0, 159.0, 301.0, 669.0, 2116.0, 9942.0, 98605.0, 3467504.0, 580332.0, 27998.0, 4375.0, 1134.0, 460.0, 187.0, 94.0, 67.0, 36.0, 29.0, 15.0, 13.0, 9.0, 3.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1790771484375, -0.17325401306152344, -0.16743087768554688, -0.1616077423095703, -0.15578460693359375, -0.1499614715576172, -0.14413833618164062, -0.13831520080566406, -0.1324920654296875, -0.12666893005371094, -0.12084579467773438, -0.11502265930175781, -0.10919952392578125, -0.10337638854980469, -0.09755325317382812, -0.09173011779785156, -0.085906982421875, -0.08008384704589844, -0.07426071166992188, -0.06843757629394531, -0.06261444091796875, -0.05679130554199219, -0.050968170166015625, -0.04514503479003906, -0.0393218994140625, -0.03349876403808594, -0.027675628662109375, -0.021852493286132812, -0.01602935791015625, -0.010206222534179688, -0.004383087158203125, 0.0014400482177734375, 0.00726318359375, 0.013086318969726562, 0.018909454345703125, 0.024732589721679688, 0.03055572509765625, 0.03637886047363281, 0.042201995849609375, 0.04802513122558594, 0.0538482666015625, 0.05967140197753906, 0.06549453735351562, 0.07131767272949219, 0.07714080810546875, 0.08296394348144531, 0.08878707885742188, 0.09461021423339844, 0.100433349609375, 0.10625648498535156, 0.11207962036132812, 0.11790275573730469, 0.12372589111328125, 0.1295490264892578, 0.13537216186523438, 0.14119529724121094, 0.1470184326171875, 0.15284156799316406, 0.15866470336914062, 0.1644878387451172, 0.17031097412109375, 0.1761341094970703, 0.18195724487304688, 0.18778038024902344, 0.193603515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 1.0, 8.0, 7.0, 11.0, 12.0, 17.0, 30.0, 46.0, 49.0, 75.0, 144.0, 202.0, 407.0, 855.0, 940.0, 507.0, 256.0, 171.0, 108.0, 81.0, 41.0, 36.0, 25.0, 13.0, 8.0, 5.0, 6.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.076416015625, -0.0741128921508789, -0.07180976867675781, -0.06950664520263672, -0.06720352172851562, -0.06490039825439453, -0.06259727478027344, -0.060294151306152344, -0.05799102783203125, -0.055687904357910156, -0.05338478088378906, -0.05108165740966797, -0.048778533935546875, -0.04647541046142578, -0.04417228698730469, -0.041869163513183594, -0.0395660400390625, -0.037262916564941406, -0.03495979309082031, -0.03265666961669922, -0.030353546142578125, -0.02805042266845703, -0.025747299194335938, -0.023444175720214844, -0.02114105224609375, -0.018837928771972656, -0.016534805297851562, -0.014231681823730469, -0.011928558349609375, -0.009625434875488281, -0.0073223114013671875, -0.005019187927246094, -0.002716064453125, -0.00041294097900390625, 0.0018901824951171875, 0.004193305969238281, 0.006496429443359375, 0.008799552917480469, 0.011102676391601562, 0.013405799865722656, 0.01570892333984375, 0.018012046813964844, 0.020315170288085938, 0.02261829376220703, 0.024921417236328125, 0.02722454071044922, 0.029527664184570312, 0.031830787658691406, 0.0341339111328125, 0.036437034606933594, 0.03874015808105469, 0.04104328155517578, 0.043346405029296875, 0.04564952850341797, 0.04795265197753906, 0.050255775451660156, 0.05255889892578125, 0.054862022399902344, 0.05716514587402344, 0.05946826934814453, 0.061771392822265625, 0.06407451629638672, 0.06637763977050781, 0.0686807632446289, 0.07098388671875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 8.0, 23.0, 66.0, 275.0, 448.0, 146.0, 32.0, 9.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19829000532627106, -0.17421525716781616, -0.15014050900936127, -0.12606576085090637, -0.10199102014303207, -0.07791627198457718, -0.05384153127670288, -0.029766783118247986, -0.005692034959793091, 0.018382711336016655, 0.0424574576318264, 0.066532202064991, 0.09060695022344589, 0.11468169838190079, 0.13875643908977509, 0.16283118724822998, 0.18690593540668488, 0.21098068356513977, 0.23505543172359467, 0.25913017988204956, 0.28320491313934326, 0.30727967619895935, 0.33135440945625305, 0.35542917251586914, 0.37950390577316284, 0.40357863903045654, 0.42765340209007263, 0.45172813534736633, 0.4758028984069824, 0.4998776316642761, 0.5239523649215698, 0.5480271577835083, 0.572101891040802, 0.5961766242980957, 0.6202513575553894, 0.6443261504173279, 0.6684008836746216, 0.6924756169319153, 0.716550350189209, 0.7406251430511475, 0.7646998763084412, 0.7887746095657349, 0.8128493428230286, 0.836924135684967, 0.8609988689422607, 0.8850736021995544, 0.9091483354568481, 0.9332231283187866, 0.9572978019714355, 0.9813725352287292, 1.005447268486023, 1.0295220613479614, 1.0535967350006104, 1.0776715278625488, 1.1017463207244873, 1.1258209943771362, 1.1498957872390747, 1.1739705801010132, 1.198045253753662, 1.2221200466156006, 1.2461947202682495, 1.270269513130188, 1.2943443059921265, 1.3184189796447754, 1.3424937725067139]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 7.0, 4.0, 9.0, 10.0, 16.0, 11.0, 25.0, 18.0, 24.0, 26.0, 28.0, 34.0, 48.0, 41.0, 44.0, 39.0, 53.0, 45.0, 37.0, 44.0, 50.0, 48.0, 40.0, 38.0, 33.0, 30.0, 32.0, 28.0, 25.0, 21.0, 15.0, 10.0, 14.0, 10.0, 11.0, 4.0, 12.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-0.19571727514266968, -0.19006359577178955, -0.18440990149974823, -0.1787562221288681, -0.17310252785682678, -0.16744884848594666, -0.16179516911506653, -0.1561414897441864, -0.15048779547214508, -0.14483411610126495, -0.13918042182922363, -0.1335267424583435, -0.12787306308746338, -0.12221936881542206, -0.11656568944454193, -0.11091200262308121, -0.10525831580162048, -0.09960462898015976, -0.09395094215869904, -0.08829726278781891, -0.08264357596635818, -0.07698988914489746, -0.07133620977401733, -0.06568252295255661, -0.060028836131095886, -0.05437514930963516, -0.04872146621346474, -0.04306778311729431, -0.03741409629583359, -0.031760409474372864, -0.02610672637820244, -0.020453043282032013, -0.014799356460571289, -0.009145671501755714, -0.0034919865429401398, 0.002161698415875435, 0.00781538337469101, 0.013469068333506584, 0.01912275329232216, 0.024776436388492584, 0.030430123209953308, 0.03608381003141403, 0.04173749312758446, 0.04739117622375488, 0.05304486304521561, 0.05869854986667633, 0.06435222923755646, 0.07000591605901718, 0.0756596028804779, 0.08131328970193863, 0.08696697652339935, 0.09262065589427948, 0.0982743427157402, 0.10392802953720093, 0.10958170890808105, 0.11523539572954178, 0.1208890825510025, 0.12654276192188263, 0.13219645619392395, 0.13785013556480408, 0.1435038149356842, 0.14915750920772552, 0.15481118857860565, 0.16046488285064697, 0.1661185622215271]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 10.0, 5.0, 13.0, 12.0, 20.0, 36.0, 50.0, 86.0, 136.0, 200.0, 408.0, 662.0, 1061.0, 1970.0, 3574.0, 6776.0, 13399.0, 27105.0, 59084.0, 150657.0, 350319.0, 255186.0, 96529.0, 40804.0, 19351.0, 9684.0, 5003.0, 2787.0, 1498.0, 841.0, 512.0, 286.0, 176.0, 103.0, 59.0, 48.0, 25.0, 23.0, 20.0, 12.0, 13.0, 4.0, 3.0, 8.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.07421875, -0.07220029830932617, -0.07018184661865234, -0.06816339492797852, -0.06614494323730469, -0.06412649154663086, -0.06210803985595703, -0.0600895881652832, -0.058071136474609375, -0.05605268478393555, -0.05403423309326172, -0.05201578140258789, -0.04999732971191406, -0.047978878021240234, -0.045960426330566406, -0.04394197463989258, -0.04192352294921875, -0.03990507125854492, -0.037886619567871094, -0.035868167877197266, -0.03384971618652344, -0.03183126449584961, -0.02981281280517578, -0.027794361114501953, -0.025775909423828125, -0.023757457733154297, -0.02173900604248047, -0.01972055435180664, -0.017702102661132812, -0.015683650970458984, -0.013665199279785156, -0.011646747589111328, -0.0096282958984375, -0.007609844207763672, -0.005591392517089844, -0.0035729408264160156, -0.0015544891357421875, 0.0004639625549316406, 0.0024824142456054688, 0.004500865936279297, 0.006519317626953125, 0.008537769317626953, 0.010556221008300781, 0.01257467269897461, 0.014593124389648438, 0.016611576080322266, 0.018630027770996094, 0.020648479461669922, 0.02266693115234375, 0.024685382843017578, 0.026703834533691406, 0.028722286224365234, 0.030740737915039062, 0.03275918960571289, 0.03477764129638672, 0.03679609298706055, 0.038814544677734375, 0.0408329963684082, 0.04285144805908203, 0.04486989974975586, 0.04688835144042969, 0.048906803131103516, 0.050925254821777344, 0.05294370651245117, 0.054962158203125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 7.0, 6.0, 14.0, 17.0, 17.0, 16.0, 29.0, 33.0, 38.0, 42.0, 34.0, 61.0, 58.0, 50.0, 61.0, 61.0, 58.0, 54.0, 59.0, 50.0, 46.0, 28.0, 24.0, 29.0, 27.0, 13.0, 14.0, 13.0, 15.0, 6.0, 2.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02191162109375, -0.021001815795898438, -0.020092010498046875, -0.019182205200195312, -0.01827239990234375, -0.017362594604492188, -0.016452789306640625, -0.015542984008789062, -0.0146331787109375, -0.013723373413085938, -0.012813568115234375, -0.011903762817382812, -0.01099395751953125, -0.010084152221679688, -0.009174346923828125, -0.008264541625976562, -0.007354736328125, -0.0064449310302734375, -0.005535125732421875, -0.0046253204345703125, -0.00371551513671875, -0.0028057098388671875, -0.001895904541015625, -0.0009860992431640625, -7.62939453125e-05, 0.0008335113525390625, 0.001743316650390625, 0.0026531219482421875, 0.00356292724609375, 0.0044727325439453125, 0.005382537841796875, 0.0062923431396484375, 0.0072021484375, 0.008111953735351562, 0.009021759033203125, 0.009931564331054688, 0.01084136962890625, 0.011751174926757812, 0.012660980224609375, 0.013570785522460938, 0.0144805908203125, 0.015390396118164062, 0.016300201416015625, 0.017210006713867188, 0.01811981201171875, 0.019029617309570312, 0.019939422607421875, 0.020849227905273438, 0.021759033203125, 0.022668838500976562, 0.023578643798828125, 0.024488449096679688, 0.02539825439453125, 0.026308059692382812, 0.027217864990234375, 0.028127670288085938, 0.0290374755859375, 0.029947280883789062, 0.030857086181640625, 0.03176689147949219, 0.03267669677734375, 0.03358650207519531, 0.034496307373046875, 0.03540611267089844, 0.03631591796875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 7.0, 8.0, 5.0, 6.0, 8.0, 12.0, 15.0, 18.0, 25.0, 27.0, 40.0, 30.0, 51.0, 63.0, 72.0, 93.0, 162.0, 269.0, 657.0, 2761.0, 14013.0, 84721.0, 607628.0, 289791.0, 38049.0, 7135.0, 1688.0, 461.0, 186.0, 113.0, 70.0, 72.0, 41.0, 44.0, 48.0, 40.0, 33.0, 26.0, 14.0, 15.0, 11.0, 9.0, 8.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1474609375, -0.142822265625, -0.13818359375, -0.133544921875, -0.12890625, -0.124267578125, -0.11962890625, -0.114990234375, -0.1103515625, -0.105712890625, -0.10107421875, -0.096435546875, -0.091796875, -0.087158203125, -0.08251953125, -0.077880859375, -0.0732421875, -0.068603515625, -0.06396484375, -0.059326171875, -0.0546875, -0.050048828125, -0.04541015625, -0.040771484375, -0.0361328125, -0.031494140625, -0.02685546875, -0.022216796875, -0.017578125, -0.012939453125, -0.00830078125, -0.003662109375, 0.0009765625, 0.005615234375, 0.01025390625, 0.014892578125, 0.01953125, 0.024169921875, 0.02880859375, 0.033447265625, 0.0380859375, 0.042724609375, 0.04736328125, 0.052001953125, 0.056640625, 0.061279296875, 0.06591796875, 0.070556640625, 0.0751953125, 0.079833984375, 0.08447265625, 0.089111328125, 0.09375, 0.098388671875, 0.10302734375, 0.107666015625, 0.1123046875, 0.116943359375, 0.12158203125, 0.126220703125, 0.130859375, 0.135498046875, 0.14013671875, 0.144775390625, 0.1494140625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 4.0, 8.0, 4.0, 9.0, 11.0, 15.0, 17.0, 14.0, 23.0, 23.0, 19.0, 25.0, 34.0, 48.0, 52.0, 31.0, 38.0, 48.0, 45.0, 40.0, 52.0, 36.0, 41.0, 43.0, 23.0, 28.0, 30.0, 28.0, 39.0, 27.0, 25.0, 27.0, 18.0, 24.0, 9.0, 13.0, 7.0, 5.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.058258056640625, -0.056387901306152344, -0.05451774597167969, -0.05264759063720703, -0.050777435302734375, -0.04890727996826172, -0.04703712463378906, -0.045166969299316406, -0.04329681396484375, -0.041426658630371094, -0.03955650329589844, -0.03768634796142578, -0.035816192626953125, -0.03394603729248047, -0.03207588195800781, -0.030205726623535156, -0.0283355712890625, -0.026465415954589844, -0.024595260620117188, -0.02272510528564453, -0.020854949951171875, -0.01898479461669922, -0.017114639282226562, -0.015244483947753906, -0.01337432861328125, -0.011504173278808594, -0.009634017944335938, -0.007763862609863281, -0.005893707275390625, -0.004023551940917969, -0.0021533966064453125, -0.00028324127197265625, 0.0015869140625, 0.0034570693969726562, 0.0053272247314453125, 0.007197380065917969, 0.009067535400390625, 0.010937690734863281, 0.012807846069335938, 0.014678001403808594, 0.01654815673828125, 0.018418312072753906, 0.020288467407226562, 0.02215862274169922, 0.024028778076171875, 0.02589893341064453, 0.027769088745117188, 0.029639244079589844, 0.0315093994140625, 0.033379554748535156, 0.03524971008300781, 0.03711986541748047, 0.038990020751953125, 0.04086017608642578, 0.04273033142089844, 0.044600486755371094, 0.04647064208984375, 0.048340797424316406, 0.05021095275878906, 0.05208110809326172, 0.053951263427734375, 0.05582141876220703, 0.05769157409667969, 0.059561729431152344, 0.061431884765625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 10.0, 8.0, 15.0, 18.0, 27.0, 28.0, 41.0, 46.0, 75.0, 113.0, 153.0, 238.0, 307.0, 492.0, 793.0, 1385.0, 2314.0, 4407.0, 10995.0, 49522.0, 837999.0, 110687.0, 15910.0, 5874.0, 2835.0, 1521.0, 941.0, 565.0, 397.0, 255.0, 176.0, 113.0, 90.0, 69.0, 44.0, 20.0, 21.0, 10.0, 10.0, 10.0, 10.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09747314453125, -0.09418582916259766, -0.09089851379394531, -0.08761119842529297, -0.08432388305664062, -0.08103656768798828, -0.07774925231933594, -0.0744619369506836, -0.07117462158203125, -0.0678873062133789, -0.06459999084472656, -0.06131267547607422, -0.058025360107421875, -0.05473804473876953, -0.05145072937011719, -0.048163414001464844, -0.0448760986328125, -0.041588783264160156, -0.03830146789550781, -0.03501415252685547, -0.031726837158203125, -0.02843952178955078, -0.025152206420898438, -0.021864891052246094, -0.01857757568359375, -0.015290260314941406, -0.012002944946289062, -0.008715629577636719, -0.005428314208984375, -0.0021409988403320312, 0.0011463165283203125, 0.004433631896972656, 0.007720947265625, 0.011008262634277344, 0.014295578002929688, 0.01758289337158203, 0.020870208740234375, 0.02415752410888672, 0.027444839477539062, 0.030732154846191406, 0.03401947021484375, 0.037306785583496094, 0.04059410095214844, 0.04388141632080078, 0.047168731689453125, 0.05045604705810547, 0.05374336242675781, 0.057030677795410156, 0.0603179931640625, 0.06360530853271484, 0.06689262390136719, 0.07017993927001953, 0.07346725463867188, 0.07675457000732422, 0.08004188537597656, 0.0833292007446289, 0.08661651611328125, 0.0899038314819336, 0.09319114685058594, 0.09647846221923828, 0.09976577758789062, 0.10305309295654297, 0.10634040832519531, 0.10962772369384766, 0.1129150390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 7.0, 16.0, 27.0, 65.0, 175.0, 346.0, 233.0, 73.0, 21.0, 14.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8848648071289062e-05, -2.815481275320053e-05, -2.7460977435112e-05, -2.6767142117023468e-05, -2.6073306798934937e-05, -2.5379471480846405e-05, -2.4685636162757874e-05, -2.3991800844669342e-05, -2.329796552658081e-05, -2.260413020849228e-05, -2.1910294890403748e-05, -2.1216459572315216e-05, -2.0522624254226685e-05, -1.9828788936138153e-05, -1.913495361804962e-05, -1.844111829996109e-05, -1.774728298187256e-05, -1.7053447663784027e-05, -1.6359612345695496e-05, -1.5665777027606964e-05, -1.4971941709518433e-05, -1.4278106391429901e-05, -1.358427107334137e-05, -1.2890435755252838e-05, -1.2196600437164307e-05, -1.1502765119075775e-05, -1.0808929800987244e-05, -1.0115094482898712e-05, -9.42125916481018e-06, -8.72742384672165e-06, -8.033588528633118e-06, -7.339753210544586e-06, -6.645917892456055e-06, -5.952082574367523e-06, -5.258247256278992e-06, -4.56441193819046e-06, -3.870576620101929e-06, -3.1767413020133972e-06, -2.4829059839248657e-06, -1.7890706658363342e-06, -1.0952353477478027e-06, -4.0140002965927124e-07, 2.9243528842926025e-07, 9.862706065177917e-07, 1.6801059246063232e-06, 2.3739412426948547e-06, 3.0677765607833862e-06, 3.7616118788719177e-06, 4.455447196960449e-06, 5.149282515048981e-06, 5.843117833137512e-06, 6.536953151226044e-06, 7.230788469314575e-06, 7.924623787403107e-06, 8.618459105491638e-06, 9.31229442358017e-06, 1.0006129741668701e-05, 1.0699965059757233e-05, 1.1393800377845764e-05, 1.2087635695934296e-05, 1.2781471014022827e-05, 1.3475306332111359e-05, 1.416914165019989e-05, 1.4862976968288422e-05, 1.5556812286376953e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 4.0, 13.0, 17.0, 16.0, 24.0, 44.0, 86.0, 149.0, 402.0, 1077.0, 3931.0, 21233.0, 333842.0, 646268.0, 33810.0, 5359.0, 1388.0, 430.0, 196.0, 87.0, 49.0, 38.0, 17.0, 9.0, 8.0, 10.0, 8.0, 9.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0667724609375, -0.06455516815185547, -0.06233787536621094, -0.060120582580566406, -0.057903289794921875, -0.055685997009277344, -0.05346870422363281, -0.05125141143798828, -0.04903411865234375, -0.04681682586669922, -0.04459953308105469, -0.042382240295410156, -0.040164947509765625, -0.037947654724121094, -0.03573036193847656, -0.03351306915283203, -0.0312957763671875, -0.02907848358154297, -0.026861190795898438, -0.024643898010253906, -0.022426605224609375, -0.020209312438964844, -0.017992019653320312, -0.01577472686767578, -0.01355743408203125, -0.011340141296386719, -0.009122848510742188, -0.006905555725097656, -0.004688262939453125, -0.0024709701538085938, -0.0002536773681640625, 0.0019636154174804688, 0.004180908203125, 0.006398200988769531, 0.008615493774414062, 0.010832786560058594, 0.013050079345703125, 0.015267372131347656, 0.017484664916992188, 0.01970195770263672, 0.02191925048828125, 0.02413654327392578, 0.026353836059570312, 0.028571128845214844, 0.030788421630859375, 0.033005714416503906, 0.03522300720214844, 0.03744029998779297, 0.0396575927734375, 0.04187488555908203, 0.04409217834472656, 0.046309471130371094, 0.048526763916015625, 0.050744056701660156, 0.05296134948730469, 0.05517864227294922, 0.05739593505859375, 0.05961322784423828, 0.06183052062988281, 0.06404781341552734, 0.06626510620117188, 0.0684823989868164, 0.07069969177246094, 0.07291698455810547, 0.07513427734375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 7.0, 3.0, 11.0, 12.0, 11.0, 19.0, 35.0, 41.0, 65.0, 78.0, 104.0, 129.0, 111.0, 104.0, 73.0, 57.0, 31.0, 29.0, 16.0, 7.0, 10.0, 8.0, 7.0, 5.0, 9.0, 5.0, 3.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0265655517578125, -0.025777101516723633, -0.024988651275634766, -0.0242002010345459, -0.02341175079345703, -0.022623300552368164, -0.021834850311279297, -0.02104640007019043, -0.020257949829101562, -0.019469499588012695, -0.018681049346923828, -0.01789259910583496, -0.017104148864746094, -0.016315698623657227, -0.01552724838256836, -0.014738798141479492, -0.013950347900390625, -0.013161897659301758, -0.01237344741821289, -0.011584997177124023, -0.010796546936035156, -0.010008096694946289, -0.009219646453857422, -0.008431196212768555, -0.0076427459716796875, -0.00685429573059082, -0.006065845489501953, -0.005277395248413086, -0.004488945007324219, -0.0037004947662353516, -0.0029120445251464844, -0.002123594284057617, -0.00133514404296875, -0.0005466938018798828, 0.00024175643920898438, 0.0010302066802978516, 0.0018186569213867188, 0.002607107162475586, 0.003395557403564453, 0.00418400764465332, 0.0049724578857421875, 0.005760908126831055, 0.006549358367919922, 0.007337808609008789, 0.008126258850097656, 0.008914709091186523, 0.00970315933227539, 0.010491609573364258, 0.011280059814453125, 0.012068510055541992, 0.01285696029663086, 0.013645410537719727, 0.014433860778808594, 0.015222311019897461, 0.016010761260986328, 0.016799211502075195, 0.017587661743164062, 0.01837611198425293, 0.019164562225341797, 0.019953012466430664, 0.02074146270751953, 0.0215299129486084, 0.022318363189697266, 0.023106813430786133, 0.023895263671875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 488.0, 511.0, 9.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8775930404663086, -2.810654640197754, -2.74371600151062, -2.6767776012420654, -2.6098389625549316, -2.542900562286377, -2.4759621620178223, -2.4090235233306885, -2.342085123062134, -2.275146722793579, -2.2082080841064453, -2.1412696838378906, -2.074331045150757, -2.007392644882202, -1.940454125404358, -1.8735156059265137, -1.8065770864486694, -1.7396385669708252, -1.672700047492981, -1.6057615280151367, -1.538823127746582, -1.4718846082687378, -1.4049460887908936, -1.3380075693130493, -1.271069049835205, -1.2041305303573608, -1.1371920108795166, -1.070253610610962, -1.0033150911331177, -0.9363765716552734, -0.8694380521774292, -0.802499532699585, -0.7355612516403198, -0.6686227321624756, -0.6016842722892761, -0.5347457528114319, -0.46780726313591003, -0.4008687734603882, -0.33393025398254395, -0.2669917643070221, -0.20005327463150024, -0.1331147849559784, -0.06617628037929535, 0.0007622241973876953, 0.06770071387290955, 0.1346392035484314, 0.20157772302627563, 0.2685162127017975, 0.33545470237731934, 0.4023931920528412, 0.46933168172836304, 0.5362702012062073, 0.6032086610794067, 0.670147180557251, 0.7370857000350952, 0.8040242195129395, 0.8709626793861389, 0.9379011988639832, 1.0048396587371826, 1.0717781782150269, 1.138716697692871, 1.2056550979614258, 1.2725937366485596, 1.3395321369171143, 1.4064706563949585]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 8.0, 9.0, 16.0, 11.0, 23.0, 19.0, 15.0, 25.0, 31.0, 30.0, 33.0, 35.0, 43.0, 39.0, 50.0, 48.0, 43.0, 33.0, 43.0, 55.0, 45.0, 55.0, 37.0, 33.0, 33.0, 28.0, 20.0, 22.0, 16.0, 17.0, 19.0, 10.0, 5.0, 10.0, 8.0, 7.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1744655966758728, -0.16909761726856232, -0.16372965276241302, -0.15836167335510254, -0.15299370884895325, -0.14762572944164276, -0.14225775003433228, -0.13688978552818298, -0.1315218061208725, -0.126153826713562, -0.12078586220741272, -0.11541788280010223, -0.11004991084337234, -0.10468193888664246, -0.09931395947933197, -0.09394598752260208, -0.08857801556587219, -0.0832100436091423, -0.07784207165241241, -0.07247409224510193, -0.06710612028837204, -0.06173814833164215, -0.056370172649621964, -0.051002196967601776, -0.04563422501087189, -0.040266253054142, -0.03489827737212181, -0.029530303552746773, -0.024162329733371735, -0.018794355913996696, -0.013426382094621658, -0.008058406412601471, -0.002690434455871582, 0.002677539363503456, 0.008045513182878494, 0.013413487002253532, 0.01878146082162857, 0.02414943464100361, 0.029517408460378647, 0.034885384142398834, 0.04025335609912872, 0.04562132805585861, 0.0509893037378788, 0.05635727941989899, 0.061725251376628876, 0.06709322333335876, 0.07246120274066925, 0.07782917469739914, 0.08319714665412903, 0.08856511861085892, 0.0939330905675888, 0.09930106997489929, 0.10466904193162918, 0.11003701388835907, 0.11540499329566956, 0.12077296525239944, 0.12614093720912933, 0.13150891661643982, 0.1368768811225891, 0.1422448605298996, 0.14761283993721008, 0.15298080444335938, 0.15834878385066986, 0.16371676325798035, 0.16908472776412964]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 7.0, 7.0, 8.0, 11.0, 11.0, 17.0, 18.0, 20.0, 34.0, 55.0, 72.0, 81.0, 109.0, 167.0, 313.0, 587.0, 1512.0, 5440.0, 32949.0, 1582671.0, 2518010.0, 42334.0, 6408.0, 1735.0, 683.0, 377.0, 194.0, 129.0, 86.0, 59.0, 44.0, 37.0, 36.0, 16.0, 14.0, 10.0, 5.0, 6.0, 8.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11865234375, -0.11426734924316406, -0.10988235473632812, -0.10549736022949219, -0.10111236572265625, -0.09672737121582031, -0.09234237670898438, -0.08795738220214844, -0.0835723876953125, -0.07918739318847656, -0.07480239868164062, -0.07041740417480469, -0.06603240966796875, -0.06164741516113281, -0.057262420654296875, -0.05287742614746094, -0.048492431640625, -0.04410743713378906, -0.039722442626953125, -0.03533744812011719, -0.03095245361328125, -0.026567459106445312, -0.022182464599609375, -0.017797470092773438, -0.0134124755859375, -0.009027481079101562, -0.004642486572265625, -0.0002574920654296875, 0.00412750244140625, 0.008512496948242188, 0.012897491455078125, 0.017282485961914062, 0.02166748046875, 0.026052474975585938, 0.030437469482421875, 0.03482246398925781, 0.03920745849609375, 0.04359245300292969, 0.047977447509765625, 0.05236244201660156, 0.0567474365234375, 0.06113243103027344, 0.06551742553710938, 0.06990242004394531, 0.07428741455078125, 0.07867240905761719, 0.08305740356445312, 0.08744239807128906, 0.091827392578125, 0.09621238708496094, 0.10059738159179688, 0.10498237609863281, 0.10936737060546875, 0.11375236511230469, 0.11813735961914062, 0.12252235412597656, 0.1269073486328125, 0.13129234313964844, 0.13567733764648438, 0.1400623321533203, 0.14444732666015625, 0.1488323211669922, 0.15321731567382812, 0.15760231018066406, 0.1619873046875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 6.0, 3.0, 2.0, 3.0, 9.0, 9.0, 5.0, 11.0, 10.0, 15.0, 17.0, 20.0, 24.0, 25.0, 26.0, 40.0, 28.0, 37.0, 40.0, 59.0, 43.0, 45.0, 59.0, 69.0, 50.0, 39.0, 46.0, 42.0, 38.0, 29.0, 29.0, 25.0, 23.0, 20.0, 16.0, 16.0, 6.0, 8.0, 8.0, 1.0, 4.0, 4.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019866943359375, -0.019012451171875, -0.018157958984375, -0.017303466796875, -0.016448974609375, -0.015594482421875, -0.014739990234375, -0.013885498046875, -0.013031005859375, -0.012176513671875, -0.011322021484375, -0.010467529296875, -0.009613037109375, -0.008758544921875, -0.007904052734375, -0.007049560546875, -0.006195068359375, -0.005340576171875, -0.004486083984375, -0.003631591796875, -0.002777099609375, -0.001922607421875, -0.001068115234375, -0.000213623046875, 0.000640869140625, 0.001495361328125, 0.002349853515625, 0.003204345703125, 0.004058837890625, 0.004913330078125, 0.005767822265625, 0.006622314453125, 0.007476806640625, 0.008331298828125, 0.009185791015625, 0.010040283203125, 0.010894775390625, 0.011749267578125, 0.012603759765625, 0.013458251953125, 0.014312744140625, 0.015167236328125, 0.016021728515625, 0.016876220703125, 0.017730712890625, 0.018585205078125, 0.019439697265625, 0.020294189453125, 0.021148681640625, 0.022003173828125, 0.022857666015625, 0.023712158203125, 0.024566650390625, 0.025421142578125, 0.026275634765625, 0.027130126953125, 0.027984619140625, 0.028839111328125, 0.029693603515625, 0.030548095703125, 0.031402587890625, 0.032257080078125, 0.033111572265625, 0.033966064453125, 0.034820556640625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 6.0, 6.0, 10.0, 21.0, 37.0, 90.0, 159.0, 342.0, 837.0, 2406.0, 40170.0, 3914199.0, 229321.0, 4679.0, 1121.0, 485.0, 210.0, 83.0, 48.0, 27.0, 8.0, 11.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.279541015625, -0.27170372009277344, -0.2638664245605469, -0.2560291290283203, -0.24819183349609375, -0.2403545379638672, -0.23251724243164062, -0.22467994689941406, -0.2168426513671875, -0.20900535583496094, -0.20116806030273438, -0.1933307647705078, -0.18549346923828125, -0.1776561737060547, -0.16981887817382812, -0.16198158264160156, -0.154144287109375, -0.14630699157714844, -0.13846969604492188, -0.1306324005126953, -0.12279510498046875, -0.11495780944824219, -0.10712051391601562, -0.09928321838378906, -0.0914459228515625, -0.08360862731933594, -0.07577133178710938, -0.06793403625488281, -0.06009674072265625, -0.05225944519042969, -0.044422149658203125, -0.03658485412597656, -0.02874755859375, -0.020910263061523438, -0.013072967529296875, -0.0052356719970703125, 0.00260162353515625, 0.010438919067382812, 0.018276214599609375, 0.026113510131835938, 0.0339508056640625, 0.04178810119628906, 0.049625396728515625, 0.05746269226074219, 0.06529998779296875, 0.07313728332519531, 0.08097457885742188, 0.08881187438964844, 0.096649169921875, 0.10448646545410156, 0.11232376098632812, 0.12016105651855469, 0.12799835205078125, 0.1358356475830078, 0.14367294311523438, 0.15151023864746094, 0.1593475341796875, 0.16718482971191406, 0.17502212524414062, 0.1828594207763672, 0.19069671630859375, 0.1985340118408203, 0.20637130737304688, 0.21420860290527344, 0.2220458984375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 10.0, 13.0, 34.0, 54.0, 146.0, 275.0, 722.0, 1254.0, 880.0, 377.0, 180.0, 71.0, 41.0, 10.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1253662109375, -0.12114334106445312, -0.11692047119140625, -0.11269760131835938, -0.1084747314453125, -0.10425186157226562, -0.10002899169921875, -0.09580612182617188, -0.091583251953125, -0.08736038208007812, -0.08313751220703125, -0.07891464233398438, -0.0746917724609375, -0.07046890258789062, -0.06624603271484375, -0.062023162841796875, -0.05780029296875, -0.053577423095703125, -0.04935455322265625, -0.045131683349609375, -0.0409088134765625, -0.036685943603515625, -0.03246307373046875, -0.028240203857421875, -0.024017333984375, -0.019794464111328125, -0.01557159423828125, -0.011348724365234375, -0.0071258544921875, -0.002902984619140625, 0.00131988525390625, 0.005542755126953125, 0.009765625, 0.013988494873046875, 0.01821136474609375, 0.022434234619140625, 0.0266571044921875, 0.030879974365234375, 0.03510284423828125, 0.039325714111328125, 0.043548583984375, 0.047771453857421875, 0.05199432373046875, 0.056217193603515625, 0.0604400634765625, 0.06466293334960938, 0.06888580322265625, 0.07310867309570312, 0.07733154296875, 0.08155441284179688, 0.08577728271484375, 0.09000015258789062, 0.0942230224609375, 0.09844589233398438, 0.10266876220703125, 0.10689163208007812, 0.111114501953125, 0.11533737182617188, 0.11956024169921875, 0.12378311157226562, 0.1280059814453125, 0.13222885131835938, 0.13645172119140625, 0.14067459106445312, 0.1448974609375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 15.0, 49.0, 71.0, 126.0, 169.0, 172.0, 160.0, 85.0, 69.0, 36.0, 19.0, 10.0, 5.0, 0.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.6791143417358398, -0.6659195423126221, -0.6527247428894043, -0.6395299434661865, -0.6263351440429688, -0.613140344619751, -0.5999455451965332, -0.5867507457733154, -0.5735559463500977, -0.5603611469268799, -0.5471663475036621, -0.5339715480804443, -0.5207767486572266, -0.5075819492340088, -0.49438712000846863, -0.48119232058525085, -0.4679974913597107, -0.4548026919364929, -0.44160789251327515, -0.4284130930900574, -0.4152182936668396, -0.4020234942436218, -0.38882866501808167, -0.3756338655948639, -0.3624390661716461, -0.34924426674842834, -0.33604946732521057, -0.3228546679019928, -0.30965983867645264, -0.29646503925323486, -0.2832702398300171, -0.2700754404067993, -0.25688064098358154, -0.24368584156036377, -0.230491042137146, -0.21729622781276703, -0.20410142838954926, -0.19090662896633148, -0.17771181464195251, -0.16451701521873474, -0.15132223069667816, -0.1381274312734604, -0.12493262439966202, -0.11173781752586365, -0.09854301810264587, -0.0853482186794281, -0.07215341180562973, -0.05895860493183136, -0.045763805508613586, -0.032569002360105515, -0.019374199211597443, -0.006179396063089371, 0.007015407085418701, 0.020210206508636475, 0.033405013382434845, 0.046599820256233215, 0.05979461967945099, 0.07298941910266876, 0.08618422597646713, 0.0993790328502655, 0.11257383227348328, 0.12576863169670105, 0.13896343111991882, 0.1521582454442978, 0.16535304486751556]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 15.0, 18.0, 9.0, 19.0, 16.0, 22.0, 28.0, 36.0, 35.0, 42.0, 54.0, 53.0, 42.0, 48.0, 53.0, 47.0, 53.0, 51.0, 47.0, 31.0, 38.0, 28.0, 34.0, 36.0, 28.0, 17.0, 26.0, 18.0, 14.0, 7.0, 9.0, 4.0, 9.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22015070915222168, -0.21260683238506317, -0.20506295561790466, -0.19751906394958496, -0.18997518718242645, -0.18243131041526794, -0.17488743364810944, -0.16734355688095093, -0.15979966521263123, -0.15225578844547272, -0.1447119116783142, -0.1371680200099945, -0.129624143242836, -0.12208026647567749, -0.11453638970851898, -0.10699251294136047, -0.09944863617420197, -0.09190475940704346, -0.08436087518930435, -0.07681699842214584, -0.06927311420440674, -0.06172923743724823, -0.05418536067008972, -0.046641480177640915, -0.03909759968519211, -0.0315537191927433, -0.024009840562939644, -0.016465961933135986, -0.00892208144068718, -0.0013782009482383728, 0.0061656758189201355, 0.013709556311368942, 0.02125343680381775, 0.028797317296266556, 0.03634119778871536, 0.04388507455587387, 0.05142895504832268, 0.058972835540771484, 0.06651671230792999, 0.0740605890750885, 0.0816044732928276, 0.08914835005998611, 0.09669223427772522, 0.10423611104488373, 0.11177998781204224, 0.11932387202978134, 0.12686774134635925, 0.13441163301467896, 0.14195550978183746, 0.14949938654899597, 0.15704326331615448, 0.164587140083313, 0.1721310317516327, 0.1796749085187912, 0.1872187852859497, 0.19476266205310822, 0.20230653882026672, 0.20985041558742523, 0.21739429235458374, 0.22493818402290344, 0.23248206079006195, 0.24002593755722046, 0.24756981432437897, 0.2551136910915375, 0.2626575827598572]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 9.0, 7.0, 9.0, 7.0, 15.0, 20.0, 26.0, 50.0, 86.0, 138.0, 261.0, 503.0, 1081.0, 2281.0, 4895.0, 11073.0, 25819.0, 65299.0, 191863.0, 416949.0, 208756.0, 70307.0, 27549.0, 11637.0, 5049.0, 2515.0, 1131.0, 572.0, 287.0, 126.0, 76.0, 37.0, 33.0, 21.0, 8.0, 10.0, 7.0, 7.0, 5.0, 2.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07867431640625, -0.07591724395751953, -0.07316017150878906, -0.0704030990600586, -0.06764602661132812, -0.06488895416259766, -0.06213188171386719, -0.05937480926513672, -0.05661773681640625, -0.05386066436767578, -0.05110359191894531, -0.048346519470214844, -0.045589447021484375, -0.042832374572753906, -0.04007530212402344, -0.03731822967529297, -0.0345611572265625, -0.03180408477783203, -0.029047012329101562, -0.026289939880371094, -0.023532867431640625, -0.020775794982910156, -0.018018722534179688, -0.015261650085449219, -0.01250457763671875, -0.009747505187988281, -0.0069904327392578125, -0.004233360290527344, -0.001476287841796875, 0.0012807846069335938, 0.0040378570556640625, 0.006794929504394531, 0.009552001953125, 0.012309074401855469, 0.015066146850585938, 0.017823219299316406, 0.020580291748046875, 0.023337364196777344, 0.026094436645507812, 0.02885150909423828, 0.03160858154296875, 0.03436565399169922, 0.03712272644042969, 0.039879798889160156, 0.042636871337890625, 0.045393943786621094, 0.04815101623535156, 0.05090808868408203, 0.0536651611328125, 0.05642223358154297, 0.05917930603027344, 0.061936378479003906, 0.06469345092773438, 0.06745052337646484, 0.07020759582519531, 0.07296466827392578, 0.07572174072265625, 0.07847881317138672, 0.08123588562011719, 0.08399295806884766, 0.08675003051757812, 0.0895071029663086, 0.09226417541503906, 0.09502124786376953, 0.0977783203125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 8.0, 11.0, 14.0, 24.0, 27.0, 29.0, 29.0, 39.0, 56.0, 43.0, 48.0, 65.0, 67.0, 63.0, 69.0, 57.0, 62.0, 55.0, 49.0, 40.0, 27.0, 34.0, 19.0, 20.0, 17.0, 15.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022369384765625, -0.021266937255859375, -0.02016448974609375, -0.019062042236328125, -0.0179595947265625, -0.016857147216796875, -0.01575469970703125, -0.014652252197265625, -0.0135498046875, -0.012447357177734375, -0.01134490966796875, -0.010242462158203125, -0.0091400146484375, -0.008037567138671875, -0.00693511962890625, -0.005832672119140625, -0.004730224609375, -0.003627777099609375, -0.00252532958984375, -0.001422882080078125, -0.0003204345703125, 0.000782012939453125, 0.00188446044921875, 0.002986907958984375, 0.00408935546875, 0.005191802978515625, 0.00629425048828125, 0.007396697998046875, 0.0084991455078125, 0.009601593017578125, 0.01070404052734375, 0.011806488037109375, 0.012908935546875, 0.014011383056640625, 0.01511383056640625, 0.016216278076171875, 0.0173187255859375, 0.018421173095703125, 0.01952362060546875, 0.020626068115234375, 0.021728515625, 0.022830963134765625, 0.02393341064453125, 0.025035858154296875, 0.0261383056640625, 0.027240753173828125, 0.02834320068359375, 0.029445648193359375, 0.030548095703125, 0.031650543212890625, 0.03275299072265625, 0.033855438232421875, 0.0349578857421875, 0.036060333251953125, 0.03716278076171875, 0.038265228271484375, 0.03936767578125, 0.040470123291015625, 0.04157257080078125, 0.042675018310546875, 0.0437774658203125, 0.044879913330078125, 0.04598236083984375, 0.047084808349609375, 0.048187255859375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 7.0, 6.0, 10.0, 15.0, 10.0, 16.0, 13.0, 24.0, 21.0, 37.0, 38.0, 69.0, 116.0, 152.0, 305.0, 687.0, 1707.0, 4660.0, 14219.0, 49646.0, 222513.0, 535324.0, 163075.0, 38190.0, 11244.0, 3761.0, 1338.0, 583.0, 271.0, 151.0, 95.0, 59.0, 39.0, 37.0, 24.0, 17.0, 19.0, 16.0, 12.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.102294921875, -0.09869384765625, -0.0950927734375, -0.09149169921875, -0.087890625, -0.08428955078125, -0.0806884765625, -0.07708740234375, -0.073486328125, -0.06988525390625, -0.0662841796875, -0.06268310546875, -0.05908203125, -0.05548095703125, -0.0518798828125, -0.04827880859375, -0.044677734375, -0.04107666015625, -0.0374755859375, -0.03387451171875, -0.0302734375, -0.02667236328125, -0.0230712890625, -0.01947021484375, -0.015869140625, -0.01226806640625, -0.0086669921875, -0.00506591796875, -0.00146484375, 0.00213623046875, 0.0057373046875, 0.00933837890625, 0.012939453125, 0.01654052734375, 0.0201416015625, 0.02374267578125, 0.02734375, 0.03094482421875, 0.0345458984375, 0.03814697265625, 0.041748046875, 0.04534912109375, 0.0489501953125, 0.05255126953125, 0.05615234375, 0.05975341796875, 0.0633544921875, 0.06695556640625, 0.070556640625, 0.07415771484375, 0.0777587890625, 0.08135986328125, 0.0849609375, 0.08856201171875, 0.0921630859375, 0.09576416015625, 0.099365234375, 0.10296630859375, 0.1065673828125, 0.11016845703125, 0.11376953125, 0.11737060546875, 0.1209716796875, 0.12457275390625, 0.128173828125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 1.0, 4.0, 5.0, 11.0, 12.0, 16.0, 13.0, 16.0, 12.0, 15.0, 27.0, 24.0, 32.0, 38.0, 24.0, 35.0, 37.0, 45.0, 41.0, 32.0, 39.0, 57.0, 37.0, 40.0, 38.0, 53.0, 33.0, 40.0, 30.0, 38.0, 19.0, 21.0, 13.0, 13.0, 16.0, 14.0, 16.0, 7.0, 9.0, 8.0, 3.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06890869140625, -0.066802978515625, -0.064697265625, -0.062591552734375, -0.06048583984375, -0.058380126953125, -0.0562744140625, -0.054168701171875, -0.05206298828125, -0.049957275390625, -0.0478515625, -0.045745849609375, -0.04364013671875, -0.041534423828125, -0.0394287109375, -0.037322998046875, -0.03521728515625, -0.033111572265625, -0.031005859375, -0.028900146484375, -0.02679443359375, -0.024688720703125, -0.0225830078125, -0.020477294921875, -0.01837158203125, -0.016265869140625, -0.01416015625, -0.012054443359375, -0.00994873046875, -0.007843017578125, -0.0057373046875, -0.003631591796875, -0.00152587890625, 0.000579833984375, 0.002685546875, 0.004791259765625, 0.00689697265625, 0.009002685546875, 0.0111083984375, 0.013214111328125, 0.01531982421875, 0.017425537109375, 0.01953125, 0.021636962890625, 0.02374267578125, 0.025848388671875, 0.0279541015625, 0.030059814453125, 0.03216552734375, 0.034271240234375, 0.036376953125, 0.038482666015625, 0.04058837890625, 0.042694091796875, 0.0447998046875, 0.046905517578125, 0.04901123046875, 0.051116943359375, 0.05322265625, 0.055328369140625, 0.05743408203125, 0.059539794921875, 0.0616455078125, 0.063751220703125, 0.06585693359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 2.0, 5.0, 12.0, 15.0, 23.0, 26.0, 41.0, 56.0, 67.0, 89.0, 132.0, 183.0, 295.0, 437.0, 723.0, 1151.0, 1906.0, 3566.0, 7698.0, 857903.0, 159873.0, 6520.0, 3118.0, 1715.0, 1090.0, 649.0, 380.0, 261.0, 184.0, 120.0, 76.0, 76.0, 44.0, 24.0, 32.0, 13.0, 14.0, 7.0, 7.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.29833984375, -0.2889862060546875, -0.279632568359375, -0.2702789306640625, -0.26092529296875, -0.2515716552734375, -0.242218017578125, -0.2328643798828125, -0.2235107421875, -0.2141571044921875, -0.204803466796875, -0.1954498291015625, -0.18609619140625, -0.1767425537109375, -0.167388916015625, -0.1580352783203125, -0.148681640625, -0.1393280029296875, -0.129974365234375, -0.1206207275390625, -0.11126708984375, -0.1019134521484375, -0.092559814453125, -0.0832061767578125, -0.0738525390625, -0.0644989013671875, -0.055145263671875, -0.0457916259765625, -0.03643798828125, -0.0270843505859375, -0.017730712890625, -0.0083770751953125, 0.0009765625, 0.0103302001953125, 0.019683837890625, 0.0290374755859375, 0.03839111328125, 0.0477447509765625, 0.057098388671875, 0.0664520263671875, 0.0758056640625, 0.0851593017578125, 0.094512939453125, 0.1038665771484375, 0.11322021484375, 0.1225738525390625, 0.131927490234375, 0.1412811279296875, 0.150634765625, 0.1599884033203125, 0.169342041015625, 0.1786956787109375, 0.18804931640625, 0.1974029541015625, 0.206756591796875, 0.2161102294921875, 0.2254638671875, 0.2348175048828125, 0.244171142578125, 0.2535247802734375, 0.26287841796875, 0.2722320556640625, 0.281585693359375, 0.2909393310546875, 0.30029296875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 300.0, 662.0, 13.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010645389556884766, -0.00010366085916757584, -0.00010086782276630402, -9.80747863650322e-05, -9.528174996376038e-05, -9.248871356248856e-05, -8.969567716121674e-05, -8.690264075994492e-05, -8.41096043586731e-05, -8.131656795740128e-05, -7.852353155612946e-05, -7.573049515485764e-05, -7.293745875358582e-05, -7.0144422352314e-05, -6.735138595104218e-05, -6.455834954977036e-05, -6.176531314849854e-05, -5.8972276747226715e-05, -5.6179240345954895e-05, -5.3386203944683075e-05, -5.0593167543411255e-05, -4.7800131142139435e-05, -4.5007094740867615e-05, -4.2214058339595795e-05, -3.9421021938323975e-05, -3.6627985537052155e-05, -3.3834949135780334e-05, -3.1041912734508514e-05, -2.8248876333236694e-05, -2.5455839931964874e-05, -2.2662803530693054e-05, -1.9869767129421234e-05, -1.7076730728149414e-05, -1.4283694326877594e-05, -1.1490657925605774e-05, -8.697621524333954e-06, -5.904585123062134e-06, -3.1115487217903137e-06, -3.1851232051849365e-07, 2.4745240807533264e-06, 5.2675604820251465e-06, 8.060596883296967e-06, 1.0853633284568787e-05, 1.3646669685840607e-05, 1.6439706087112427e-05, 1.9232742488384247e-05, 2.2025778889656067e-05, 2.4818815290927887e-05, 2.7611851692199707e-05, 3.0404888093471527e-05, 3.319792449474335e-05, 3.599096089601517e-05, 3.878399729728699e-05, 4.157703369855881e-05, 4.437007009983063e-05, 4.716310650110245e-05, 4.995614290237427e-05, 5.274917930364609e-05, 5.554221570491791e-05, 5.833525210618973e-05, 6.112828850746155e-05, 6.392132490873337e-05, 6.671436131000519e-05, 6.950739771127701e-05, 7.230043411254883e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 10.0, 8.0, 11.0, 10.0, 27.0, 34.0, 35.0, 73.0, 118.0, 198.0, 314.0, 638.0, 1177.0, 2333.0, 5474.0, 14816.0, 43860.0, 137376.0, 333499.0, 319222.0, 125839.0, 39971.0, 13391.0, 5267.0, 2261.0, 1114.0, 565.0, 324.0, 193.0, 127.0, 98.0, 57.0, 34.0, 17.0, 12.0, 16.0, 4.0, 7.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.0270538330078125, -0.026279926300048828, -0.025506019592285156, -0.024732112884521484, -0.023958206176757812, -0.02318429946899414, -0.02241039276123047, -0.021636486053466797, -0.020862579345703125, -0.020088672637939453, -0.01931476593017578, -0.01854085922241211, -0.017766952514648438, -0.016993045806884766, -0.016219139099121094, -0.015445232391357422, -0.01467132568359375, -0.013897418975830078, -0.013123512268066406, -0.012349605560302734, -0.011575698852539062, -0.01080179214477539, -0.010027885437011719, -0.009253978729248047, -0.008480072021484375, -0.007706165313720703, -0.006932258605957031, -0.006158351898193359, -0.0053844451904296875, -0.004610538482666016, -0.0038366317749023438, -0.003062725067138672, -0.002288818359375, -0.0015149116516113281, -0.0007410049438476562, 3.2901763916015625e-05, 0.0008068084716796875, 0.0015807151794433594, 0.0023546218872070312, 0.003128528594970703, 0.003902435302734375, 0.004676342010498047, 0.005450248718261719, 0.006224155426025391, 0.0069980621337890625, 0.007771968841552734, 0.008545875549316406, 0.009319782257080078, 0.01009368896484375, 0.010867595672607422, 0.011641502380371094, 0.012415409088134766, 0.013189315795898438, 0.01396322250366211, 0.014737129211425781, 0.015511035919189453, 0.016284942626953125, 0.017058849334716797, 0.01783275604248047, 0.01860666275024414, 0.019380569458007812, 0.020154476165771484, 0.020928382873535156, 0.021702289581298828, 0.0224761962890625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 9.0, 13.0, 15.0, 18.0, 21.0, 21.0, 38.0, 47.0, 47.0, 61.0, 56.0, 69.0, 74.0, 76.0, 88.0, 62.0, 58.0, 48.0, 35.0, 42.0, 34.0, 20.0, 11.0, 10.0, 8.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0197601318359375, -0.019195556640625, -0.0186309814453125, -0.01806640625, -0.0175018310546875, -0.016937255859375, -0.0163726806640625, -0.01580810546875, -0.0152435302734375, -0.014678955078125, -0.0141143798828125, -0.0135498046875, -0.0129852294921875, -0.012420654296875, -0.0118560791015625, -0.01129150390625, -0.0107269287109375, -0.010162353515625, -0.0095977783203125, -0.009033203125, -0.0084686279296875, -0.007904052734375, -0.0073394775390625, -0.00677490234375, -0.0062103271484375, -0.005645751953125, -0.0050811767578125, -0.0045166015625, -0.0039520263671875, -0.003387451171875, -0.0028228759765625, -0.00225830078125, -0.0016937255859375, -0.001129150390625, -0.0005645751953125, 0.0, 0.0005645751953125, 0.001129150390625, 0.0016937255859375, 0.00225830078125, 0.0028228759765625, 0.003387451171875, 0.0039520263671875, 0.0045166015625, 0.0050811767578125, 0.005645751953125, 0.0062103271484375, 0.00677490234375, 0.0073394775390625, 0.007904052734375, 0.0084686279296875, 0.009033203125, 0.0095977783203125, 0.010162353515625, 0.0107269287109375, 0.01129150390625, 0.0118560791015625, 0.012420654296875, 0.0129852294921875, 0.0135498046875, 0.0141143798828125, 0.014678955078125, 0.0152435302734375, 0.01580810546875, 0.0163726806640625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 11.0, 40.0, 218.0, 532.0, 186.0, 21.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21087102591991425, -0.1725473701953888, -0.13422369956970215, -0.0959000363945961, -0.05757637321949005, -0.019252702593803406, 0.019070953130722046, 0.0573946088552475, 0.09571827948093414, 0.1340419352054596, 0.17236560583114624, 0.21068927645683289, 0.24901293218135834, 0.2873365879058838, 0.32566025853157043, 0.3639839291572571, 0.40230756998062134, 0.440631240606308, 0.47895491123199463, 0.5172785520553589, 0.5556021928787231, 0.5939258933067322, 0.6322495341300964, 0.6705732345581055, 0.7088968753814697, 0.747220516204834, 0.785544216632843, 0.8238678574562073, 0.8621915578842163, 0.9005151987075806, 0.9388388395309448, 0.9771624803543091, 1.015486240386963, 1.0538098812103271, 1.0921335220336914, 1.1304572820663452, 1.1687809228897095, 1.2071045637130737, 1.245428204536438, 1.2837518453598022, 1.322075605392456, 1.3603992462158203, 1.3987228870391846, 1.4370466470718384, 1.4753702878952026, 1.513693928718567, 1.5520175695419312, 1.5903412103652954, 1.6286648511886597, 1.666988492012024, 1.7053121328353882, 1.743635892868042, 1.7819595336914062, 1.8202831745147705, 1.8586068153381348, 1.896930456161499, 1.9352540969848633, 1.9735777378082275, 2.011901378631592, 2.050225019454956, 2.0885486602783203, 2.1268725395202637, 2.165196180343628, 2.203519821166992, 2.2418434619903564]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 7.0, 5.0, 5.0, 15.0, 5.0, 14.0, 23.0, 13.0, 20.0, 25.0, 30.0, 36.0, 34.0, 35.0, 31.0, 36.0, 51.0, 53.0, 40.0, 58.0, 38.0, 41.0, 39.0, 46.0, 47.0, 30.0, 33.0, 27.0, 18.0, 25.0, 26.0, 17.0, 14.0, 16.0, 14.0, 11.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.22419613599777222, -0.21754124760627747, -0.21088634431362152, -0.20423145592212677, -0.19757655262947083, -0.19092166423797607, -0.18426677584648132, -0.17761188745498657, -0.17095698416233063, -0.16430209577083588, -0.15764719247817993, -0.15099230408668518, -0.14433741569519043, -0.13768251240253448, -0.13102762401103973, -0.12437272816896439, -0.11771783232688904, -0.11106293648481369, -0.10440804064273834, -0.09775315225124359, -0.09109825640916824, -0.0844433605670929, -0.07778847217559814, -0.0711335763335228, -0.06447868049144745, -0.0578237846493721, -0.05116889253258705, -0.044514000415802, -0.037859104573726654, -0.031204208731651306, -0.024549316614866257, -0.017894424498081207, -0.01123952865600586, -0.004584634676575661, 0.002070259302854538, 0.008725153282284737, 0.015380047261714935, 0.022034943103790283, 0.028689835220575333, 0.03534472733736038, 0.04199962317943573, 0.04865451902151108, 0.05530941113829613, 0.06196430325508118, 0.06861919909715652, 0.07527409493923187, 0.08192898333072662, 0.08858387917280197, 0.09523877501487732, 0.10189367085695267, 0.10854856669902802, 0.11520345509052277, 0.12185835093259811, 0.12851324677467346, 0.1351681351661682, 0.14182302355766296, 0.1484779268503189, 0.15513281524181366, 0.1617877185344696, 0.16844260692596436, 0.1750974953174591, 0.18175239861011505, 0.1884072870016098, 0.19506219029426575, 0.2017170786857605]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 9.0, 10.0, 11.0, 12.0, 17.0, 20.0, 28.0, 42.0, 53.0, 114.0, 125.0, 225.0, 404.0, 838.0, 2309.0, 10838.0, 186219.0, 3847993.0, 132626.0, 8714.0, 1980.0, 727.0, 369.0, 196.0, 120.0, 72.0, 61.0, 51.0, 30.0, 24.0, 15.0, 5.0, 11.0, 3.0, 5.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1552734375, -0.1510143280029297, -0.14675521850585938, -0.14249610900878906, -0.13823699951171875, -0.13397789001464844, -0.12971878051757812, -0.1254596710205078, -0.1212005615234375, -0.11694145202636719, -0.11268234252929688, -0.10842323303222656, -0.10416412353515625, -0.09990501403808594, -0.09564590454101562, -0.09138679504394531, -0.087127685546875, -0.08286857604980469, -0.07860946655273438, -0.07435035705566406, -0.07009124755859375, -0.06583213806152344, -0.061573028564453125, -0.05731391906738281, -0.0530548095703125, -0.04879570007324219, -0.044536590576171875, -0.04027748107910156, -0.03601837158203125, -0.03175926208496094, -0.027500152587890625, -0.023241043090820312, -0.01898193359375, -0.014722824096679688, -0.010463714599609375, -0.0062046051025390625, -0.00194549560546875, 0.0023136138916015625, 0.006572723388671875, 0.010831832885742188, 0.0150909423828125, 0.019350051879882812, 0.023609161376953125, 0.027868270874023438, 0.03212738037109375, 0.03638648986816406, 0.040645599365234375, 0.04490470886230469, 0.049163818359375, 0.05342292785644531, 0.057682037353515625, 0.06194114685058594, 0.06620025634765625, 0.07045936584472656, 0.07471847534179688, 0.07897758483886719, 0.0832366943359375, 0.08749580383300781, 0.09175491333007812, 0.09601402282714844, 0.10027313232421875, 0.10453224182128906, 0.10879135131835938, 0.11305046081542969, 0.1173095703125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 8.0, 5.0, 10.0, 8.0, 12.0, 17.0, 29.0, 28.0, 30.0, 35.0, 55.0, 49.0, 57.0, 68.0, 44.0, 73.0, 66.0, 57.0, 58.0, 53.0, 54.0, 34.0, 40.0, 23.0, 23.0, 21.0, 21.0, 12.0, 5.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038055419921875, -0.03687763214111328, -0.03569984436035156, -0.034522056579589844, -0.033344268798828125, -0.032166481018066406, -0.030988693237304688, -0.02981090545654297, -0.02863311767578125, -0.02745532989501953, -0.026277542114257812, -0.025099754333496094, -0.023921966552734375, -0.022744178771972656, -0.021566390991210938, -0.02038860321044922, -0.0192108154296875, -0.01803302764892578, -0.016855239868164062, -0.015677452087402344, -0.014499664306640625, -0.013321876525878906, -0.012144088745117188, -0.010966300964355469, -0.00978851318359375, -0.008610725402832031, -0.0074329376220703125, -0.006255149841308594, -0.005077362060546875, -0.0038995742797851562, -0.0027217864990234375, -0.0015439987182617188, -0.0003662109375, 0.0008115768432617188, 0.0019893646240234375, 0.0031671524047851562, 0.004344940185546875, 0.005522727966308594, 0.0067005157470703125, 0.007878303527832031, 0.00905609130859375, 0.010233879089355469, 0.011411666870117188, 0.012589454650878906, 0.013767242431640625, 0.014945030212402344, 0.016122817993164062, 0.01730060577392578, 0.0184783935546875, 0.01965618133544922, 0.020833969116210938, 0.022011756896972656, 0.023189544677734375, 0.024367332458496094, 0.025545120239257812, 0.02672290802001953, 0.02790069580078125, 0.02907848358154297, 0.030256271362304688, 0.031434059143066406, 0.032611846923828125, 0.033789634704589844, 0.03496742248535156, 0.03614521026611328, 0.037322998046875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 3.0, 13.0, 15.0, 18.0, 47.0, 55.0, 96.0, 123.0, 307.0, 763.0, 2426.0, 14021.0, 374836.0, 3677913.0, 113440.0, 7427.0, 1555.0, 564.0, 295.0, 124.0, 82.0, 48.0, 31.0, 24.0, 13.0, 10.0, 7.0, 1.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.14697265625, -0.1419658660888672, -0.13695907592773438, -0.13195228576660156, -0.12694549560546875, -0.12193870544433594, -0.11693191528320312, -0.11192512512207031, -0.1069183349609375, -0.10191154479980469, -0.09690475463867188, -0.09189796447753906, -0.08689117431640625, -0.08188438415527344, -0.07687759399414062, -0.07187080383300781, -0.066864013671875, -0.06185722351074219, -0.056850433349609375, -0.05184364318847656, -0.04683685302734375, -0.04183006286621094, -0.036823272705078125, -0.03181648254394531, -0.0268096923828125, -0.021802902221679688, -0.016796112060546875, -0.011789321899414062, -0.00678253173828125, -0.0017757415771484375, 0.003231048583984375, 0.008237838745117188, 0.01324462890625, 0.018251419067382812, 0.023258209228515625, 0.028264999389648438, 0.03327178955078125, 0.03827857971191406, 0.043285369873046875, 0.04829216003417969, 0.0532989501953125, 0.05830574035644531, 0.06331253051757812, 0.06831932067871094, 0.07332611083984375, 0.07833290100097656, 0.08333969116210938, 0.08834648132324219, 0.093353271484375, 0.09836006164550781, 0.10336685180664062, 0.10837364196777344, 0.11338043212890625, 0.11838722229003906, 0.12339401245117188, 0.1284008026123047, 0.1334075927734375, 0.1384143829345703, 0.14342117309570312, 0.14842796325683594, 0.15343475341796875, 0.15844154357910156, 0.16344833374023438, 0.1684551239013672, 0.1734619140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 8.0, 17.0, 17.0, 28.0, 40.0, 60.0, 76.0, 152.0, 230.0, 409.0, 660.0, 749.0, 608.0, 339.0, 255.0, 142.0, 79.0, 64.0, 37.0, 31.0, 21.0, 16.0, 9.0, 9.0, 7.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0858154296875, -0.08345890045166016, -0.08110237121582031, -0.07874584197998047, -0.07638931274414062, -0.07403278350830078, -0.07167625427246094, -0.0693197250366211, -0.06696319580078125, -0.0646066665649414, -0.06225013732910156, -0.05989360809326172, -0.057537078857421875, -0.05518054962158203, -0.05282402038574219, -0.050467491149902344, -0.0481109619140625, -0.045754432678222656, -0.04339790344238281, -0.04104137420654297, -0.038684844970703125, -0.03632831573486328, -0.03397178649902344, -0.031615257263183594, -0.02925872802734375, -0.026902198791503906, -0.024545669555664062, -0.02218914031982422, -0.019832611083984375, -0.01747608184814453, -0.015119552612304688, -0.012763023376464844, -0.010406494140625, -0.008049964904785156, -0.0056934356689453125, -0.0033369064331054688, -0.000980377197265625, 0.0013761520385742188, 0.0037326812744140625, 0.006089210510253906, 0.00844573974609375, 0.010802268981933594, 0.013158798217773438, 0.015515327453613281, 0.017871856689453125, 0.02022838592529297, 0.022584915161132812, 0.024941444396972656, 0.0272979736328125, 0.029654502868652344, 0.03201103210449219, 0.03436756134033203, 0.036724090576171875, 0.03908061981201172, 0.04143714904785156, 0.043793678283691406, 0.04615020751953125, 0.048506736755371094, 0.05086326599121094, 0.05321979522705078, 0.055576324462890625, 0.05793285369873047, 0.06028938293457031, 0.06264591217041016, 0.06500244140625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 20.0, 100.0, 429.0, 369.0, 66.0, 18.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5949653387069702, -1.5608994960784912, -1.5268336534500122, -1.4927678108215332, -1.4587019681930542, -1.4246361255645752, -1.3905702829360962, -1.3565044403076172, -1.3224385976791382, -1.2883727550506592, -1.2543069124221802, -1.2202410697937012, -1.1861752271652222, -1.1521093845367432, -1.1180435419082642, -1.0839776992797852, -1.0499117374420166, -1.0158458948135376, -0.9817800521850586, -0.9477142095565796, -0.9136483669281006, -0.8795825242996216, -0.8455166816711426, -0.8114508390426636, -0.7773849964141846, -0.7433191537857056, -0.7092533111572266, -0.6751874685287476, -0.6411216259002686, -0.6070557832717896, -0.5729899406433105, -0.5389240980148315, -0.5048581957817078, -0.47079235315322876, -0.43672651052474976, -0.40266066789627075, -0.36859482526779175, -0.33452898263931274, -0.30046311020851135, -0.26639726758003235, -0.23233142495155334, -0.19826558232307434, -0.16419973969459534, -0.13013388216495514, -0.09606803953647614, -0.06200219690799713, -0.027936339378356934, 0.00612950325012207, 0.040195345878601074, 0.07426118850708008, 0.10832703858613968, 0.14239288866519928, 0.17645873129367828, 0.2105245739221573, 0.24459043145179749, 0.2786562740802765, 0.3127221167087555, 0.3467879593372345, 0.3808538019657135, 0.4149196743965149, 0.4489855170249939, 0.4830513596534729, 0.5171172022819519, 0.5511830449104309, 0.5852488875389099]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 8.0, 7.0, 8.0, 15.0, 15.0, 24.0, 17.0, 22.0, 24.0, 31.0, 35.0, 22.0, 28.0, 39.0, 40.0, 34.0, 39.0, 52.0, 51.0, 46.0, 46.0, 52.0, 37.0, 38.0, 16.0, 35.0, 27.0, 25.0, 27.0, 20.0, 16.0, 12.0, 17.0, 10.0, 9.0, 13.0, 10.0, 7.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1805064082145691, -0.17507806420326233, -0.16964973509311676, -0.16422139108181, -0.15879304707050323, -0.15336471796035767, -0.1479363739490509, -0.14250802993774414, -0.13707968592643738, -0.13165134191513062, -0.12622301280498505, -0.12079466879367828, -0.11536632478237152, -0.10993798822164536, -0.10450965166091919, -0.09908130764961243, -0.09365297853946686, -0.08822464197874069, -0.08279629796743393, -0.07736796140670776, -0.071939617395401, -0.06651128083467484, -0.06108294427394867, -0.055654603987932205, -0.05022626370191574, -0.04479792341589928, -0.03936958312988281, -0.03394124656915665, -0.028512906283140182, -0.023084565997123718, -0.017656229436397552, -0.012227889150381088, -0.006799548864364624, -0.0013712095096707344, 0.004057129845023155, 0.00948546826839447, 0.014913808554410934, 0.0203421488404274, 0.025770485401153564, 0.03119882568717003, 0.03662716597318649, 0.04205550625920296, 0.04748384654521942, 0.05291218310594559, 0.05834052339196205, 0.06376886367797852, 0.06919720023870468, 0.07462553679943085, 0.08005388081073761, 0.08548221737146378, 0.09091056138277054, 0.0963388979434967, 0.10176724195480347, 0.10719557851552963, 0.1126239150762558, 0.11805225908756256, 0.12348059564828873, 0.1289089322090149, 0.13433727622032166, 0.13976562023162842, 0.145193949341774, 0.15062229335308075, 0.15605062246322632, 0.16147896647453308, 0.16690731048583984]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 4.0, 10.0, 10.0, 14.0, 21.0, 12.0, 39.0, 47.0, 41.0, 47.0, 68.0, 88.0, 126.0, 230.0, 351.0, 562.0, 988.0, 1675.0, 3372.0, 6248.0, 13041.0, 28412.0, 65734.0, 154638.0, 293277.0, 258692.0, 123124.0, 52367.0, 23099.0, 10691.0, 5274.0, 2673.0, 1388.0, 796.0, 460.0, 279.0, 168.0, 118.0, 82.0, 58.0, 46.0, 39.0, 34.0, 12.0, 34.0, 11.0, 12.0, 13.0, 4.0, 5.0, 9.0, 4.0, 2.0, 3.0, 4.0, 1.0], "bins": [-0.06390380859375, -0.061959266662597656, -0.06001472473144531, -0.05807018280029297, -0.056125640869140625, -0.05418109893798828, -0.05223655700683594, -0.050292015075683594, -0.04834747314453125, -0.046402931213378906, -0.04445838928222656, -0.04251384735107422, -0.040569305419921875, -0.03862476348876953, -0.03668022155761719, -0.034735679626464844, -0.0327911376953125, -0.030846595764160156, -0.028902053833007812, -0.02695751190185547, -0.025012969970703125, -0.02306842803955078, -0.021123886108398438, -0.019179344177246094, -0.01723480224609375, -0.015290260314941406, -0.013345718383789062, -0.011401176452636719, -0.009456634521484375, -0.007512092590332031, -0.0055675506591796875, -0.0036230087280273438, -0.001678466796875, 0.00026607513427734375, 0.0022106170654296875, 0.004155158996582031, 0.006099700927734375, 0.008044242858886719, 0.009988784790039062, 0.011933326721191406, 0.01387786865234375, 0.015822410583496094, 0.017766952514648438, 0.01971149444580078, 0.021656036376953125, 0.02360057830810547, 0.025545120239257812, 0.027489662170410156, 0.0294342041015625, 0.031378746032714844, 0.03332328796386719, 0.03526782989501953, 0.037212371826171875, 0.03915691375732422, 0.04110145568847656, 0.043045997619628906, 0.04499053955078125, 0.046935081481933594, 0.04887962341308594, 0.05082416534423828, 0.052768707275390625, 0.05471324920654297, 0.05665779113769531, 0.058602333068847656, 0.060546875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 4.0, 9.0, 7.0, 14.0, 17.0, 20.0, 21.0, 38.0, 52.0, 57.0, 87.0, 92.0, 84.0, 77.0, 65.0, 85.0, 64.0, 52.0, 44.0, 39.0, 37.0, 12.0, 10.0, 12.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045013427734375, -0.043608665466308594, -0.04220390319824219, -0.04079914093017578, -0.039394378662109375, -0.03798961639404297, -0.03658485412597656, -0.035180091857910156, -0.03377532958984375, -0.032370567321777344, -0.030965805053710938, -0.02956104278564453, -0.028156280517578125, -0.02675151824951172, -0.025346755981445312, -0.023941993713378906, -0.0225372314453125, -0.021132469177246094, -0.019727706909179688, -0.01832294464111328, -0.016918182373046875, -0.015513420104980469, -0.014108657836914062, -0.012703895568847656, -0.01129913330078125, -0.009894371032714844, -0.008489608764648438, -0.007084846496582031, -0.005680084228515625, -0.004275321960449219, -0.0028705596923828125, -0.0014657974243164062, -6.103515625e-05, 0.0013437271118164062, 0.0027484893798828125, 0.004153251647949219, 0.005558013916015625, 0.006962776184082031, 0.008367538452148438, 0.009772300720214844, 0.01117706298828125, 0.012581825256347656, 0.013986587524414062, 0.015391349792480469, 0.016796112060546875, 0.01820087432861328, 0.019605636596679688, 0.021010398864746094, 0.0224151611328125, 0.023819923400878906, 0.025224685668945312, 0.02662944793701172, 0.028034210205078125, 0.02943897247314453, 0.030843734741210938, 0.032248497009277344, 0.03365325927734375, 0.035058021545410156, 0.03646278381347656, 0.03786754608154297, 0.039272308349609375, 0.04067707061767578, 0.04208183288574219, 0.043486595153808594, 0.044891357421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 6.0, 11.0, 15.0, 17.0, 26.0, 36.0, 38.0, 41.0, 56.0, 69.0, 131.0, 148.0, 286.0, 579.0, 1224.0, 3257.0, 11199.0, 49500.0, 285893.0, 550537.0, 112980.0, 22731.0, 5935.0, 1909.0, 789.0, 388.0, 215.0, 138.0, 99.0, 75.0, 49.0, 33.0, 32.0, 24.0, 16.0, 22.0, 14.0, 9.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1168212890625, -0.11295890808105469, -0.10909652709960938, -0.10523414611816406, -0.10137176513671875, -0.09750938415527344, -0.09364700317382812, -0.08978462219238281, -0.0859222412109375, -0.08205986022949219, -0.07819747924804688, -0.07433509826660156, -0.07047271728515625, -0.06661033630371094, -0.06274795532226562, -0.05888557434082031, -0.055023193359375, -0.05116081237792969, -0.047298431396484375, -0.04343605041503906, -0.03957366943359375, -0.03571128845214844, -0.031848907470703125, -0.027986526489257812, -0.0241241455078125, -0.020261764526367188, -0.016399383544921875, -0.012537002563476562, -0.00867462158203125, -0.0048122406005859375, -0.000949859619140625, 0.0029125213623046875, 0.00677490234375, 0.010637283325195312, 0.014499664306640625, 0.018362045288085938, 0.02222442626953125, 0.026086807250976562, 0.029949188232421875, 0.03381156921386719, 0.0376739501953125, 0.04153633117675781, 0.045398712158203125, 0.04926109313964844, 0.05312347412109375, 0.05698585510253906, 0.060848236083984375, 0.06471061706542969, 0.068572998046875, 0.07243537902832031, 0.07629776000976562, 0.08016014099121094, 0.08402252197265625, 0.08788490295410156, 0.09174728393554688, 0.09560966491699219, 0.0994720458984375, 0.10333442687988281, 0.10719680786132812, 0.11105918884277344, 0.11492156982421875, 0.11878395080566406, 0.12264633178710938, 0.1265087127685547, 0.13037109375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 10.0, 6.0, 14.0, 7.0, 11.0, 24.0, 11.0, 11.0, 20.0, 22.0, 23.0, 26.0, 33.0, 32.0, 37.0, 45.0, 43.0, 49.0, 52.0, 49.0, 36.0, 36.0, 36.0, 35.0, 40.0, 29.0, 30.0, 26.0, 35.0, 21.0, 15.0, 15.0, 20.0, 15.0, 23.0, 16.0, 7.0, 12.0, 8.0, 3.0, 7.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.07476806640625, -0.07256507873535156, -0.07036209106445312, -0.06815910339355469, -0.06595611572265625, -0.06375312805175781, -0.061550140380859375, -0.05934715270996094, -0.0571441650390625, -0.05494117736816406, -0.052738189697265625, -0.05053520202636719, -0.04833221435546875, -0.04612922668457031, -0.043926239013671875, -0.04172325134277344, -0.039520263671875, -0.03731727600097656, -0.035114288330078125, -0.03291130065917969, -0.03070831298828125, -0.028505325317382812, -0.026302337646484375, -0.024099349975585938, -0.0218963623046875, -0.019693374633789062, -0.017490386962890625, -0.015287399291992188, -0.01308441162109375, -0.010881423950195312, -0.008678436279296875, -0.0064754486083984375, -0.0042724609375, -0.0020694732666015625, 0.000133514404296875, 0.0023365020751953125, 0.00453948974609375, 0.0067424774169921875, 0.008945465087890625, 0.011148452758789062, 0.0133514404296875, 0.015554428100585938, 0.017757415771484375, 0.019960403442382812, 0.02216339111328125, 0.024366378784179688, 0.026569366455078125, 0.028772354125976562, 0.030975341796875, 0.03317832946777344, 0.035381317138671875, 0.03758430480957031, 0.03978729248046875, 0.04199028015136719, 0.044193267822265625, 0.04639625549316406, 0.0485992431640625, 0.05080223083496094, 0.053005218505859375, 0.05520820617675781, 0.05741119384765625, 0.05961418151855469, 0.061817169189453125, 0.06402015686035156, 0.06622314453125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 7.0, 5.0, 5.0, 9.0, 7.0, 11.0, 20.0, 25.0, 34.0, 58.0, 55.0, 135.0, 186.0, 350.0, 510.0, 942.0, 1911.0, 4242.0, 12622.0, 43787.0, 156110.0, 385671.0, 302421.0, 97884.0, 26795.0, 8256.0, 3168.0, 1395.0, 706.0, 399.0, 276.0, 189.0, 124.0, 76.0, 38.0, 46.0, 13.0, 15.0, 16.0, 13.0, 5.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0243682861328125, -0.023625612258911133, -0.022882938385009766, -0.0221402645111084, -0.02139759063720703, -0.020654916763305664, -0.019912242889404297, -0.01916956901550293, -0.018426895141601562, -0.017684221267700195, -0.016941547393798828, -0.01619887351989746, -0.015456199645996094, -0.014713525772094727, -0.01397085189819336, -0.013228178024291992, -0.012485504150390625, -0.011742830276489258, -0.01100015640258789, -0.010257482528686523, -0.009514808654785156, -0.008772134780883789, -0.008029460906982422, -0.007286787033081055, -0.0065441131591796875, -0.00580143928527832, -0.005058765411376953, -0.004316091537475586, -0.0035734176635742188, -0.0028307437896728516, -0.0020880699157714844, -0.0013453960418701172, -0.00060272216796875, 0.0001399517059326172, 0.0008826255798339844, 0.0016252994537353516, 0.0023679733276367188, 0.003110647201538086, 0.003853321075439453, 0.00459599494934082, 0.0053386688232421875, 0.006081342697143555, 0.006824016571044922, 0.007566690444946289, 0.008309364318847656, 0.009052038192749023, 0.00979471206665039, 0.010537385940551758, 0.011280059814453125, 0.012022733688354492, 0.01276540756225586, 0.013508081436157227, 0.014250755310058594, 0.014993429183959961, 0.015736103057861328, 0.016478776931762695, 0.017221450805664062, 0.01796412467956543, 0.018706798553466797, 0.019449472427368164, 0.02019214630126953, 0.0209348201751709, 0.021677494049072266, 0.022420167922973633, 0.023162841796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 7.0, 3.0, 8.0, 16.0, 6.0, 13.0, 10.0, 15.0, 30.0, 33.0, 22.0, 68.0, 51.0, 78.0, 46.0, 50.0, 75.0, 56.0, 99.0, 50.0, 44.0, 59.0, 31.0, 36.0, 24.0, 20.0, 15.0, 8.0, 11.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0531158447265625e-06, -3.910623490810394e-06, -3.768131136894226e-06, -3.625638782978058e-06, -3.4831464290618896e-06, -3.3406540751457214e-06, -3.1981617212295532e-06, -3.055669367313385e-06, -2.913177013397217e-06, -2.7706846594810486e-06, -2.6281923055648804e-06, -2.485699951648712e-06, -2.343207597732544e-06, -2.2007152438163757e-06, -2.0582228899002075e-06, -1.9157305359840393e-06, -1.773238182067871e-06, -1.6307458281517029e-06, -1.4882534742355347e-06, -1.3457611203193665e-06, -1.2032687664031982e-06, -1.06077641248703e-06, -9.182840585708618e-07, -7.757917046546936e-07, -6.332993507385254e-07, -4.908069968223572e-07, -3.4831464290618896e-07, -2.0582228899002075e-07, -6.332993507385254e-08, 7.916241884231567e-08, 2.2165477275848389e-07, 3.641471266746521e-07, 5.066394805908203e-07, 6.491318345069885e-07, 7.916241884231567e-07, 9.34116542339325e-07, 1.0766088962554932e-06, 1.2191012501716614e-06, 1.3615936040878296e-06, 1.5040859580039978e-06, 1.646578311920166e-06, 1.7890706658363342e-06, 1.9315630197525024e-06, 2.0740553736686707e-06, 2.216547727584839e-06, 2.359040081501007e-06, 2.5015324354171753e-06, 2.6440247893333435e-06, 2.7865171432495117e-06, 2.92900949716568e-06, 3.071501851081848e-06, 3.2139942049980164e-06, 3.3564865589141846e-06, 3.4989789128303528e-06, 3.641471266746521e-06, 3.783963620662689e-06, 3.926455974578857e-06, 4.068948328495026e-06, 4.211440682411194e-06, 4.353933036327362e-06, 4.49642539024353e-06, 4.6389177441596985e-06, 4.781410098075867e-06, 4.923902451992035e-06, 5.066394805908203e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 8.0, 9.0, 15.0, 25.0, 33.0, 57.0, 86.0, 148.0, 245.0, 516.0, 955.0, 2313.0, 7182.0, 33489.0, 193895.0, 514409.0, 239087.0, 42518.0, 8571.0, 2599.0, 1119.0, 569.0, 292.0, 170.0, 82.0, 55.0, 38.0, 22.0, 18.0, 10.0, 9.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0229644775390625, -0.021990060806274414, -0.021015644073486328, -0.020041227340698242, -0.019066810607910156, -0.01809239387512207, -0.017117977142333984, -0.0161435604095459, -0.015169143676757812, -0.014194726943969727, -0.01322031021118164, -0.012245893478393555, -0.011271476745605469, -0.010297060012817383, -0.009322643280029297, -0.008348226547241211, -0.007373809814453125, -0.006399393081665039, -0.005424976348876953, -0.004450559616088867, -0.0034761428833007812, -0.0025017261505126953, -0.0015273094177246094, -0.0005528926849365234, 0.0004215240478515625, 0.0013959407806396484, 0.0023703575134277344, 0.0033447742462158203, 0.004319190979003906, 0.005293607711791992, 0.006268024444580078, 0.007242441177368164, 0.00821685791015625, 0.009191274642944336, 0.010165691375732422, 0.011140108108520508, 0.012114524841308594, 0.01308894157409668, 0.014063358306884766, 0.015037775039672852, 0.016012191772460938, 0.016986608505249023, 0.01796102523803711, 0.018935441970825195, 0.01990985870361328, 0.020884275436401367, 0.021858692169189453, 0.02283310890197754, 0.023807525634765625, 0.02478194236755371, 0.025756359100341797, 0.026730775833129883, 0.02770519256591797, 0.028679609298706055, 0.02965402603149414, 0.030628442764282227, 0.03160285949707031, 0.0325772762298584, 0.033551692962646484, 0.03452610969543457, 0.035500526428222656, 0.03647494316101074, 0.03744935989379883, 0.038423776626586914, 0.039398193359375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 1.0, 7.0, 9.0, 10.0, 6.0, 10.0, 12.0, 15.0, 23.0, 28.0, 40.0, 50.0, 49.0, 43.0, 42.0, 45.0, 36.0, 60.0, 36.0, 42.0, 56.0, 58.0, 39.0, 43.0, 36.0, 41.0, 34.0, 25.0, 16.0, 16.0, 18.0, 12.0, 10.0, 6.0, 9.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.0140533447265625, -0.013672590255737305, -0.01329183578491211, -0.012911081314086914, -0.012530326843261719, -0.012149572372436523, -0.011768817901611328, -0.011388063430786133, -0.011007308959960938, -0.010626554489135742, -0.010245800018310547, -0.009865045547485352, -0.009484291076660156, -0.009103536605834961, -0.008722782135009766, -0.00834202766418457, -0.007961273193359375, -0.00758051872253418, -0.007199764251708984, -0.006819009780883789, -0.006438255310058594, -0.0060575008392333984, -0.005676746368408203, -0.005295991897583008, -0.0049152374267578125, -0.004534482955932617, -0.004153728485107422, -0.0037729740142822266, -0.0033922195434570312, -0.003011465072631836, -0.0026307106018066406, -0.0022499561309814453, -0.00186920166015625, -0.0014884471893310547, -0.0011076927185058594, -0.0007269382476806641, -0.00034618377685546875, 3.457069396972656e-05, 0.0004153251647949219, 0.0007960796356201172, 0.0011768341064453125, 0.0015575885772705078, 0.0019383430480957031, 0.0023190975189208984, 0.0026998519897460938, 0.003080606460571289, 0.0034613609313964844, 0.0038421154022216797, 0.004222869873046875, 0.00460362434387207, 0.004984378814697266, 0.005365133285522461, 0.005745887756347656, 0.0061266422271728516, 0.006507396697998047, 0.006888151168823242, 0.0072689056396484375, 0.007649660110473633, 0.008030414581298828, 0.008411169052124023, 0.008791923522949219, 0.009172677993774414, 0.00955343246459961, 0.009934186935424805, 0.01031494140625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 12.0, 28.0, 109.0, 301.0, 394.0, 112.0, 34.0, 14.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5458758473396301, -0.5212050676345825, -0.4965343177318573, -0.4718635678291321, -0.4471927881240845, -0.42252200841903687, -0.39785125851631165, -0.3731805086135864, -0.3485097289085388, -0.3238389492034912, -0.299168199300766, -0.27449744939804077, -0.24982666969299316, -0.22515590488910675, -0.20048514008522034, -0.17581437528133392, -0.1511436104774475, -0.1264728456735611, -0.10180208086967468, -0.07713131606578827, -0.052460551261901855, -0.027789786458015442, -0.0031190216541290283, 0.021551743149757385, 0.0462225079536438, 0.07089327275753021, 0.09556403756141663, 0.12023480236530304, 0.14490556716918945, 0.16957633197307587, 0.19424709677696228, 0.2189178615808487, 0.24358856678009033, 0.26825934648513794, 0.29293009638786316, 0.3176008462905884, 0.342271625995636, 0.3669424057006836, 0.3916131556034088, 0.41628390550613403, 0.44095468521118164, 0.46562546491622925, 0.49029621481895447, 0.5149669647216797, 0.5396377444267273, 0.5643085241317749, 0.5889792442321777, 0.6136500239372253, 0.638320803642273, 0.6629915833473206, 0.6876623630523682, 0.712333083152771, 0.7370038628578186, 0.7616746425628662, 0.786345362663269, 0.8110161423683167, 0.8356869220733643, 0.8603577017784119, 0.8850284814834595, 0.9096992015838623, 0.9343699812889099, 0.9590407609939575, 0.9837114810943604, 1.0083823204040527, 1.0330530405044556]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 11.0, 15.0, 17.0, 14.0, 18.0, 27.0, 29.0, 37.0, 31.0, 40.0, 50.0, 46.0, 43.0, 57.0, 38.0, 60.0, 61.0, 49.0, 42.0, 53.0, 40.0, 27.0, 38.0, 30.0, 29.0, 25.0, 19.0, 12.0, 6.0, 9.0, 5.0, 7.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2855696678161621, -0.27587059140205383, -0.26617148518562317, -0.2564724087715149, -0.24677333235740662, -0.23707424104213715, -0.22737514972686768, -0.2176760733127594, -0.20797699689865112, -0.19827790558338165, -0.18857882916927338, -0.1788797378540039, -0.16918066143989563, -0.15948157012462616, -0.1497824788093567, -0.1400834023952484, -0.13038431107997894, -0.12068522721529007, -0.1109861433506012, -0.10128705203533173, -0.09158797562122345, -0.08188888430595398, -0.0721898004412651, -0.06249071657657623, -0.05279163271188736, -0.043092548847198486, -0.03339346498250961, -0.02369437739253044, -0.013995293527841568, -0.004296209663152695, 0.005402877926826477, 0.01510196179151535, 0.024801045656204224, 0.0345001295208931, 0.04419921338558197, 0.05389830097556114, 0.06359738111495972, 0.07329647243022919, 0.08299555629491806, 0.09269464015960693, 0.1023937240242958, 0.11209280788898468, 0.12179189175367355, 0.13149097561836243, 0.1411900669336319, 0.15088914334774017, 0.16058823466300964, 0.17028731107711792, 0.1799864023923874, 0.18968549370765686, 0.19938457012176514, 0.2090836614370346, 0.21878273785114288, 0.22848182916641235, 0.23818090558052063, 0.2478799968957901, 0.25757908821105957, 0.26727816462516785, 0.2769772708415985, 0.2866763472557068, 0.29637542366981506, 0.30607450008392334, 0.315773606300354, 0.3254726827144623, 0.33517175912857056]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0, 4.0, 5.0, 10.0, 13.0, 14.0, 27.0, 34.0, 53.0, 93.0, 185.0, 412.0, 998.0, 3161.0, 14689.0, 175436.0, 3782352.0, 196436.0, 15479.0, 3149.0, 1007.0, 372.0, 130.0, 76.0, 48.0, 25.0, 17.0, 22.0, 14.0, 7.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1492919921875, -0.14496612548828125, -0.1406402587890625, -0.13631439208984375, -0.131988525390625, -0.12766265869140625, -0.1233367919921875, -0.11901092529296875, -0.11468505859375, -0.11035919189453125, -0.1060333251953125, -0.10170745849609375, -0.097381591796875, -0.09305572509765625, -0.0887298583984375, -0.08440399169921875, -0.080078125, -0.07575225830078125, -0.0714263916015625, -0.06710052490234375, -0.062774658203125, -0.05844879150390625, -0.0541229248046875, -0.04979705810546875, -0.04547119140625, -0.04114532470703125, -0.0368194580078125, -0.03249359130859375, -0.028167724609375, -0.02384185791015625, -0.0195159912109375, -0.01519012451171875, -0.0108642578125, -0.00653839111328125, -0.0022125244140625, 0.00211334228515625, 0.006439208984375, 0.01076507568359375, 0.0150909423828125, 0.01941680908203125, 0.02374267578125, 0.02806854248046875, 0.0323944091796875, 0.03672027587890625, 0.041046142578125, 0.04537200927734375, 0.0496978759765625, 0.05402374267578125, 0.058349609375, 0.06267547607421875, 0.0670013427734375, 0.07132720947265625, 0.075653076171875, 0.07997894287109375, 0.0843048095703125, 0.08863067626953125, 0.09295654296875, 0.09728240966796875, 0.1016082763671875, 0.10593414306640625, 0.110260009765625, 0.11458587646484375, 0.1189117431640625, 0.12323760986328125, 0.1275634765625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 7.0, 5.0, 13.0, 12.0, 20.0, 16.0, 29.0, 31.0, 49.0, 44.0, 51.0, 51.0, 68.0, 64.0, 70.0, 62.0, 53.0, 47.0, 54.0, 47.0, 51.0, 31.0, 31.0, 17.0, 23.0, 12.0, 8.0, 11.0, 9.0, 4.0, 2.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043914794921875, -0.04267692565917969, -0.041439056396484375, -0.04020118713378906, -0.03896331787109375, -0.03772544860839844, -0.036487579345703125, -0.03524971008300781, -0.0340118408203125, -0.03277397155761719, -0.031536102294921875, -0.030298233032226562, -0.02906036376953125, -0.027822494506835938, -0.026584625244140625, -0.025346755981445312, -0.02410888671875, -0.022871017456054688, -0.021633148193359375, -0.020395278930664062, -0.01915740966796875, -0.017919540405273438, -0.016681671142578125, -0.015443801879882812, -0.0142059326171875, -0.012968063354492188, -0.011730194091796875, -0.010492324829101562, -0.00925445556640625, -0.008016586303710938, -0.006778717041015625, -0.0055408477783203125, -0.004302978515625, -0.0030651092529296875, -0.001827239990234375, -0.0005893707275390625, 0.00064849853515625, 0.0018863677978515625, 0.003124237060546875, 0.0043621063232421875, 0.0055999755859375, 0.0068378448486328125, 0.008075714111328125, 0.009313583374023438, 0.01055145263671875, 0.011789321899414062, 0.013027191162109375, 0.014265060424804688, 0.0155029296875, 0.016740798950195312, 0.017978668212890625, 0.019216537475585938, 0.02045440673828125, 0.021692276000976562, 0.022930145263671875, 0.024168014526367188, 0.0254058837890625, 0.026643753051757812, 0.027881622314453125, 0.029119491577148438, 0.03035736083984375, 0.03159523010253906, 0.032833099365234375, 0.03407096862792969, 0.035308837890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 3.0, 7.0, 7.0, 27.0, 58.0, 82.0, 215.0, 613.0, 3166.0, 1169800.0, 3015084.0, 4078.0, 674.0, 255.0, 109.0, 49.0, 23.0, 11.0, 9.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.340576171875, -0.3279838562011719, -0.31539154052734375, -0.3027992248535156, -0.2902069091796875, -0.2776145935058594, -0.26502227783203125, -0.2524299621582031, -0.239837646484375, -0.22724533081054688, -0.21465301513671875, -0.20206069946289062, -0.1894683837890625, -0.17687606811523438, -0.16428375244140625, -0.15169143676757812, -0.13909912109375, -0.12650680541992188, -0.11391448974609375, -0.10132217407226562, -0.0887298583984375, -0.07613754272460938, -0.06354522705078125, -0.050952911376953125, -0.038360595703125, -0.025768280029296875, -0.01317596435546875, -0.000583648681640625, 0.0120086669921875, 0.024600982666015625, 0.03719329833984375, 0.049785614013671875, 0.0623779296875, 0.07497024536132812, 0.08756256103515625, 0.10015487670898438, 0.1127471923828125, 0.12533950805664062, 0.13793182373046875, 0.15052413940429688, 0.163116455078125, 0.17570877075195312, 0.18830108642578125, 0.20089340209960938, 0.2134857177734375, 0.22607803344726562, 0.23867034912109375, 0.2512626647949219, 0.26385498046875, 0.2764472961425781, 0.28903961181640625, 0.3016319274902344, 0.3142242431640625, 0.3268165588378906, 0.33940887451171875, 0.3520011901855469, 0.364593505859375, 0.3771858215332031, 0.38977813720703125, 0.4023704528808594, 0.4149627685546875, 0.4275550842285156, 0.44014739990234375, 0.4527397155761719, 0.46533203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 9.0, 9.0, 23.0, 41.0, 95.0, 132.0, 318.0, 860.0, 1357.0, 688.0, 258.0, 132.0, 59.0, 43.0, 16.0, 12.0, 11.0, 2.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.162353515625, -0.15788650512695312, -0.15341949462890625, -0.14895248413085938, -0.1444854736328125, -0.14001846313476562, -0.13555145263671875, -0.13108444213867188, -0.126617431640625, -0.12215042114257812, -0.11768341064453125, -0.11321640014648438, -0.1087493896484375, -0.10428237915039062, -0.09981536865234375, -0.09534835815429688, -0.09088134765625, -0.08641433715820312, -0.08194732666015625, -0.07748031616210938, -0.0730133056640625, -0.06854629516601562, -0.06407928466796875, -0.059612274169921875, -0.055145263671875, -0.050678253173828125, -0.04621124267578125, -0.041744232177734375, -0.0372772216796875, -0.032810211181640625, -0.02834320068359375, -0.023876190185546875, -0.0194091796875, -0.014942169189453125, -0.01047515869140625, -0.006008148193359375, -0.0015411376953125, 0.002925872802734375, 0.00739288330078125, 0.011859893798828125, 0.016326904296875, 0.020793914794921875, 0.02526092529296875, 0.029727935791015625, 0.0341949462890625, 0.038661956787109375, 0.04312896728515625, 0.047595977783203125, 0.05206298828125, 0.056529998779296875, 0.06099700927734375, 0.06546401977539062, 0.0699310302734375, 0.07439804077148438, 0.07886505126953125, 0.08333206176757812, 0.087799072265625, 0.09226608276367188, 0.09673309326171875, 0.10120010375976562, 0.1056671142578125, 0.11013412475585938, 0.11460113525390625, 0.11906814575195312, 0.12353515625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 83.0, 543.0, 324.0, 46.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5149121284484863, -2.465409278869629, -2.4159061908721924, -2.366403341293335, -2.3169004917144775, -2.267397403717041, -2.2178945541381836, -2.168391704559326, -2.1188886165618896, -2.0693857669830322, -2.0198826789855957, -1.9703798294067383, -1.9208768606185913, -1.8713738918304443, -1.821871042251587, -1.77236807346344, -1.722865104675293, -1.673362135887146, -1.6238592863082886, -1.5743563175201416, -1.5248533487319946, -1.4753503799438477, -1.4258475303649902, -1.3763445615768433, -1.3268417119979858, -1.2773387432098389, -1.2278358936309814, -1.1783329248428345, -1.1288299560546875, -1.0793269872665405, -1.029824137687683, -0.9803211688995361, -0.9308182597160339, -0.8813153505325317, -0.8318123817443848, -0.7823094725608826, -0.7328065037727356, -0.6833035945892334, -0.6338006258010864, -0.5842977166175842, -0.534794807434082, -0.48529186844825745, -0.43578892946243286, -0.38628602027893066, -0.3367830514907837, -0.2872801423072815, -0.2377772033214569, -0.18827426433563232, -0.13877129554748535, -0.08926835656166077, -0.03976542502641678, 0.00973750650882721, 0.059240445494651794, 0.10874338448047638, 0.15824630856513977, 0.20774924755096436, 0.25725218653678894, 0.3067551255226135, 0.3562580645084381, 0.4057610034942627, 0.4552639126777649, 0.5047668814659119, 0.5542697906494141, 0.603772759437561, 0.6532756686210632]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 11.0, 7.0, 13.0, 16.0, 31.0, 19.0, 27.0, 35.0, 37.0, 39.0, 37.0, 53.0, 44.0, 39.0, 53.0, 42.0, 51.0, 53.0, 36.0, 39.0, 39.0, 34.0, 34.0, 35.0, 36.0, 22.0, 18.0, 23.0, 18.0, 8.0, 8.0, 11.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.2525344491004944, -0.24519746005535126, -0.23786047101020813, -0.2305234968662262, -0.22318650782108307, -0.21584951877593994, -0.208512544631958, -0.20117555558681488, -0.19383856654167175, -0.18650157749652863, -0.1791645884513855, -0.17182761430740356, -0.16449062526226044, -0.1571536362171173, -0.14981666207313538, -0.14247967302799225, -0.13514268398284912, -0.127805694937706, -0.12046871334314346, -0.11313173174858093, -0.1057947427034378, -0.09845775365829468, -0.09112077206373215, -0.08378379046916962, -0.07644680142402649, -0.06910981237888336, -0.06177283078432083, -0.054435845464468, -0.04709886014461517, -0.039761874824762344, -0.032424889504909515, -0.025087904185056686, -0.017750918865203857, -0.010413933545351028, -0.0030769482254981995, 0.0042600370943546295, 0.011597022414207458, 0.018934007734060287, 0.026270993053913116, 0.033607978373765945, 0.040944963693618774, 0.0482819490134716, 0.05561893433332443, 0.06295591592788696, 0.07029290497303009, 0.07762989401817322, 0.08496687561273575, 0.09230385720729828, 0.0996408462524414, 0.10697783529758453, 0.11431481689214706, 0.1216517984867096, 0.12898878753185272, 0.13632577657699585, 0.14366275072097778, 0.1509997397661209, 0.15833672881126404, 0.16567371785640717, 0.1730107069015503, 0.18034768104553223, 0.18768467009067535, 0.19502165913581848, 0.20235863327980042, 0.20969562232494354, 0.21703261137008667]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 11.0, 3.0, 12.0, 16.0, 21.0, 31.0, 36.0, 34.0, 61.0, 84.0, 106.0, 165.0, 263.0, 455.0, 823.0, 1428.0, 2793.0, 5802.0, 12147.0, 29061.0, 76613.0, 221783.0, 383721.0, 197093.0, 67418.0, 26378.0, 10980.0, 5297.0, 2577.0, 1356.0, 746.0, 400.0, 247.0, 178.0, 108.0, 87.0, 61.0, 42.0, 27.0, 27.0, 14.0, 12.0, 8.0, 17.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05267333984375, -0.050884246826171875, -0.04909515380859375, -0.047306060791015625, -0.0455169677734375, -0.043727874755859375, -0.04193878173828125, -0.040149688720703125, -0.038360595703125, -0.036571502685546875, -0.03478240966796875, -0.032993316650390625, -0.0312042236328125, -0.029415130615234375, -0.02762603759765625, -0.025836944580078125, -0.0240478515625, -0.022258758544921875, -0.02046966552734375, -0.018680572509765625, -0.0168914794921875, -0.015102386474609375, -0.01331329345703125, -0.011524200439453125, -0.009735107421875, -0.007946014404296875, -0.00615692138671875, -0.004367828369140625, -0.0025787353515625, -0.000789642333984375, 0.00099945068359375, 0.002788543701171875, 0.00457763671875, 0.006366729736328125, 0.00815582275390625, 0.009944915771484375, 0.0117340087890625, 0.013523101806640625, 0.01531219482421875, 0.017101287841796875, 0.018890380859375, 0.020679473876953125, 0.02246856689453125, 0.024257659912109375, 0.0260467529296875, 0.027835845947265625, 0.02962493896484375, 0.031414031982421875, 0.033203125, 0.034992218017578125, 0.03678131103515625, 0.038570404052734375, 0.0403594970703125, 0.042148590087890625, 0.04393768310546875, 0.045726776123046875, 0.047515869140625, 0.049304962158203125, 0.05109405517578125, 0.052883148193359375, 0.0546722412109375, 0.056461334228515625, 0.05825042724609375, 0.060039520263671875, 0.06182861328125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 9.0, 2.0, 5.0, 5.0, 12.0, 18.0, 20.0, 32.0, 42.0, 51.0, 57.0, 85.0, 85.0, 74.0, 82.0, 85.0, 64.0, 57.0, 51.0, 46.0, 31.0, 31.0, 17.0, 12.0, 11.0, 12.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05047607421875, -0.049115657806396484, -0.04775524139404297, -0.04639482498168945, -0.04503440856933594, -0.04367399215698242, -0.042313575744628906, -0.04095315933227539, -0.039592742919921875, -0.03823232650756836, -0.036871910095214844, -0.03551149368286133, -0.03415107727050781, -0.0327906608581543, -0.03143024444580078, -0.030069828033447266, -0.02870941162109375, -0.027348995208740234, -0.02598857879638672, -0.024628162384033203, -0.023267745971679688, -0.021907329559326172, -0.020546913146972656, -0.01918649673461914, -0.017826080322265625, -0.01646566390991211, -0.015105247497558594, -0.013744831085205078, -0.012384414672851562, -0.011023998260498047, -0.009663581848144531, -0.008303165435791016, -0.0069427490234375, -0.005582332611083984, -0.004221916198730469, -0.002861499786376953, -0.0015010833740234375, -0.00014066696166992188, 0.0012197494506835938, 0.0025801658630371094, 0.003940582275390625, 0.005300998687744141, 0.006661415100097656, 0.008021831512451172, 0.009382247924804688, 0.010742664337158203, 0.012103080749511719, 0.013463497161865234, 0.01482391357421875, 0.016184329986572266, 0.01754474639892578, 0.018905162811279297, 0.020265579223632812, 0.021625995635986328, 0.022986412048339844, 0.02434682846069336, 0.025707244873046875, 0.02706766128540039, 0.028428077697753906, 0.029788494110107422, 0.031148910522460938, 0.03250932693481445, 0.03386974334716797, 0.035230159759521484, 0.036590576171875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 3.0, 13.0, 8.0, 10.0, 15.0, 20.0, 26.0, 25.0, 32.0, 35.0, 55.0, 82.0, 171.0, 430.0, 1430.0, 6876.0, 46251.0, 490829.0, 451207.0, 42644.0, 6177.0, 1279.0, 400.0, 202.0, 95.0, 70.0, 38.0, 32.0, 28.0, 17.0, 14.0, 11.0, 6.0, 10.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1370849609375, -0.132659912109375, -0.12823486328125, -0.123809814453125, -0.119384765625, -0.114959716796875, -0.11053466796875, -0.106109619140625, -0.1016845703125, -0.097259521484375, -0.09283447265625, -0.088409423828125, -0.083984375, -0.079559326171875, -0.07513427734375, -0.070709228515625, -0.0662841796875, -0.061859130859375, -0.05743408203125, -0.053009033203125, -0.048583984375, -0.044158935546875, -0.03973388671875, -0.035308837890625, -0.0308837890625, -0.026458740234375, -0.02203369140625, -0.017608642578125, -0.01318359375, -0.008758544921875, -0.00433349609375, 9.1552734375e-05, 0.0045166015625, 0.008941650390625, 0.01336669921875, 0.017791748046875, 0.022216796875, 0.026641845703125, 0.03106689453125, 0.035491943359375, 0.0399169921875, 0.044342041015625, 0.04876708984375, 0.053192138671875, 0.0576171875, 0.062042236328125, 0.06646728515625, 0.070892333984375, 0.0753173828125, 0.079742431640625, 0.08416748046875, 0.088592529296875, 0.093017578125, 0.097442626953125, 0.10186767578125, 0.106292724609375, 0.1107177734375, 0.115142822265625, 0.11956787109375, 0.123992919921875, 0.12841796875, 0.132843017578125, 0.13726806640625, 0.141693115234375, 0.1461181640625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 7.0, 12.0, 14.0, 14.0, 21.0, 23.0, 32.0, 33.0, 31.0, 53.0, 49.0, 42.0, 53.0, 52.0, 44.0, 49.0, 47.0, 54.0, 50.0, 40.0, 37.0, 34.0, 26.0, 28.0, 27.0, 22.0, 23.0, 23.0, 13.0, 9.0, 11.0, 8.0, 5.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.085693359375, -0.08310508728027344, -0.08051681518554688, -0.07792854309082031, -0.07534027099609375, -0.07275199890136719, -0.07016372680664062, -0.06757545471191406, -0.0649871826171875, -0.06239891052246094, -0.059810638427734375, -0.05722236633300781, -0.05463409423828125, -0.05204582214355469, -0.049457550048828125, -0.04686927795410156, -0.044281005859375, -0.04169273376464844, -0.039104461669921875, -0.03651618957519531, -0.03392791748046875, -0.03133964538574219, -0.028751373291015625, -0.026163101196289062, -0.0235748291015625, -0.020986557006835938, -0.018398284912109375, -0.015810012817382812, -0.01322174072265625, -0.010633468627929688, -0.008045196533203125, -0.0054569244384765625, -0.00286865234375, -0.0002803802490234375, 0.002307891845703125, 0.0048961639404296875, 0.00748443603515625, 0.010072708129882812, 0.012660980224609375, 0.015249252319335938, 0.0178375244140625, 0.020425796508789062, 0.023014068603515625, 0.025602340698242188, 0.02819061279296875, 0.030778884887695312, 0.033367156982421875, 0.03595542907714844, 0.038543701171875, 0.04113197326660156, 0.043720245361328125, 0.04630851745605469, 0.04889678955078125, 0.05148506164550781, 0.054073333740234375, 0.05666160583496094, 0.0592498779296875, 0.06183815002441406, 0.06442642211914062, 0.06701469421386719, 0.06960296630859375, 0.07219123840332031, 0.07477951049804688, 0.07736778259277344, 0.0799560546875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 14.0, 20.0, 41.0, 70.0, 130.0, 324.0, 1188.0, 8476.0, 198298.0, 783847.0, 51508.0, 3514.0, 663.0, 227.0, 100.0, 60.0, 35.0, 11.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.060882568359375, -0.05940866470336914, -0.05793476104736328, -0.05646085739135742, -0.05498695373535156, -0.0535130500793457, -0.052039146423339844, -0.050565242767333984, -0.049091339111328125, -0.047617435455322266, -0.046143531799316406, -0.04466962814331055, -0.04319572448730469, -0.04172182083129883, -0.04024791717529297, -0.03877401351928711, -0.03730010986328125, -0.03582620620727539, -0.03435230255126953, -0.03287839889526367, -0.03140449523925781, -0.029930591583251953, -0.028456687927246094, -0.026982784271240234, -0.025508880615234375, -0.024034976959228516, -0.022561073303222656, -0.021087169647216797, -0.019613265991210938, -0.018139362335205078, -0.01666545867919922, -0.01519155502319336, -0.0137176513671875, -0.01224374771118164, -0.010769844055175781, -0.009295940399169922, -0.007822036743164062, -0.006348133087158203, -0.004874229431152344, -0.0034003257751464844, -0.001926422119140625, -0.0004525184631347656, 0.0010213851928710938, 0.002495288848876953, 0.0039691925048828125, 0.005443096160888672, 0.006916999816894531, 0.00839090347290039, 0.00986480712890625, 0.01133871078491211, 0.012812614440917969, 0.014286518096923828, 0.015760421752929688, 0.017234325408935547, 0.018708229064941406, 0.020182132720947266, 0.021656036376953125, 0.023129940032958984, 0.024603843688964844, 0.026077747344970703, 0.027551651000976562, 0.029025554656982422, 0.03049945831298828, 0.03197336196899414, 0.033447265625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 12.0, 16.0, 30.0, 42.0, 65.0, 74.0, 132.0, 118.0, 128.0, 93.0, 79.0, 82.0, 43.0, 27.0, 23.0, 13.0, 10.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0531158447265625e-06, -3.862194716930389e-06, -3.6712735891342163e-06, -3.4803524613380432e-06, -3.28943133354187e-06, -3.098510205745697e-06, -2.907589077949524e-06, -2.716667950153351e-06, -2.5257468223571777e-06, -2.3348256945610046e-06, -2.1439045667648315e-06, -1.9529834389686584e-06, -1.7620623111724854e-06, -1.5711411833763123e-06, -1.3802200555801392e-06, -1.189298927783966e-06, -9.98377799987793e-07, -8.074566721916199e-07, -6.165355443954468e-07, -4.256144165992737e-07, -2.3469328880310059e-07, -4.377216100692749e-08, 1.471489667892456e-07, 3.380700945854187e-07, 5.289912223815918e-07, 7.199123501777649e-07, 9.10833477973938e-07, 1.101754605770111e-06, 1.2926757335662842e-06, 1.4835968613624573e-06, 1.6745179891586304e-06, 1.8654391169548035e-06, 2.0563602447509766e-06, 2.2472813725471497e-06, 2.4382025003433228e-06, 2.629123628139496e-06, 2.820044755935669e-06, 3.010965883731842e-06, 3.201887011528015e-06, 3.3928081393241882e-06, 3.5837292671203613e-06, 3.7746503949165344e-06, 3.9655715227127075e-06, 4.156492650508881e-06, 4.347413778305054e-06, 4.538334906101227e-06, 4.7292560338974e-06, 4.920177161693573e-06, 5.111098289489746e-06, 5.302019417285919e-06, 5.492940545082092e-06, 5.683861672878265e-06, 5.8747828006744385e-06, 6.0657039284706116e-06, 6.256625056266785e-06, 6.447546184062958e-06, 6.638467311859131e-06, 6.829388439655304e-06, 7.020309567451477e-06, 7.21123069524765e-06, 7.402151823043823e-06, 7.593072950839996e-06, 7.78399407863617e-06, 7.974915206432343e-06, 8.165836334228516e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 1.0, 16.0, 13.0, 20.0, 40.0, 57.0, 148.0, 338.0, 889.0, 3181.0, 19259.0, 207073.0, 660172.0, 139779.0, 13640.0, 2558.0, 751.0, 300.0, 140.0, 61.0, 39.0, 30.0, 10.0, 11.0, 8.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0251617431640625, -0.024209260940551758, -0.023256778717041016, -0.022304296493530273, -0.02135181427001953, -0.02039933204650879, -0.019446849822998047, -0.018494367599487305, -0.017541885375976562, -0.01658940315246582, -0.015636920928955078, -0.014684438705444336, -0.013731956481933594, -0.012779474258422852, -0.01182699203491211, -0.010874509811401367, -0.009922027587890625, -0.008969545364379883, -0.00801706314086914, -0.0070645809173583984, -0.006112098693847656, -0.005159616470336914, -0.004207134246826172, -0.0032546520233154297, -0.0023021697998046875, -0.0013496875762939453, -0.0003972053527832031, 0.0005552768707275391, 0.0015077590942382812, 0.0024602413177490234, 0.0034127235412597656, 0.004365205764770508, 0.00531768798828125, 0.006270170211791992, 0.007222652435302734, 0.008175134658813477, 0.009127616882324219, 0.010080099105834961, 0.011032581329345703, 0.011985063552856445, 0.012937545776367188, 0.01389002799987793, 0.014842510223388672, 0.015794992446899414, 0.016747474670410156, 0.0176999568939209, 0.01865243911743164, 0.019604921340942383, 0.020557403564453125, 0.021509885787963867, 0.02246236801147461, 0.02341485023498535, 0.024367332458496094, 0.025319814682006836, 0.026272296905517578, 0.02722477912902832, 0.028177261352539062, 0.029129743576049805, 0.030082225799560547, 0.03103470802307129, 0.03198719024658203, 0.03293967247009277, 0.033892154693603516, 0.03484463691711426, 0.035797119140625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 10.0, 6.0, 10.0, 15.0, 22.0, 23.0, 42.0, 38.0, 55.0, 89.0, 93.0, 92.0, 94.0, 92.0, 84.0, 76.0, 54.0, 24.0, 28.0, 14.0, 11.0, 4.0, 11.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.02301025390625, -0.022460103034973145, -0.02190995216369629, -0.021359801292419434, -0.020809650421142578, -0.020259499549865723, -0.019709348678588867, -0.01915919780731201, -0.018609046936035156, -0.0180588960647583, -0.017508745193481445, -0.01695859432220459, -0.016408443450927734, -0.01585829257965088, -0.015308141708374023, -0.014757990837097168, -0.014207839965820312, -0.013657689094543457, -0.013107538223266602, -0.012557387351989746, -0.01200723648071289, -0.011457085609436035, -0.01090693473815918, -0.010356783866882324, -0.009806632995605469, -0.009256482124328613, -0.008706331253051758, -0.008156180381774902, -0.007606029510498047, -0.007055878639221191, -0.006505727767944336, -0.0059555768966674805, -0.005405426025390625, -0.0048552751541137695, -0.004305124282836914, -0.0037549734115600586, -0.003204822540283203, -0.0026546716690063477, -0.002104520797729492, -0.0015543699264526367, -0.0010042190551757812, -0.0004540681838989258, 9.608268737792969e-05, 0.0006462335586547852, 0.0011963844299316406, 0.001746535301208496, 0.0022966861724853516, 0.002846837043762207, 0.0033969879150390625, 0.003947138786315918, 0.0044972896575927734, 0.005047440528869629, 0.005597591400146484, 0.00614774227142334, 0.006697893142700195, 0.007248044013977051, 0.007798194885253906, 0.008348345756530762, 0.008898496627807617, 0.009448647499084473, 0.009998798370361328, 0.010548949241638184, 0.011099100112915039, 0.011649250984191895, 0.01219940185546875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 16.0, 17.0, 54.0, 123.0, 322.0, 279.0, 136.0, 32.0, 12.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5291925072669983, -0.5136475563049316, -0.4981025755405426, -0.48255759477615356, -0.4670126438140869, -0.4514676630496979, -0.43592268228530884, -0.4203777313232422, -0.40483275055885315, -0.3892877697944641, -0.37374281883239746, -0.3581978380680084, -0.3426528871059418, -0.32710790634155273, -0.3115629553794861, -0.29601797461509705, -0.280472993850708, -0.26492801308631897, -0.24938306212425232, -0.23383808135986328, -0.21829311549663544, -0.2027481496334076, -0.18720318377017975, -0.1716582179069519, -0.15611326694488525, -0.1405683010816574, -0.12502333521842957, -0.10947836190462112, -0.09393338859081268, -0.07838842272758484, -0.062843456864357, -0.04729848355054855, -0.03175351023674011, -0.01620854064822197, -0.0006635729223489761, 0.014881394803524017, 0.03042636439204216, 0.0459713339805603, 0.06151629984378815, 0.07706127315759659, 0.09260623902082443, 0.10815120488405228, 0.12369617819786072, 0.13924114406108856, 0.1547861099243164, 0.17033109068870544, 0.1858760416507721, 0.20142102241516113, 0.21696598827838898, 0.23251095414161682, 0.24805592000484467, 0.2636008858680725, 0.27914586663246155, 0.2946908473968506, 0.31023579835891724, 0.3257807791233063, 0.3413257300853729, 0.35687071084976196, 0.3724156618118286, 0.38796064257621765, 0.4035055935382843, 0.41905057430267334, 0.43459552526474, 0.45014050602912903, 0.46568548679351807]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 2.0, 2.0, 8.0, 10.0, 11.0, 11.0, 11.0, 8.0, 9.0, 22.0, 32.0, 22.0, 20.0, 39.0, 36.0, 27.0, 36.0, 41.0, 51.0, 35.0, 41.0, 39.0, 39.0, 36.0, 40.0, 40.0, 34.0, 35.0, 40.0, 26.0, 29.0, 24.0, 22.0, 29.0, 16.0, 10.0, 16.0, 9.0, 17.0, 6.0, 6.0, 4.0, 3.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2475351095199585, -0.24045318365097046, -0.23337127268314362, -0.22628934681415558, -0.21920742094516754, -0.2121255099773407, -0.20504358410835266, -0.19796165823936462, -0.1908797323703766, -0.18379780650138855, -0.1767158955335617, -0.16963396966457367, -0.16255204379558563, -0.1554701328277588, -0.14838820695877075, -0.14130628108978271, -0.13422437012195587, -0.12714244425296783, -0.1200605258345604, -0.11297860741615295, -0.10589668154716492, -0.09881476312875748, -0.09173284471035004, -0.084650918841362, -0.07756900042295456, -0.07048708200454712, -0.06340515613555908, -0.05632323771715164, -0.0492413155734539, -0.042159393429756165, -0.035077475011348724, -0.027995552867650986, -0.020913630723953247, -0.013831709511578083, -0.006749788299202919, 0.0003321319818496704, 0.007414054125547409, 0.014495976269245148, 0.021577894687652588, 0.028659816831350327, 0.035741738975048065, 0.042823661118745804, 0.04990558326244354, 0.05698750168085098, 0.06406942009925842, 0.07115134596824646, 0.0782332643866539, 0.08531518280506134, 0.09239710867404938, 0.09947902709245682, 0.10656095296144485, 0.1136428713798523, 0.12072479724884033, 0.12780672311782837, 0.1348886340856552, 0.14197055995464325, 0.1490524709224701, 0.15613439679145813, 0.16321630775928497, 0.170298233628273, 0.17738015949726105, 0.1844620704650879, 0.19154399633407593, 0.19862592220306396, 0.205707848072052]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 1.0, 5.0, 5.0, 9.0, 13.0, 20.0, 32.0, 44.0, 61.0, 103.0, 145.0, 264.0, 461.0, 1027.0, 2415.0, 6433.0, 23409.0, 219048.0, 2908324.0, 963519.0, 51010.0, 12066.0, 3535.0, 1220.0, 531.0, 271.0, 132.0, 69.0, 42.0, 29.0, 16.0, 9.0, 12.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0924072265625, -0.08995723724365234, -0.08750724792480469, -0.08505725860595703, -0.08260726928710938, -0.08015727996826172, -0.07770729064941406, -0.0752573013305664, -0.07280731201171875, -0.0703573226928711, -0.06790733337402344, -0.06545734405517578, -0.06300735473632812, -0.06055736541748047, -0.05810737609863281, -0.055657386779785156, -0.0532073974609375, -0.050757408142089844, -0.04830741882324219, -0.04585742950439453, -0.043407440185546875, -0.04095745086669922, -0.03850746154785156, -0.036057472229003906, -0.03360748291015625, -0.031157493591308594, -0.028707504272460938, -0.02625751495361328, -0.023807525634765625, -0.02135753631591797, -0.018907546997070312, -0.016457557678222656, -0.014007568359375, -0.011557579040527344, -0.009107589721679688, -0.006657600402832031, -0.004207611083984375, -0.0017576217651367188, 0.0006923675537109375, 0.0031423568725585938, 0.00559234619140625, 0.008042335510253906, 0.010492324829101562, 0.012942314147949219, 0.015392303466796875, 0.01784229278564453, 0.020292282104492188, 0.022742271423339844, 0.0251922607421875, 0.027642250061035156, 0.030092239379882812, 0.03254222869873047, 0.034992218017578125, 0.03744220733642578, 0.03989219665527344, 0.042342185974121094, 0.04479217529296875, 0.047242164611816406, 0.04969215393066406, 0.05214214324951172, 0.054592132568359375, 0.05704212188720703, 0.05949211120605469, 0.061942100524902344, 0.06439208984375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 15.0, 23.0, 28.0, 25.0, 35.0, 39.0, 57.0, 56.0, 66.0, 71.0, 67.0, 71.0, 74.0, 60.0, 79.0, 38.0, 43.0, 37.0, 26.0, 22.0, 30.0, 9.0, 9.0, 10.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061004638671875, -0.05951881408691406, -0.058032989501953125, -0.05654716491699219, -0.05506134033203125, -0.05357551574707031, -0.052089691162109375, -0.05060386657714844, -0.0491180419921875, -0.04763221740722656, -0.046146392822265625, -0.04466056823730469, -0.04317474365234375, -0.04168891906738281, -0.040203094482421875, -0.03871726989746094, -0.0372314453125, -0.03574562072753906, -0.034259796142578125, -0.03277397155761719, -0.03128814697265625, -0.029802322387695312, -0.028316497802734375, -0.026830673217773438, -0.0253448486328125, -0.023859024047851562, -0.022373199462890625, -0.020887374877929688, -0.01940155029296875, -0.017915725708007812, -0.016429901123046875, -0.014944076538085938, -0.013458251953125, -0.011972427368164062, -0.010486602783203125, -0.009000778198242188, -0.00751495361328125, -0.0060291290283203125, -0.004543304443359375, -0.0030574798583984375, -0.0015716552734375, -8.58306884765625e-05, 0.001399993896484375, 0.0028858184814453125, 0.00437164306640625, 0.0058574676513671875, 0.007343292236328125, 0.008829116821289062, 0.01031494140625, 0.011800765991210938, 0.013286590576171875, 0.014772415161132812, 0.01625823974609375, 0.017744064331054688, 0.019229888916015625, 0.020715713500976562, 0.0222015380859375, 0.023687362670898438, 0.025173187255859375, 0.026659011840820312, 0.02814483642578125, 0.029630661010742188, 0.031116485595703125, 0.03260231018066406, 0.034088134765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 5.0, 6.0, 9.0, 7.0, 21.0, 19.0, 35.0, 34.0, 60.0, 91.0, 130.0, 208.0, 367.0, 1076.0, 6581.0, 267641.0, 3868997.0, 44629.0, 2854.0, 676.0, 292.0, 157.0, 100.0, 75.0, 54.0, 39.0, 28.0, 22.0, 16.0, 15.0, 6.0, 10.0, 6.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1820068359375, -0.1765422821044922, -0.17107772827148438, -0.16561317443847656, -0.16014862060546875, -0.15468406677246094, -0.14921951293945312, -0.1437549591064453, -0.1382904052734375, -0.1328258514404297, -0.12736129760742188, -0.12189674377441406, -0.11643218994140625, -0.11096763610839844, -0.10550308227539062, -0.10003852844238281, -0.094573974609375, -0.08910942077636719, -0.08364486694335938, -0.07818031311035156, -0.07271575927734375, -0.06725120544433594, -0.061786651611328125, -0.05632209777832031, -0.0508575439453125, -0.04539299011230469, -0.039928436279296875, -0.03446388244628906, -0.02899932861328125, -0.023534774780273438, -0.018070220947265625, -0.012605667114257812, -0.00714111328125, -0.0016765594482421875, 0.003787994384765625, 0.009252548217773438, 0.01471710205078125, 0.020181655883789062, 0.025646209716796875, 0.031110763549804688, 0.0365753173828125, 0.04203987121582031, 0.047504425048828125, 0.05296897888183594, 0.05843353271484375, 0.06389808654785156, 0.06936264038085938, 0.07482719421386719, 0.080291748046875, 0.08575630187988281, 0.09122085571289062, 0.09668540954589844, 0.10214996337890625, 0.10761451721191406, 0.11307907104492188, 0.11854362487792969, 0.1240081787109375, 0.1294727325439453, 0.13493728637695312, 0.14040184020996094, 0.14586639404296875, 0.15133094787597656, 0.15679550170898438, 0.1622600555419922, 0.167724609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 9.0, 4.0, 9.0, 9.0, 14.0, 16.0, 22.0, 38.0, 42.0, 42.0, 58.0, 100.0, 115.0, 189.0, 337.0, 534.0, 686.0, 654.0, 400.0, 241.0, 140.0, 112.0, 81.0, 58.0, 44.0, 25.0, 23.0, 14.0, 15.0, 15.0, 6.0, 2.0, 4.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049468994140625, -0.04780244827270508, -0.046135902404785156, -0.044469356536865234, -0.04280281066894531, -0.04113626480102539, -0.03946971893310547, -0.03780317306518555, -0.036136627197265625, -0.0344700813293457, -0.03280353546142578, -0.03113698959350586, -0.029470443725585938, -0.027803897857666016, -0.026137351989746094, -0.024470806121826172, -0.02280426025390625, -0.021137714385986328, -0.019471168518066406, -0.017804622650146484, -0.016138076782226562, -0.01447153091430664, -0.012804985046386719, -0.011138439178466797, -0.009471893310546875, -0.007805347442626953, -0.006138801574707031, -0.004472255706787109, -0.0028057098388671875, -0.0011391639709472656, 0.0005273818969726562, 0.002193927764892578, 0.0038604736328125, 0.005527019500732422, 0.007193565368652344, 0.008860111236572266, 0.010526657104492188, 0.01219320297241211, 0.013859748840332031, 0.015526294708251953, 0.017192840576171875, 0.018859386444091797, 0.02052593231201172, 0.02219247817993164, 0.023859024047851562, 0.025525569915771484, 0.027192115783691406, 0.028858661651611328, 0.03052520751953125, 0.03219175338745117, 0.033858299255371094, 0.035524845123291016, 0.03719139099121094, 0.03885793685913086, 0.04052448272705078, 0.0421910285949707, 0.043857574462890625, 0.04552412033081055, 0.04719066619873047, 0.04885721206665039, 0.05052375793457031, 0.052190303802490234, 0.053856849670410156, 0.05552339553833008, 0.05718994140625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 8.0, 30.0, 90.0, 243.0, 342.0, 190.0, 77.0, 20.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8728346228599548, -0.8544085621833801, -0.8359824419021606, -0.8175563812255859, -0.7991302609443665, -0.7807042002677917, -0.7622780799865723, -0.7438520193099976, -0.7254259586334229, -0.7069998979568481, -0.6885737776756287, -0.670147716999054, -0.6517215967178345, -0.6332955360412598, -0.6148694157600403, -0.5964433550834656, -0.5780172348022461, -0.5595911741256714, -0.5411650538444519, -0.5227389931678772, -0.5043128728866577, -0.485886812210083, -0.4674607217311859, -0.4490346312522888, -0.4306085407733917, -0.41218245029449463, -0.39375635981559753, -0.37533026933670044, -0.35690420866012573, -0.33847808837890625, -0.32005202770233154, -0.30162593722343445, -0.2831997871398926, -0.2647736966609955, -0.2463476061820984, -0.2279215306043625, -0.2094954401254654, -0.1910693496465683, -0.1726432740688324, -0.1542171835899353, -0.1357910931110382, -0.11736500263214111, -0.09893891960382462, -0.08051283657550812, -0.06208674609661102, -0.04366065561771393, -0.02523457258939743, -0.006808489561080933, 0.011617600917816162, 0.03004368767142296, 0.048469774425029755, 0.06689585745334625, 0.08532194793224335, 0.10374803841114044, 0.12217412143945694, 0.14060020446777344, 0.15902629494667053, 0.17745238542556763, 0.19587847590446472, 0.21430455148220062, 0.23273064196109772, 0.251156747341156, 0.2695828080177307, 0.2880088984966278, 0.3064349889755249]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 7.0, 3.0, 4.0, 7.0, 6.0, 8.0, 5.0, 21.0, 13.0, 14.0, 16.0, 27.0, 19.0, 22.0, 28.0, 24.0, 30.0, 32.0, 30.0, 47.0, 37.0, 32.0, 40.0, 37.0, 51.0, 35.0, 37.0, 36.0, 40.0, 33.0, 23.0, 32.0, 24.0, 25.0, 30.0, 24.0, 20.0, 16.0, 13.0, 14.0, 14.0, 8.0, 8.0, 6.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.13420706987380981, -0.1296379715204239, -0.12506887316703796, -0.12049977481365204, -0.11593067646026611, -0.11136157810688019, -0.10679247230291367, -0.10222337394952774, -0.09765427559614182, -0.09308517724275589, -0.08851607888936996, -0.08394698053598404, -0.07937787473201752, -0.07480877637863159, -0.07023967802524567, -0.06567057967185974, -0.061101481318473816, -0.05653238296508789, -0.051963284611701965, -0.04739418253302574, -0.042825084179639816, -0.03825598582625389, -0.03368688374757767, -0.029117785394191742, -0.024548687040805817, -0.01997958868741989, -0.015410488471388817, -0.010841389186680317, -0.006272289901971817, -0.0017031915485858917, 0.002865908667445183, 0.007435008883476257, 0.012004107236862183, 0.016573205590248108, 0.021142305806279182, 0.025711406022310257, 0.030280504375696182, 0.03484960272908211, 0.03941870480775833, 0.04398780316114426, 0.04855690151453018, 0.05312599986791611, 0.05769509822130203, 0.062264200299978256, 0.06683330237865448, 0.0714024007320404, 0.07597149908542633, 0.08054059743881226, 0.08510969579219818, 0.0896787941455841, 0.09424789249897003, 0.09881699085235596, 0.10338608920574188, 0.10795518755912781, 0.11252429336309433, 0.11709339171648026, 0.12166249006986618, 0.1262315958738327, 0.13080069422721863, 0.13536979258060455, 0.13993889093399048, 0.1445079892873764, 0.14907708764076233, 0.15364618599414825, 0.15821528434753418]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 6.0, 8.0, 12.0, 14.0, 16.0, 37.0, 43.0, 53.0, 86.0, 145.0, 194.0, 370.0, 766.0, 1491.0, 3519.0, 8650.0, 23516.0, 71657.0, 237247.0, 418152.0, 192351.0, 57881.0, 19335.0, 7281.0, 2922.0, 1273.0, 603.0, 369.0, 199.0, 108.0, 82.0, 46.0, 29.0, 26.0, 13.0, 19.0, 6.0, 9.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0709228515625, -0.0685110092163086, -0.06609916687011719, -0.06368732452392578, -0.061275482177734375, -0.05886363983154297, -0.05645179748535156, -0.054039955139160156, -0.05162811279296875, -0.049216270446777344, -0.04680442810058594, -0.04439258575439453, -0.041980743408203125, -0.03956890106201172, -0.03715705871582031, -0.034745216369628906, -0.0323333740234375, -0.029921531677246094, -0.027509689331054688, -0.02509784698486328, -0.022686004638671875, -0.02027416229248047, -0.017862319946289062, -0.015450477600097656, -0.01303863525390625, -0.010626792907714844, -0.008214950561523438, -0.005803108215332031, -0.003391265869140625, -0.0009794235229492188, 0.0014324188232421875, 0.0038442611694335938, 0.006256103515625, 0.008667945861816406, 0.011079788208007812, 0.013491630554199219, 0.015903472900390625, 0.01831531524658203, 0.020727157592773438, 0.023138999938964844, 0.02555084228515625, 0.027962684631347656, 0.030374526977539062, 0.03278636932373047, 0.035198211669921875, 0.03761005401611328, 0.04002189636230469, 0.042433738708496094, 0.0448455810546875, 0.047257423400878906, 0.04966926574707031, 0.05208110809326172, 0.054492950439453125, 0.05690479278564453, 0.05931663513183594, 0.061728477478027344, 0.06414031982421875, 0.06655216217041016, 0.06896400451660156, 0.07137584686279297, 0.07378768920898438, 0.07619953155517578, 0.07861137390136719, 0.0810232162475586, 0.08343505859375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 16.0, 13.0, 21.0, 26.0, 37.0, 39.0, 54.0, 62.0, 75.0, 59.0, 87.0, 79.0, 72.0, 99.0, 52.0, 41.0, 43.0, 45.0, 33.0, 18.0, 16.0, 8.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0609130859375, -0.05942535400390625, -0.0579376220703125, -0.05644989013671875, -0.054962158203125, -0.05347442626953125, -0.0519866943359375, -0.05049896240234375, -0.04901123046875, -0.04752349853515625, -0.0460357666015625, -0.04454803466796875, -0.043060302734375, -0.04157257080078125, -0.0400848388671875, -0.03859710693359375, -0.037109375, -0.03562164306640625, -0.0341339111328125, -0.03264617919921875, -0.031158447265625, -0.02967071533203125, -0.0281829833984375, -0.02669525146484375, -0.02520751953125, -0.02371978759765625, -0.0222320556640625, -0.02074432373046875, -0.019256591796875, -0.01776885986328125, -0.0162811279296875, -0.01479339599609375, -0.0133056640625, -0.01181793212890625, -0.0103302001953125, -0.00884246826171875, -0.007354736328125, -0.00586700439453125, -0.0043792724609375, -0.00289154052734375, -0.00140380859375, 8.392333984375e-05, 0.0015716552734375, 0.00305938720703125, 0.004547119140625, 0.00603485107421875, 0.0075225830078125, 0.00901031494140625, 0.010498046875, 0.01198577880859375, 0.0134735107421875, 0.01496124267578125, 0.016448974609375, 0.01793670654296875, 0.0194244384765625, 0.02091217041015625, 0.02239990234375, 0.02388763427734375, 0.0253753662109375, 0.02686309814453125, 0.028350830078125, 0.02983856201171875, 0.0313262939453125, 0.03281402587890625, 0.0343017578125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 5.0, 11.0, 13.0, 10.0, 15.0, 27.0, 26.0, 30.0, 56.0, 66.0, 90.0, 163.0, 239.0, 404.0, 828.0, 2009.0, 6191.0, 27886.0, 199264.0, 659664.0, 123820.0, 19757.0, 4720.0, 1530.0, 687.0, 326.0, 199.0, 118.0, 114.0, 89.0, 48.0, 47.0, 27.0, 29.0, 11.0, 13.0, 10.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1209716796875, -0.11723709106445312, -0.11350250244140625, -0.10976791381835938, -0.1060333251953125, -0.10229873657226562, -0.09856414794921875, -0.09482955932617188, -0.091094970703125, -0.08736038208007812, -0.08362579345703125, -0.07989120483398438, -0.0761566162109375, -0.07242202758789062, -0.06868743896484375, -0.06495285034179688, -0.06121826171875, -0.057483673095703125, -0.05374908447265625, -0.050014495849609375, -0.0462799072265625, -0.042545318603515625, -0.03881072998046875, -0.035076141357421875, -0.031341552734375, -0.027606964111328125, -0.02387237548828125, -0.020137786865234375, -0.0164031982421875, -0.012668609619140625, -0.00893402099609375, -0.005199432373046875, -0.00146484375, 0.002269744873046875, 0.00600433349609375, 0.009738922119140625, 0.0134735107421875, 0.017208099365234375, 0.02094268798828125, 0.024677276611328125, 0.028411865234375, 0.032146453857421875, 0.03588104248046875, 0.039615631103515625, 0.0433502197265625, 0.047084808349609375, 0.05081939697265625, 0.054553985595703125, 0.05828857421875, 0.062023162841796875, 0.06575775146484375, 0.06949234008789062, 0.0732269287109375, 0.07696151733398438, 0.08069610595703125, 0.08443069458007812, 0.088165283203125, 0.09189987182617188, 0.09563446044921875, 0.09936904907226562, 0.1031036376953125, 0.10683822631835938, 0.11057281494140625, 0.11430740356445312, 0.1180419921875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 7.0, 8.0, 9.0, 9.0, 19.0, 12.0, 16.0, 29.0, 24.0, 38.0, 43.0, 30.0, 41.0, 47.0, 48.0, 49.0, 44.0, 58.0, 54.0, 57.0, 36.0, 58.0, 46.0, 41.0, 27.0, 25.0, 16.0, 18.0, 17.0, 8.0, 12.0, 20.0, 7.0, 9.0, 6.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07696533203125, -0.07451629638671875, -0.0720672607421875, -0.06961822509765625, -0.067169189453125, -0.06472015380859375, -0.0622711181640625, -0.05982208251953125, -0.057373046875, -0.05492401123046875, -0.0524749755859375, -0.05002593994140625, -0.047576904296875, -0.04512786865234375, -0.0426788330078125, -0.04022979736328125, -0.03778076171875, -0.03533172607421875, -0.0328826904296875, -0.03043365478515625, -0.027984619140625, -0.02553558349609375, -0.0230865478515625, -0.02063751220703125, -0.0181884765625, -0.01573944091796875, -0.0132904052734375, -0.01084136962890625, -0.008392333984375, -0.00594329833984375, -0.0034942626953125, -0.00104522705078125, 0.00140380859375, 0.00385284423828125, 0.0063018798828125, 0.00875091552734375, 0.011199951171875, 0.01364898681640625, 0.0160980224609375, 0.01854705810546875, 0.02099609375, 0.02344512939453125, 0.0258941650390625, 0.02834320068359375, 0.030792236328125, 0.03324127197265625, 0.0356903076171875, 0.03813934326171875, 0.04058837890625, 0.04303741455078125, 0.0454864501953125, 0.04793548583984375, 0.050384521484375, 0.05283355712890625, 0.0552825927734375, 0.05773162841796875, 0.0601806640625, 0.06262969970703125, 0.0650787353515625, 0.06752777099609375, 0.069976806640625, 0.07242584228515625, 0.0748748779296875, 0.07732391357421875, 0.07977294921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 12.0, 9.0, 13.0, 18.0, 28.0, 44.0, 51.0, 110.0, 132.0, 229.0, 442.0, 826.0, 1751.0, 3974.0, 9039.0, 25031.0, 87512.0, 294622.0, 395310.0, 161691.0, 42993.0, 14200.0, 5499.0, 2358.0, 1142.0, 566.0, 324.0, 211.0, 132.0, 88.0, 61.0, 40.0, 23.0, 19.0, 12.0, 11.0, 11.0, 5.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.01898193359375, -0.018427371978759766, -0.01787281036376953, -0.017318248748779297, -0.016763687133789062, -0.016209125518798828, -0.015654563903808594, -0.01510000228881836, -0.014545440673828125, -0.01399087905883789, -0.013436317443847656, -0.012881755828857422, -0.012327194213867188, -0.011772632598876953, -0.011218070983886719, -0.010663509368896484, -0.01010894775390625, -0.009554386138916016, -0.008999824523925781, -0.008445262908935547, -0.007890701293945312, -0.007336139678955078, -0.006781578063964844, -0.006227016448974609, -0.005672454833984375, -0.005117893218994141, -0.004563331604003906, -0.004008769989013672, -0.0034542083740234375, -0.002899646759033203, -0.0023450851440429688, -0.0017905235290527344, -0.0012359619140625, -0.0006814002990722656, -0.00012683868408203125, 0.0004277229309082031, 0.0009822845458984375, 0.0015368461608886719, 0.0020914077758789062, 0.0026459693908691406, 0.003200531005859375, 0.0037550926208496094, 0.004309654235839844, 0.004864215850830078, 0.0054187774658203125, 0.005973339080810547, 0.006527900695800781, 0.007082462310791016, 0.00763702392578125, 0.008191585540771484, 0.008746147155761719, 0.009300708770751953, 0.009855270385742188, 0.010409832000732422, 0.010964393615722656, 0.01151895523071289, 0.012073516845703125, 0.01262807846069336, 0.013182640075683594, 0.013737201690673828, 0.014291763305664062, 0.014846324920654297, 0.015400886535644531, 0.015955448150634766, 0.016510009765625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 4.0, 5.0, 4.0, 8.0, 12.0, 14.0, 13.0, 30.0, 33.0, 36.0, 63.0, 80.0, 92.0, 73.0, 78.0, 99.0, 61.0, 75.0, 73.0, 26.0, 35.0, 22.0, 22.0, 6.0, 13.0, 3.0, 1.0, 6.0, 8.0, 0.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.198883056640625e-06, -6.037764251232147e-06, -5.8766454458236694e-06, -5.715526640415192e-06, -5.554407835006714e-06, -5.393289029598236e-06, -5.232170224189758e-06, -5.0710514187812805e-06, -4.909932613372803e-06, -4.748813807964325e-06, -4.587695002555847e-06, -4.426576197147369e-06, -4.265457391738892e-06, -4.104338586330414e-06, -3.943219780921936e-06, -3.7821009755134583e-06, -3.6209821701049805e-06, -3.4598633646965027e-06, -3.298744559288025e-06, -3.137625753879547e-06, -2.9765069484710693e-06, -2.8153881430625916e-06, -2.6542693376541138e-06, -2.493150532245636e-06, -2.332031726837158e-06, -2.1709129214286804e-06, -2.0097941160202026e-06, -1.8486753106117249e-06, -1.687556505203247e-06, -1.5264376997947693e-06, -1.3653188943862915e-06, -1.2042000889778137e-06, -1.043081283569336e-06, -8.819624781608582e-07, -7.208436727523804e-07, -5.597248673439026e-07, -3.986060619354248e-07, -2.3748725652694702e-07, -7.636845111846924e-08, 8.475035429000854e-08, 2.4586915969848633e-07, 4.069879651069641e-07, 5.681067705154419e-07, 7.292255759239197e-07, 8.903443813323975e-07, 1.0514631867408752e-06, 1.212581992149353e-06, 1.3737007975578308e-06, 1.5348196029663086e-06, 1.6959384083747864e-06, 1.8570572137832642e-06, 2.018176019191742e-06, 2.1792948246002197e-06, 2.3404136300086975e-06, 2.5015324354171753e-06, 2.662651240825653e-06, 2.823770046234131e-06, 2.9848888516426086e-06, 3.1460076570510864e-06, 3.307126462459564e-06, 3.468245267868042e-06, 3.6293640732765198e-06, 3.7904828786849976e-06, 3.951601684093475e-06, 4.112720489501953e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 8.0, 5.0, 12.0, 30.0, 55.0, 113.0, 232.0, 610.0, 1830.0, 9452.0, 96528.0, 715144.0, 204406.0, 16060.0, 2701.0, 783.0, 309.0, 146.0, 62.0, 37.0, 18.0, 12.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0323486328125, -0.031177997589111328, -0.030007362365722656, -0.028836727142333984, -0.027666091918945312, -0.02649545669555664, -0.02532482147216797, -0.024154186248779297, -0.022983551025390625, -0.021812915802001953, -0.02064228057861328, -0.01947164535522461, -0.018301010131835938, -0.017130374908447266, -0.015959739685058594, -0.014789104461669922, -0.01361846923828125, -0.012447834014892578, -0.011277198791503906, -0.010106563568115234, -0.008935928344726562, -0.007765293121337891, -0.006594657897949219, -0.005424022674560547, -0.004253387451171875, -0.003082752227783203, -0.0019121170043945312, -0.0007414817810058594, 0.0004291534423828125, 0.0015997886657714844, 0.0027704238891601562, 0.003941059112548828, 0.0051116943359375, 0.006282329559326172, 0.007452964782714844, 0.008623600006103516, 0.009794235229492188, 0.01096487045288086, 0.012135505676269531, 0.013306140899658203, 0.014476776123046875, 0.015647411346435547, 0.01681804656982422, 0.01798868179321289, 0.019159317016601562, 0.020329952239990234, 0.021500587463378906, 0.022671222686767578, 0.02384185791015625, 0.025012493133544922, 0.026183128356933594, 0.027353763580322266, 0.028524398803710938, 0.02969503402709961, 0.03086566925048828, 0.03203630447387695, 0.033206939697265625, 0.0343775749206543, 0.03554821014404297, 0.03671884536743164, 0.03788948059082031, 0.039060115814208984, 0.040230751037597656, 0.04140138626098633, 0.042572021484375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 5.0, 9.0, 18.0, 25.0, 39.0, 52.0, 90.0, 90.0, 86.0, 110.0, 105.0, 95.0, 72.0, 70.0, 55.0, 28.0, 18.0, 17.0, 8.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0278472900390625, -0.02723848819732666, -0.02662968635559082, -0.02602088451385498, -0.02541208267211914, -0.0248032808303833, -0.02419447898864746, -0.02358567714691162, -0.02297687530517578, -0.02236807346343994, -0.0217592716217041, -0.02115046977996826, -0.020541667938232422, -0.019932866096496582, -0.019324064254760742, -0.018715262413024902, -0.018106460571289062, -0.017497658729553223, -0.016888856887817383, -0.016280055046081543, -0.015671253204345703, -0.015062451362609863, -0.014453649520874023, -0.013844847679138184, -0.013236045837402344, -0.012627243995666504, -0.012018442153930664, -0.011409640312194824, -0.010800838470458984, -0.010192036628723145, -0.009583234786987305, -0.008974432945251465, -0.008365631103515625, -0.007756829261779785, -0.007148027420043945, -0.0065392255783081055, -0.005930423736572266, -0.005321621894836426, -0.004712820053100586, -0.004104018211364746, -0.0034952163696289062, -0.0028864145278930664, -0.0022776126861572266, -0.0016688108444213867, -0.0010600090026855469, -0.00045120716094970703, 0.0001575946807861328, 0.0007663965225219727, 0.0013751983642578125, 0.0019840002059936523, 0.002592802047729492, 0.003201603889465332, 0.003810405731201172, 0.004419207572937012, 0.0050280094146728516, 0.005636811256408691, 0.006245613098144531, 0.006854414939880371, 0.007463216781616211, 0.00807201862335205, 0.00868082046508789, 0.00928962230682373, 0.00989842414855957, 0.01050722599029541, 0.01111602783203125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 7.0, 9.0, 28.0, 60.0, 126.0, 245.0, 292.0, 149.0, 51.0, 24.0, 8.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.7293717861175537, -0.7159048914909363, -0.7024379372596741, -0.6889710426330566, -0.6755040884017944, -0.662037193775177, -0.6485702395439148, -0.6351033449172974, -0.6216363906860352, -0.6081694960594177, -0.5947025418281555, -0.5812356472015381, -0.5677686929702759, -0.5543017983436584, -0.5408348441123962, -0.5273679494857788, -0.5139010548591614, -0.500434160232544, -0.48696720600128174, -0.4735002815723419, -0.4600333571434021, -0.44656646251678467, -0.43309953808784485, -0.41963261365890503, -0.4061656892299652, -0.3926987648010254, -0.37923184037208557, -0.36576491594314575, -0.3522980213165283, -0.3388310670852661, -0.3253641724586487, -0.31189724802970886, -0.29843032360076904, -0.2849633991718292, -0.2714964747428894, -0.2580295503139496, -0.24456264078617096, -0.23109571635723114, -0.21762880682945251, -0.2041618824005127, -0.19069497287273407, -0.17722804844379425, -0.16376113891601562, -0.1502942144870758, -0.136827290058136, -0.12336036562919617, -0.10989344865083694, -0.09642653167247772, -0.0829596072435379, -0.06949268281459808, -0.05602576583623886, -0.04255884513258934, -0.02909192442893982, -0.015625, -0.0021580830216407776, 0.011308833956718445, 0.024775758385658264, 0.038242679089307785, 0.051709599792957306, 0.06517651677131653, 0.07864344120025635, 0.09211036562919617, 0.10557728260755539, 0.11904419958591461, 0.13251112401485443]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 14.0, 13.0, 10.0, 13.0, 16.0, 22.0, 20.0, 19.0, 33.0, 30.0, 31.0, 40.0, 38.0, 26.0, 43.0, 27.0, 53.0, 50.0, 36.0, 33.0, 38.0, 40.0, 42.0, 39.0, 32.0, 25.0, 23.0, 26.0, 34.0, 18.0, 14.0, 22.0, 15.0, 12.0, 6.0, 10.0, 10.0, 4.0, 7.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20633375644683838, -0.20029224455356598, -0.19425071775913239, -0.18820920586585999, -0.1821676790714264, -0.176126167178154, -0.1700846552848816, -0.164043128490448, -0.1580016165971756, -0.1519601047039032, -0.1459185779094696, -0.1398770660161972, -0.1338355541229248, -0.1277940273284912, -0.12175251543521881, -0.11571099609136581, -0.10966947674751282, -0.10362795740365982, -0.09758643805980682, -0.09154492616653442, -0.08550340682268143, -0.07946188747882843, -0.07342037558555603, -0.06737885624170303, -0.06133733689785004, -0.05529581755399704, -0.04925430193543434, -0.04321278631687164, -0.037171266973018646, -0.0311297494918108, -0.02508823201060295, -0.019046716392040253, -0.013005197048187256, -0.006963679566979408, -0.0009221620857715607, 0.005119355395436287, 0.011160872876644135, 0.017202390357851982, 0.02324390783905983, 0.029285423457622528, 0.035326942801475525, 0.04136846214532852, 0.04740997776389122, 0.05345149338245392, 0.059493012726306915, 0.06553453207015991, 0.07157604396343231, 0.07761756330728531, 0.0836590826511383, 0.0897006019949913, 0.0957421213388443, 0.1017836332321167, 0.1078251525759697, 0.11386667191982269, 0.11990818381309509, 0.1259497106075287, 0.1319912225008011, 0.1380327343940735, 0.14407426118850708, 0.15011577308177948, 0.15615728497505188, 0.16219881176948547, 0.16824032366275787, 0.17428183555603027, 0.18032336235046387]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 7.0, 11.0, 9.0, 8.0, 12.0, 17.0, 25.0, 30.0, 45.0, 48.0, 71.0, 97.0, 157.0, 235.0, 404.0, 617.0, 1022.0, 1801.0, 3506.0, 7958.0, 22793.0, 101242.0, 585567.0, 1886534.0, 1263603.0, 246248.0, 43808.0, 15285.0, 6953.0, 2763.0, 1429.0, 776.0, 428.0, 276.0, 180.0, 99.0, 66.0, 41.0, 34.0, 17.0, 19.0, 18.0, 10.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0457763671875, -0.04445934295654297, -0.04314231872558594, -0.041825294494628906, -0.040508270263671875, -0.039191246032714844, -0.03787422180175781, -0.03655719757080078, -0.03524017333984375, -0.03392314910888672, -0.03260612487792969, -0.031289100646972656, -0.029972076416015625, -0.028655052185058594, -0.027338027954101562, -0.02602100372314453, -0.0247039794921875, -0.02338695526123047, -0.022069931030273438, -0.020752906799316406, -0.019435882568359375, -0.018118858337402344, -0.016801834106445312, -0.015484809875488281, -0.01416778564453125, -0.012850761413574219, -0.011533737182617188, -0.010216712951660156, -0.008899688720703125, -0.007582664489746094, -0.0062656402587890625, -0.004948616027832031, -0.003631591796875, -0.0023145675659179688, -0.0009975433349609375, 0.00031948089599609375, 0.001636505126953125, 0.0029535293579101562, 0.0042705535888671875, 0.005587577819824219, 0.00690460205078125, 0.008221626281738281, 0.009538650512695312, 0.010855674743652344, 0.012172698974609375, 0.013489723205566406, 0.014806747436523438, 0.01612377166748047, 0.0174407958984375, 0.01875782012939453, 0.020074844360351562, 0.021391868591308594, 0.022708892822265625, 0.024025917053222656, 0.025342941284179688, 0.02665996551513672, 0.02797698974609375, 0.02929401397705078, 0.030611038208007812, 0.031928062438964844, 0.033245086669921875, 0.034562110900878906, 0.03587913513183594, 0.03719615936279297, 0.03851318359375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 1.0, 10.0, 11.0, 13.0, 18.0, 14.0, 22.0, 36.0, 28.0, 42.0, 55.0, 54.0, 57.0, 66.0, 60.0, 78.0, 67.0, 65.0, 51.0, 50.0, 32.0, 24.0, 33.0, 20.0, 19.0, 17.0, 8.0, 11.0, 17.0, 4.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.04998779296875, -0.04863452911376953, -0.04728126525878906, -0.045928001403808594, -0.044574737548828125, -0.043221473693847656, -0.04186820983886719, -0.04051494598388672, -0.03916168212890625, -0.03780841827392578, -0.03645515441894531, -0.035101890563964844, -0.033748626708984375, -0.032395362854003906, -0.031042098999023438, -0.02968883514404297, -0.0283355712890625, -0.02698230743408203, -0.025629043579101562, -0.024275779724121094, -0.022922515869140625, -0.021569252014160156, -0.020215988159179688, -0.01886272430419922, -0.01750946044921875, -0.01615619659423828, -0.014802932739257812, -0.013449668884277344, -0.012096405029296875, -0.010743141174316406, -0.009389877319335938, -0.008036613464355469, -0.006683349609375, -0.005330085754394531, -0.0039768218994140625, -0.0026235580444335938, -0.001270294189453125, 8.296966552734375e-05, 0.0014362335205078125, 0.0027894973754882812, 0.00414276123046875, 0.005496025085449219, 0.0068492889404296875, 0.008202552795410156, 0.009555816650390625, 0.010909080505371094, 0.012262344360351562, 0.013615608215332031, 0.0149688720703125, 0.01632213592529297, 0.017675399780273438, 0.019028663635253906, 0.020381927490234375, 0.021735191345214844, 0.023088455200195312, 0.02444171905517578, 0.02579498291015625, 0.02714824676513672, 0.028501510620117188, 0.029854774475097656, 0.031208038330078125, 0.032561302185058594, 0.03391456604003906, 0.03526782989501953, 0.03662109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 2.0, 5.0, 6.0, 8.0, 14.0, 16.0, 24.0, 30.0, 45.0, 62.0, 113.0, 207.0, 531.0, 1689.0, 10052.0, 568739.0, 3583417.0, 25204.0, 2740.0, 715.0, 287.0, 137.0, 77.0, 54.0, 30.0, 20.0, 17.0, 9.0, 7.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1595458984375, -0.15442657470703125, -0.1493072509765625, -0.14418792724609375, -0.139068603515625, -0.13394927978515625, -0.1288299560546875, -0.12371063232421875, -0.11859130859375, -0.11347198486328125, -0.1083526611328125, -0.10323333740234375, -0.098114013671875, -0.09299468994140625, -0.0878753662109375, -0.08275604248046875, -0.07763671875, -0.07251739501953125, -0.0673980712890625, -0.06227874755859375, -0.057159423828125, -0.05204010009765625, -0.0469207763671875, -0.04180145263671875, -0.03668212890625, -0.03156280517578125, -0.0264434814453125, -0.02132415771484375, -0.016204833984375, -0.01108551025390625, -0.0059661865234375, -0.00084686279296875, 0.0042724609375, 0.00939178466796875, 0.0145111083984375, 0.01963043212890625, 0.024749755859375, 0.02986907958984375, 0.0349884033203125, 0.04010772705078125, 0.04522705078125, 0.05034637451171875, 0.0554656982421875, 0.06058502197265625, 0.065704345703125, 0.07082366943359375, 0.0759429931640625, 0.08106231689453125, 0.086181640625, 0.09130096435546875, 0.0964202880859375, 0.10153961181640625, 0.106658935546875, 0.11177825927734375, 0.1168975830078125, 0.12201690673828125, 0.12713623046875, 0.13225555419921875, 0.1373748779296875, 0.14249420166015625, 0.147613525390625, 0.15273284912109375, 0.1578521728515625, 0.16297149658203125, 0.1680908203125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 3.0, 6.0, 6.0, 9.0, 6.0, 20.0, 21.0, 29.0, 48.0, 76.0, 121.0, 276.0, 638.0, 987.0, 858.0, 424.0, 212.0, 106.0, 69.0, 46.0, 30.0, 20.0, 18.0, 11.0, 16.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.088623046875, -0.0860738754272461, -0.08352470397949219, -0.08097553253173828, -0.07842636108398438, -0.07587718963623047, -0.07332801818847656, -0.07077884674072266, -0.06822967529296875, -0.06568050384521484, -0.06313133239746094, -0.06058216094970703, -0.058032989501953125, -0.05548381805419922, -0.05293464660644531, -0.050385475158691406, -0.0478363037109375, -0.045287132263183594, -0.04273796081542969, -0.04018878936767578, -0.037639617919921875, -0.03509044647216797, -0.03254127502441406, -0.029992103576660156, -0.02744293212890625, -0.024893760681152344, -0.022344589233398438, -0.01979541778564453, -0.017246246337890625, -0.014697074890136719, -0.012147903442382812, -0.009598731994628906, -0.007049560546875, -0.004500389099121094, -0.0019512176513671875, 0.0005979537963867188, 0.003147125244140625, 0.005696296691894531, 0.008245468139648438, 0.010794639587402344, 0.01334381103515625, 0.015892982482910156, 0.018442153930664062, 0.02099132537841797, 0.023540496826171875, 0.02608966827392578, 0.028638839721679688, 0.031188011169433594, 0.0337371826171875, 0.036286354064941406, 0.03883552551269531, 0.04138469696044922, 0.043933868408203125, 0.04648303985595703, 0.04903221130371094, 0.051581382751464844, 0.05413055419921875, 0.056679725646972656, 0.05922889709472656, 0.06177806854248047, 0.06432723999023438, 0.06687641143798828, 0.06942558288574219, 0.0719747543334961, 0.07452392578125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 14.0, 79.0, 289.0, 444.0, 136.0, 30.0, 6.0, 1.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5385679602622986, -0.5131241083145142, -0.4876803159713745, -0.4622364640235901, -0.43679264187812805, -0.411348819732666, -0.3859049677848816, -0.36046114563941956, -0.3350173234939575, -0.3095735013484955, -0.28412967920303345, -0.258685827255249, -0.233242005109787, -0.20779818296432495, -0.18235434591770172, -0.1569105088710785, -0.13146668672561646, -0.10602285712957382, -0.08057902753353119, -0.055135197937488556, -0.029691368341445923, -0.004247546195983887, 0.021196290850639343, 0.04664012789726257, 0.07208395004272461, 0.09752777963876724, 0.12297160923480988, 0.1484154462814331, 0.17385926842689514, 0.19930309057235718, 0.2247469276189804, 0.25019076466560364, 0.27563464641571045, 0.3010784685611725, 0.3265222907066345, 0.35196614265441895, 0.377409964799881, 0.402853786945343, 0.42829763889312744, 0.4537414610385895, 0.4791852831840515, 0.5046291351318359, 0.5300729274749756, 0.55551677942276, 0.5809606313705444, 0.6064044237136841, 0.6318482756614685, 0.6572921276092529, 0.6827359199523926, 0.708179771900177, 0.7336235642433167, 0.7590674161911011, 0.7845112085342407, 0.8099550604820251, 0.8353989124298096, 0.8608427047729492, 0.8862865567207336, 0.9117304086685181, 0.9371742010116577, 0.9626180529594421, 0.9880619049072266, 1.0135056972503662, 1.0389494895935059, 1.064393401145935, 1.0898371934890747]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 5.0, 9.0, 5.0, 14.0, 15.0, 9.0, 15.0, 31.0, 23.0, 29.0, 27.0, 33.0, 37.0, 38.0, 45.0, 51.0, 48.0, 50.0, 34.0, 40.0, 45.0, 39.0, 45.0, 34.0, 38.0, 34.0, 31.0, 23.0, 30.0, 20.0, 16.0, 16.0, 20.0, 9.0, 5.0, 4.0, 10.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14442944526672363, -0.13899552822113037, -0.1335616111755371, -0.12812769412994385, -0.12269377708435059, -0.11725986003875732, -0.11182594299316406, -0.1063920259475708, -0.10095810890197754, -0.09552419185638428, -0.09009027481079102, -0.08465635776519775, -0.07922244071960449, -0.07378852367401123, -0.06835460662841797, -0.06292068958282471, -0.057486772537231445, -0.052052855491638184, -0.04661893844604492, -0.04118502140045166, -0.0357511043548584, -0.030317187309265137, -0.024883270263671875, -0.019449353218078613, -0.014015436172485352, -0.00858151912689209, -0.003147602081298828, 0.0022863149642944336, 0.007720232009887695, 0.013154149055480957, 0.01858806610107422, 0.02402198314666748, 0.029455900192260742, 0.034889817237854004, 0.040323734283447266, 0.04575765132904053, 0.05119156837463379, 0.05662548542022705, 0.06205940246582031, 0.06749331951141357, 0.07292723655700684, 0.0783611536026001, 0.08379507064819336, 0.08922898769378662, 0.09466290473937988, 0.10009682178497314, 0.1055307388305664, 0.11096465587615967, 0.11639857292175293, 0.12183248996734619, 0.12726640701293945, 0.13270032405853271, 0.13813424110412598, 0.14356815814971924, 0.1490020751953125, 0.15443599224090576, 0.15986990928649902, 0.16530382633209229, 0.17073774337768555, 0.1761716604232788, 0.18160557746887207, 0.18703949451446533, 0.1924734115600586, 0.19790732860565186, 0.20334124565124512]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 7.0, 2.0, 9.0, 16.0, 9.0, 19.0, 27.0, 21.0, 40.0, 46.0, 64.0, 68.0, 119.0, 191.0, 264.0, 396.0, 609.0, 1080.0, 1893.0, 3425.0, 6888.0, 14668.0, 33302.0, 84995.0, 228485.0, 359525.0, 188455.0, 70446.0, 27750.0, 12226.0, 6051.0, 3103.0, 1676.0, 955.0, 553.0, 356.0, 242.0, 144.0, 112.0, 78.0, 55.0, 41.0, 38.0, 36.0, 18.0, 16.0, 2.0, 12.0, 8.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0484619140625, -0.0469660758972168, -0.045470237731933594, -0.04397439956665039, -0.04247856140136719, -0.040982723236083984, -0.03948688507080078, -0.03799104690551758, -0.036495208740234375, -0.03499937057495117, -0.03350353240966797, -0.032007694244384766, -0.030511856079101562, -0.02901601791381836, -0.027520179748535156, -0.026024341583251953, -0.02452850341796875, -0.023032665252685547, -0.021536827087402344, -0.02004098892211914, -0.018545150756835938, -0.017049312591552734, -0.015553474426269531, -0.014057636260986328, -0.012561798095703125, -0.011065959930419922, -0.009570121765136719, -0.008074283599853516, -0.0065784454345703125, -0.005082607269287109, -0.0035867691040039062, -0.002090930938720703, -0.0005950927734375, 0.0009007453918457031, 0.0023965835571289062, 0.0038924217224121094, 0.0053882598876953125, 0.006884098052978516, 0.008379936218261719, 0.009875774383544922, 0.011371612548828125, 0.012867450714111328, 0.014363288879394531, 0.015859127044677734, 0.017354965209960938, 0.01885080337524414, 0.020346641540527344, 0.021842479705810547, 0.02333831787109375, 0.024834156036376953, 0.026329994201660156, 0.02782583236694336, 0.029321670532226562, 0.030817508697509766, 0.03231334686279297, 0.03380918502807617, 0.035305023193359375, 0.03680086135864258, 0.03829669952392578, 0.039792537689208984, 0.04128837585449219, 0.04278421401977539, 0.044280052185058594, 0.0457758903503418, 0.047271728515625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 17.0, 20.0, 21.0, 23.0, 44.0, 36.0, 54.0, 51.0, 77.0, 77.0, 74.0, 77.0, 78.0, 78.0, 67.0, 49.0, 40.0, 31.0, 22.0, 15.0, 15.0, 8.0, 7.0, 9.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054779052734375, -0.05324363708496094, -0.051708221435546875, -0.05017280578613281, -0.04863739013671875, -0.04710197448730469, -0.045566558837890625, -0.04403114318847656, -0.0424957275390625, -0.04096031188964844, -0.039424896240234375, -0.03788948059082031, -0.03635406494140625, -0.03481864929199219, -0.033283233642578125, -0.03174781799316406, -0.03021240234375, -0.028676986694335938, -0.027141571044921875, -0.025606155395507812, -0.02407073974609375, -0.022535324096679688, -0.020999908447265625, -0.019464492797851562, -0.0179290771484375, -0.016393661499023438, -0.014858245849609375, -0.013322830200195312, -0.01178741455078125, -0.010251998901367188, -0.008716583251953125, -0.0071811676025390625, -0.005645751953125, -0.0041103363037109375, -0.002574920654296875, -0.0010395050048828125, 0.00049591064453125, 0.0020313262939453125, 0.003566741943359375, 0.0051021575927734375, 0.0066375732421875, 0.008172988891601562, 0.009708404541015625, 0.011243820190429688, 0.01277923583984375, 0.014314651489257812, 0.015850067138671875, 0.017385482788085938, 0.0189208984375, 0.020456314086914062, 0.021991729736328125, 0.023527145385742188, 0.02506256103515625, 0.026597976684570312, 0.028133392333984375, 0.029668807983398438, 0.0312042236328125, 0.03273963928222656, 0.034275054931640625, 0.03581047058105469, 0.03734588623046875, 0.03888130187988281, 0.040416717529296875, 0.04195213317871094, 0.043487548828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 3.0, 5.0, 3.0, 5.0, 3.0, 6.0, 13.0, 13.0, 14.0, 16.0, 21.0, 13.0, 41.0, 39.0, 73.0, 102.0, 163.0, 320.0, 685.0, 1787.0, 6452.0, 33649.0, 297467.0, 612143.0, 78531.0, 12065.0, 2846.0, 975.0, 430.0, 227.0, 133.0, 82.0, 68.0, 35.0, 25.0, 22.0, 24.0, 12.0, 11.0, 11.0, 7.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0982666015625, -0.09501361846923828, -0.09176063537597656, -0.08850765228271484, -0.08525466918945312, -0.0820016860961914, -0.07874870300292969, -0.07549571990966797, -0.07224273681640625, -0.06898975372314453, -0.06573677062988281, -0.062483787536621094, -0.059230804443359375, -0.055977821350097656, -0.05272483825683594, -0.04947185516357422, -0.0462188720703125, -0.04296588897705078, -0.03971290588378906, -0.036459922790527344, -0.033206939697265625, -0.029953956604003906, -0.026700973510742188, -0.02344799041748047, -0.02019500732421875, -0.01694202423095703, -0.013689041137695312, -0.010436058044433594, -0.007183074951171875, -0.003930091857910156, -0.0006771087646484375, 0.0025758743286132812, 0.005828857421875, 0.009081840515136719, 0.012334823608398438, 0.015587806701660156, 0.018840789794921875, 0.022093772888183594, 0.025346755981445312, 0.02859973907470703, 0.03185272216796875, 0.03510570526123047, 0.03835868835449219, 0.041611671447753906, 0.044864654541015625, 0.048117637634277344, 0.05137062072753906, 0.05462360382080078, 0.0578765869140625, 0.06112957000732422, 0.06438255310058594, 0.06763553619384766, 0.07088851928710938, 0.0741415023803711, 0.07739448547363281, 0.08064746856689453, 0.08390045166015625, 0.08715343475341797, 0.09040641784667969, 0.0936594009399414, 0.09691238403320312, 0.10016536712646484, 0.10341835021972656, 0.10667133331298828, 0.10992431640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 3.0, 3.0, 7.0, 13.0, 16.0, 12.0, 15.0, 18.0, 18.0, 24.0, 33.0, 31.0, 27.0, 42.0, 50.0, 33.0, 35.0, 43.0, 30.0, 51.0, 51.0, 51.0, 42.0, 38.0, 39.0, 37.0, 30.0, 34.0, 19.0, 19.0, 24.0, 12.0, 16.0, 19.0, 15.0, 8.0, 12.0, 4.0, 5.0, 4.0, 3.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0770263671875, -0.07472515106201172, -0.07242393493652344, -0.07012271881103516, -0.06782150268554688, -0.0655202865600586, -0.06321907043457031, -0.06091785430908203, -0.05861663818359375, -0.05631542205810547, -0.05401420593261719, -0.051712989807128906, -0.049411773681640625, -0.047110557556152344, -0.04480934143066406, -0.04250812530517578, -0.0402069091796875, -0.03790569305419922, -0.03560447692871094, -0.033303260803222656, -0.031002044677734375, -0.028700828552246094, -0.026399612426757812, -0.02409839630126953, -0.02179718017578125, -0.01949596405029297, -0.017194747924804688, -0.014893531799316406, -0.012592315673828125, -0.010291099548339844, -0.007989883422851562, -0.005688667297363281, -0.003387451171875, -0.0010862350463867188, 0.0012149810791015625, 0.0035161972045898438, 0.005817413330078125, 0.008118629455566406, 0.010419845581054688, 0.012721061706542969, 0.01502227783203125, 0.01732349395751953, 0.019624710083007812, 0.021925926208496094, 0.024227142333984375, 0.026528358459472656, 0.028829574584960938, 0.03113079071044922, 0.0334320068359375, 0.03573322296142578, 0.03803443908691406, 0.040335655212402344, 0.042636871337890625, 0.044938087463378906, 0.04723930358886719, 0.04954051971435547, 0.05184173583984375, 0.05414295196533203, 0.05644416809082031, 0.058745384216308594, 0.061046600341796875, 0.06334781646728516, 0.06564903259277344, 0.06795024871826172, 0.07025146484375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 7.0, 10.0, 6.0, 10.0, 18.0, 15.0, 34.0, 34.0, 39.0, 79.0, 102.0, 139.0, 275.0, 415.0, 755.0, 1355.0, 2784.0, 5537.0, 11549.0, 25277.0, 60290.0, 171414.0, 362629.0, 250366.0, 90037.0, 34601.0, 15468.0, 7371.0, 3615.0, 1893.0, 939.0, 556.0, 311.0, 222.0, 107.0, 88.0, 62.0, 46.0, 27.0, 18.0, 22.0, 9.0, 10.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.009735107421875, -0.009407281875610352, -0.009079456329345703, -0.008751630783081055, -0.008423805236816406, -0.008095979690551758, -0.007768154144287109, -0.007440328598022461, -0.0071125030517578125, -0.006784677505493164, -0.006456851959228516, -0.006129026412963867, -0.005801200866699219, -0.00547337532043457, -0.005145549774169922, -0.0048177242279052734, -0.004489898681640625, -0.0041620731353759766, -0.003834247589111328, -0.0035064220428466797, -0.0031785964965820312, -0.002850770950317383, -0.0025229454040527344, -0.002195119857788086, -0.0018672943115234375, -0.001539468765258789, -0.0012116432189941406, -0.0008838176727294922, -0.0005559921264648438, -0.0002281665802001953, 9.965896606445312e-05, 0.00042748451232910156, 0.00075531005859375, 0.0010831356048583984, 0.0014109611511230469, 0.0017387866973876953, 0.0020666122436523438, 0.002394437789916992, 0.0027222633361816406, 0.003050088882446289, 0.0033779144287109375, 0.003705739974975586, 0.004033565521240234, 0.004361391067504883, 0.004689216613769531, 0.00501704216003418, 0.005344867706298828, 0.0056726932525634766, 0.006000518798828125, 0.0063283443450927734, 0.006656169891357422, 0.00698399543762207, 0.007311820983886719, 0.007639646530151367, 0.007967472076416016, 0.008295297622680664, 0.008623123168945312, 0.008950948715209961, 0.00927877426147461, 0.009606599807739258, 0.009934425354003906, 0.010262250900268555, 0.010590076446533203, 0.010917901992797852, 0.0112457275390625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 5.0, 8.0, 5.0, 15.0, 17.0, 15.0, 13.0, 28.0, 38.0, 38.0, 56.0, 67.0, 73.0, 74.0, 85.0, 65.0, 75.0, 72.0, 59.0, 47.0, 35.0, 31.0, 23.0, 13.0, 14.0, 5.0, 10.0, 9.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.635883331298828e-06, -3.516674041748047e-06, -3.3974647521972656e-06, -3.2782554626464844e-06, -3.159046173095703e-06, -3.039836883544922e-06, -2.9206275939941406e-06, -2.8014183044433594e-06, -2.682209014892578e-06, -2.562999725341797e-06, -2.4437904357910156e-06, -2.3245811462402344e-06, -2.205371856689453e-06, -2.086162567138672e-06, -1.9669532775878906e-06, -1.8477439880371094e-06, -1.7285346984863281e-06, -1.6093254089355469e-06, -1.4901161193847656e-06, -1.3709068298339844e-06, -1.2516975402832031e-06, -1.1324882507324219e-06, -1.0132789611816406e-06, -8.940696716308594e-07, -7.748603820800781e-07, -6.556510925292969e-07, -5.364418029785156e-07, -4.172325134277344e-07, -2.980232238769531e-07, -1.7881393432617188e-07, -5.960464477539063e-08, 5.960464477539063e-08, 1.7881393432617188e-07, 2.980232238769531e-07, 4.172325134277344e-07, 5.364418029785156e-07, 6.556510925292969e-07, 7.748603820800781e-07, 8.940696716308594e-07, 1.0132789611816406e-06, 1.1324882507324219e-06, 1.2516975402832031e-06, 1.3709068298339844e-06, 1.4901161193847656e-06, 1.6093254089355469e-06, 1.7285346984863281e-06, 1.8477439880371094e-06, 1.9669532775878906e-06, 2.086162567138672e-06, 2.205371856689453e-06, 2.3245811462402344e-06, 2.4437904357910156e-06, 2.562999725341797e-06, 2.682209014892578e-06, 2.8014183044433594e-06, 2.9206275939941406e-06, 3.039836883544922e-06, 3.159046173095703e-06, 3.2782554626464844e-06, 3.3974647521972656e-06, 3.516674041748047e-06, 3.635883331298828e-06, 3.7550926208496094e-06, 3.874301910400391e-06, 3.993511199951172e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 9.0, 10.0, 14.0, 28.0, 29.0, 55.0, 67.0, 130.0, 177.0, 356.0, 596.0, 1248.0, 3146.0, 8908.0, 29277.0, 113315.0, 430678.0, 344859.0, 81590.0, 22153.0, 7060.0, 2558.0, 1042.0, 506.0, 287.0, 169.0, 102.0, 49.0, 39.0, 30.0, 16.0, 16.0, 14.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01306915283203125, -0.012564301490783691, -0.012059450149536133, -0.011554598808288574, -0.011049747467041016, -0.010544896125793457, -0.010040044784545898, -0.00953519344329834, -0.009030342102050781, -0.008525490760803223, -0.008020639419555664, -0.0075157880783081055, -0.007010936737060547, -0.006506085395812988, -0.00600123405456543, -0.005496382713317871, -0.0049915313720703125, -0.004486680030822754, -0.003981828689575195, -0.0034769773483276367, -0.002972126007080078, -0.0024672746658325195, -0.001962423324584961, -0.0014575719833374023, -0.0009527206420898438, -0.00044786930084228516, 5.698204040527344e-05, 0.000561833381652832, 0.0010666847229003906, 0.0015715360641479492, 0.002076387405395508, 0.0025812387466430664, 0.003086090087890625, 0.0035909414291381836, 0.004095792770385742, 0.004600644111633301, 0.005105495452880859, 0.005610346794128418, 0.0061151981353759766, 0.006620049476623535, 0.007124900817871094, 0.007629752159118652, 0.008134603500366211, 0.00863945484161377, 0.009144306182861328, 0.009649157524108887, 0.010154008865356445, 0.010658860206604004, 0.011163711547851562, 0.011668562889099121, 0.01217341423034668, 0.012678265571594238, 0.013183116912841797, 0.013687968254089355, 0.014192819595336914, 0.014697670936584473, 0.015202522277832031, 0.01570737361907959, 0.01621222496032715, 0.016717076301574707, 0.017221927642822266, 0.017726778984069824, 0.018231630325317383, 0.01873648166656494, 0.0192413330078125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 9.0, 4.0, 11.0, 10.0, 9.0, 19.0, 7.0, 24.0, 31.0, 27.0, 40.0, 49.0, 47.0, 59.0, 69.0, 77.0, 60.0, 69.0, 55.0, 44.0, 56.0, 38.0, 33.0, 21.0, 29.0, 15.0, 21.0, 15.0, 10.0, 12.0, 6.0, 6.0, 8.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0145416259765625, -0.014160990715026855, -0.013780355453491211, -0.013399720191955566, -0.013019084930419922, -0.012638449668884277, -0.012257814407348633, -0.011877179145812988, -0.011496543884277344, -0.0111159086227417, -0.010735273361206055, -0.01035463809967041, -0.009974002838134766, -0.009593367576599121, -0.009212732315063477, -0.008832097053527832, -0.008451461791992188, -0.008070826530456543, -0.0076901912689208984, -0.007309556007385254, -0.006928920745849609, -0.006548285484313965, -0.00616765022277832, -0.005787014961242676, -0.005406379699707031, -0.005025744438171387, -0.004645109176635742, -0.004264473915100098, -0.003883838653564453, -0.0035032033920288086, -0.003122568130493164, -0.0027419328689575195, -0.002361297607421875, -0.0019806623458862305, -0.001600027084350586, -0.0012193918228149414, -0.0008387565612792969, -0.00045812129974365234, -7.748603820800781e-05, 0.0003031492233276367, 0.0006837844848632812, 0.0010644197463989258, 0.0014450550079345703, 0.0018256902694702148, 0.0022063255310058594, 0.002586960792541504, 0.0029675960540771484, 0.003348231315612793, 0.0037288665771484375, 0.004109501838684082, 0.0044901371002197266, 0.004870772361755371, 0.005251407623291016, 0.00563204288482666, 0.006012678146362305, 0.006393313407897949, 0.006773948669433594, 0.007154583930969238, 0.007535219192504883, 0.007915854454040527, 0.008296489715576172, 0.008677124977111816, 0.009057760238647461, 0.009438395500183105, 0.00981903076171875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 12.0, 17.0, 97.0, 301.0, 440.0, 96.0, 31.0, 7.0, 3.0, 1.0, 2.0], "bins": [-1.073272705078125, -1.0544785261154175, -1.0356844663619995, -1.016890287399292, -0.9980961680412292, -0.9793020486831665, -0.9605079293251038, -0.941713809967041, -0.9229196310043335, -0.9041255116462708, -0.885331392288208, -0.8665372133255005, -0.8477430939674377, -0.828948974609375, -0.8101548552513123, -0.7913607358932495, -0.772566556930542, -0.7537724375724792, -0.7349783182144165, -0.716184139251709, -0.6973900198936462, -0.6785959005355835, -0.6598017811775208, -0.641007661819458, -0.6222135424613953, -0.6034194231033325, -0.5846253037452698, -0.5658311247825623, -0.5470370054244995, -0.5282428860664368, -0.509448766708374, -0.4906546175479889, -0.47186052799224854, -0.4530664086341858, -0.43427225947380066, -0.4154781401157379, -0.3966839909553528, -0.37788987159729004, -0.3590957522392273, -0.34030160307884216, -0.32150745391845703, -0.3027133345603943, -0.28391918540000916, -0.2651250660419464, -0.24633091688156128, -0.22753679752349854, -0.2087426632642746, -0.18994852900505066, -0.17115439474582672, -0.15236026048660278, -0.13356612622737885, -0.1147719994187355, -0.09597786515951157, -0.07718373090028763, -0.05838960409164429, -0.03959546983242035, -0.02080133557319641, -0.0020072031766176224, 0.016786929219961166, 0.035581059753894806, 0.054375194013118744, 0.07316932827234268, 0.09196345508098602, 0.11075758934020996, 0.1295517235994339]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 8.0, 12.0, 8.0, 14.0, 19.0, 18.0, 11.0, 30.0, 32.0, 32.0, 37.0, 43.0, 45.0, 47.0, 43.0, 60.0, 50.0, 47.0, 37.0, 47.0, 56.0, 36.0, 39.0, 32.0, 33.0, 23.0, 32.0, 18.0, 20.0, 15.0, 8.0, 14.0, 7.0, 6.0, 6.0, 1.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.2753797173500061, -0.2681107521057129, -0.26084181666374207, -0.25357285141944885, -0.24630391597747803, -0.23903495073318481, -0.2317660003900528, -0.22449705004692078, -0.21722809970378876, -0.20995914936065674, -0.20269019901752472, -0.1954212486743927, -0.1881522834300995, -0.18088334798812866, -0.17361438274383545, -0.16634543240070343, -0.1590764820575714, -0.1518075317144394, -0.14453858137130737, -0.13726963102817535, -0.13000068068504333, -0.12273172289133072, -0.1154627650976181, -0.10819381475448608, -0.10092486441135406, -0.09365591406822205, -0.08638696372509003, -0.07911800593137741, -0.07184905558824539, -0.06458010524511337, -0.057311151176691055, -0.05004219710826874, -0.04277324676513672, -0.0355042964220047, -0.028235342353582382, -0.020966390147805214, -0.013697437942028046, -0.006428487598896027, 0.0008404664695262909, 0.008109420537948608, 0.015378370881080627, 0.022647323086857796, 0.029916275292634964, 0.03718522936105728, 0.0444541797041893, 0.05172313004732132, 0.05899208411574364, 0.06626103818416595, 0.07352998852729797, 0.08079893887042999, 0.08806788921356201, 0.09533684700727463, 0.10260579735040665, 0.10987474769353867, 0.11714370548725128, 0.1244126558303833, 0.13168160617351532, 0.13895055651664734, 0.14621950685977936, 0.15348845720291138, 0.1607574224472046, 0.16802635788917542, 0.17529532313346863, 0.18256427347660065, 0.18983322381973267]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 7.0, 12.0, 15.0, 27.0, 42.0, 52.0, 103.0, 204.0, 312.0, 627.0, 1411.0, 4020.0, 19581.0, 247884.0, 2733711.0, 1111688.0, 59101.0, 10399.0, 3261.0, 922.0, 394.0, 218.0, 122.0, 55.0, 45.0, 29.0, 15.0, 9.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0843505859375, -0.08211612701416016, -0.07988166809082031, -0.07764720916748047, -0.07541275024414062, -0.07317829132080078, -0.07094383239746094, -0.0687093734741211, -0.06647491455078125, -0.0642404556274414, -0.06200599670410156, -0.05977153778076172, -0.057537078857421875, -0.05530261993408203, -0.05306816101074219, -0.050833702087402344, -0.0485992431640625, -0.046364784240722656, -0.04413032531738281, -0.04189586639404297, -0.039661407470703125, -0.03742694854736328, -0.03519248962402344, -0.032958030700683594, -0.03072357177734375, -0.028489112854003906, -0.026254653930664062, -0.02402019500732422, -0.021785736083984375, -0.01955127716064453, -0.017316818237304688, -0.015082359313964844, -0.012847900390625, -0.010613441467285156, -0.008378982543945312, -0.006144523620605469, -0.003910064697265625, -0.0016756057739257812, 0.0005588531494140625, 0.0027933120727539062, 0.00502777099609375, 0.007262229919433594, 0.009496688842773438, 0.011731147766113281, 0.013965606689453125, 0.01620006561279297, 0.018434524536132812, 0.020668983459472656, 0.0229034423828125, 0.025137901306152344, 0.027372360229492188, 0.02960681915283203, 0.031841278076171875, 0.03407573699951172, 0.03631019592285156, 0.038544654846191406, 0.04077911376953125, 0.043013572692871094, 0.04524803161621094, 0.04748249053955078, 0.049716949462890625, 0.05195140838623047, 0.05418586730957031, 0.056420326232910156, 0.05865478515625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 9.0, 11.0, 10.0, 20.0, 28.0, 30.0, 43.0, 51.0, 54.0, 66.0, 68.0, 74.0, 82.0, 63.0, 69.0, 60.0, 56.0, 43.0, 38.0, 33.0, 25.0, 19.0, 12.0, 10.0, 11.0, 5.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.06634521484375, -0.06473875045776367, -0.06313228607177734, -0.061525821685791016, -0.05991935729980469, -0.05831289291381836, -0.05670642852783203, -0.0550999641418457, -0.053493499755859375, -0.05188703536987305, -0.05028057098388672, -0.04867410659790039, -0.04706764221191406, -0.045461177825927734, -0.043854713439941406, -0.04224824905395508, -0.04064178466796875, -0.03903532028198242, -0.037428855895996094, -0.035822391510009766, -0.03421592712402344, -0.03260946273803711, -0.03100299835205078, -0.029396533966064453, -0.027790069580078125, -0.026183605194091797, -0.02457714080810547, -0.02297067642211914, -0.021364212036132812, -0.019757747650146484, -0.018151283264160156, -0.016544818878173828, -0.0149383544921875, -0.013331890106201172, -0.011725425720214844, -0.010118961334228516, -0.008512496948242188, -0.006906032562255859, -0.005299568176269531, -0.003693103790283203, -0.002086639404296875, -0.0004801750183105469, 0.0011262893676757812, 0.0027327537536621094, 0.0043392181396484375, 0.005945682525634766, 0.007552146911621094, 0.009158611297607422, 0.01076507568359375, 0.012371540069580078, 0.013978004455566406, 0.015584468841552734, 0.017190933227539062, 0.01879739761352539, 0.02040386199951172, 0.022010326385498047, 0.023616790771484375, 0.025223255157470703, 0.02682971954345703, 0.02843618392944336, 0.030042648315429688, 0.031649112701416016, 0.033255577087402344, 0.03486204147338867, 0.036468505859375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 9.0, 14.0, 11.0, 46.0, 77.0, 143.0, 315.0, 659.0, 2242.0, 26089.0, 2904105.0, 1241198.0, 16367.0, 1788.0, 600.0, 289.0, 152.0, 68.0, 49.0, 21.0, 20.0, 7.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09918212890625, -0.09520244598388672, -0.09122276306152344, -0.08724308013916016, -0.08326339721679688, -0.0792837142944336, -0.07530403137207031, -0.07132434844970703, -0.06734466552734375, -0.06336498260498047, -0.05938529968261719, -0.055405616760253906, -0.051425933837890625, -0.047446250915527344, -0.04346656799316406, -0.03948688507080078, -0.0355072021484375, -0.03152751922607422, -0.027547836303710938, -0.023568153381347656, -0.019588470458984375, -0.015608787536621094, -0.011629104614257812, -0.007649421691894531, -0.00366973876953125, 0.00030994415283203125, 0.0042896270751953125, 0.008269309997558594, 0.012248992919921875, 0.016228675842285156, 0.020208358764648438, 0.02418804168701172, 0.028167724609375, 0.03214740753173828, 0.03612709045410156, 0.040106773376464844, 0.044086456298828125, 0.048066139221191406, 0.05204582214355469, 0.05602550506591797, 0.06000518798828125, 0.06398487091064453, 0.06796455383300781, 0.0719442367553711, 0.07592391967773438, 0.07990360260009766, 0.08388328552246094, 0.08786296844482422, 0.0918426513671875, 0.09582233428955078, 0.09980201721191406, 0.10378170013427734, 0.10776138305664062, 0.1117410659790039, 0.11572074890136719, 0.11970043182373047, 0.12368011474609375, 0.12765979766845703, 0.1316394805908203, 0.1356191635131836, 0.13959884643554688, 0.14357852935791016, 0.14755821228027344, 0.15153789520263672, 0.155517578125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 16.0, 14.0, 34.0, 43.0, 79.0, 124.0, 371.0, 979.0, 1205.0, 631.0, 233.0, 119.0, 88.0, 46.0, 36.0, 20.0, 16.0, 6.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06396484375, -0.061209678649902344, -0.05845451354980469, -0.05569934844970703, -0.052944183349609375, -0.05018901824951172, -0.04743385314941406, -0.044678688049316406, -0.04192352294921875, -0.039168357849121094, -0.03641319274902344, -0.03365802764892578, -0.030902862548828125, -0.02814769744873047, -0.025392532348632812, -0.022637367248535156, -0.0198822021484375, -0.017127037048339844, -0.014371871948242188, -0.011616706848144531, -0.008861541748046875, -0.006106376647949219, -0.0033512115478515625, -0.0005960464477539062, 0.00215911865234375, 0.004914283752441406, 0.0076694488525390625, 0.010424613952636719, 0.013179779052734375, 0.01593494415283203, 0.018690109252929688, 0.021445274353027344, 0.024200439453125, 0.026955604553222656, 0.029710769653320312, 0.03246593475341797, 0.035221099853515625, 0.03797626495361328, 0.04073143005371094, 0.043486595153808594, 0.04624176025390625, 0.048996925354003906, 0.05175209045410156, 0.05450725555419922, 0.057262420654296875, 0.06001758575439453, 0.06277275085449219, 0.06552791595458984, 0.0682830810546875, 0.07103824615478516, 0.07379341125488281, 0.07654857635498047, 0.07930374145507812, 0.08205890655517578, 0.08481407165527344, 0.0875692367553711, 0.09032440185546875, 0.0930795669555664, 0.09583473205566406, 0.09858989715576172, 0.10134506225585938, 0.10410022735595703, 0.10685539245605469, 0.10961055755615234, 0.11236572265625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 128.0, 732.0, 123.0, 11.0, 4.0, 6.0, 3.0, 2.0, 4.0, 1.0], "bins": [-2.2881312370300293, -2.246814012527466, -2.2054970264434814, -2.164179801940918, -2.1228628158569336, -2.08154559135437, -2.0402286052703857, -1.9989113807678223, -1.9575942754745483, -1.9162771701812744, -1.8749600648880005, -1.8336429595947266, -1.792325735092163, -1.7510086297988892, -1.7096915245056152, -1.6683744192123413, -1.6270573139190674, -1.5857402086257935, -1.5444231033325195, -1.5031059980392456, -1.4617888927459717, -1.4204716682434082, -1.3791545629501343, -1.3378374576568604, -1.2965203523635864, -1.2552032470703125, -1.2138861417770386, -1.1725690364837646, -1.1312518119812012, -1.0899347066879272, -1.0486176013946533, -1.0073004961013794, -0.9659834504127502, -0.9246663451194763, -0.8833491802215576, -0.8420320749282837, -0.8007149696350098, -0.7593978643417358, -0.7180807590484619, -0.6767635941505432, -0.6354464888572693, -0.5941293835639954, -0.5528122186660767, -0.5114951133728027, -0.4701780080795288, -0.4288609027862549, -0.38754376769065857, -0.34622663259506226, -0.30490952730178833, -0.2635924220085144, -0.2222752869129181, -0.18095816671848297, -0.13964104652404785, -0.09832392632961273, -0.05700680613517761, -0.0156896710395813, 0.025627434253692627, 0.06694455444812775, 0.10826167464256287, 0.14957879483699799, 0.1908959150314331, 0.23221303522586823, 0.27353015542030334, 0.31484729051589966, 0.3561643958091736]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 9.0, 9.0, 11.0, 12.0, 7.0, 14.0, 22.0, 21.0, 26.0, 14.0, 32.0, 47.0, 32.0, 55.0, 47.0, 55.0, 48.0, 47.0, 36.0, 49.0, 48.0, 34.0, 38.0, 46.0, 40.0, 33.0, 32.0, 18.0, 22.0, 14.0, 10.0, 16.0, 19.0, 10.0, 11.0, 5.0, 1.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13735860586166382, -0.13228356838226318, -0.12720853090286255, -0.12213349342346191, -0.11705845594406128, -0.11198341846466064, -0.1069083884358406, -0.10183335095643997, -0.09675831347703934, -0.0916832759976387, -0.08660823851823807, -0.08153320103883743, -0.0764581710100174, -0.07138313353061676, -0.06630809605121613, -0.06123305857181549, -0.056158021092414856, -0.05108298361301422, -0.046007946133613586, -0.04093291237950325, -0.035857874900102615, -0.03078283742070198, -0.025707801803946495, -0.02063276618719101, -0.015557728707790375, -0.010482692159712315, -0.0054076556116342545, -0.0003326190635561943, 0.004742417484521866, 0.0098174549639225, 0.014892490580677986, 0.01996752619743347, 0.025042563676834106, 0.03011760115623474, 0.035192638635635376, 0.04026767238974571, 0.04534270986914635, 0.05041774734854698, 0.05549278110265732, 0.06056781858205795, 0.06564285606145859, 0.07071789354085922, 0.07579293102025986, 0.08086796849966049, 0.08594299852848053, 0.09101803600788116, 0.0960930734872818, 0.10116811096668243, 0.10624314844608307, 0.1113181859254837, 0.11639322340488434, 0.12146826088428497, 0.1265432983636856, 0.13161833584308624, 0.13669337332248688, 0.14176839590072632, 0.14684343338012695, 0.1519184708595276, 0.15699350833892822, 0.16206854581832886, 0.1671435832977295, 0.17221862077713013, 0.17729365825653076, 0.1823686957359314, 0.18744373321533203]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 9.0, 12.0, 18.0, 39.0, 32.0, 64.0, 88.0, 116.0, 176.0, 275.0, 422.0, 653.0, 1153.0, 2191.0, 4412.0, 9966.0, 25384.0, 73993.0, 232078.0, 402831.0, 193610.0, 61898.0, 21840.0, 8694.0, 3792.0, 1906.0, 1088.0, 667.0, 347.0, 264.0, 153.0, 115.0, 64.0, 50.0, 41.0, 33.0, 19.0, 16.0, 13.0, 8.0, 3.0, 8.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.042236328125, -0.0408477783203125, -0.039459228515625, -0.0380706787109375, -0.03668212890625, -0.0352935791015625, -0.033905029296875, -0.0325164794921875, -0.0311279296875, -0.0297393798828125, -0.028350830078125, -0.0269622802734375, -0.02557373046875, -0.0241851806640625, -0.022796630859375, -0.0214080810546875, -0.02001953125, -0.0186309814453125, -0.017242431640625, -0.0158538818359375, -0.01446533203125, -0.0130767822265625, -0.011688232421875, -0.0102996826171875, -0.0089111328125, -0.0075225830078125, -0.006134033203125, -0.0047454833984375, -0.00335693359375, -0.0019683837890625, -0.000579833984375, 0.0008087158203125, 0.002197265625, 0.0035858154296875, 0.004974365234375, 0.0063629150390625, 0.00775146484375, 0.0091400146484375, 0.010528564453125, 0.0119171142578125, 0.0133056640625, 0.0146942138671875, 0.016082763671875, 0.0174713134765625, 0.01885986328125, 0.0202484130859375, 0.021636962890625, 0.0230255126953125, 0.0244140625, 0.0258026123046875, 0.027191162109375, 0.0285797119140625, 0.02996826171875, 0.0313568115234375, 0.032745361328125, 0.0341339111328125, 0.0355224609375, 0.0369110107421875, 0.038299560546875, 0.0396881103515625, 0.04107666015625, 0.0424652099609375, 0.043853759765625, 0.0452423095703125, 0.046630859375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 5.0, 6.0, 8.0, 11.0, 19.0, 19.0, 32.0, 50.0, 50.0, 55.0, 61.0, 73.0, 86.0, 89.0, 64.0, 62.0, 69.0, 51.0, 47.0, 36.0, 25.0, 25.0, 20.0, 8.0, 11.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.059539794921875, -0.05809307098388672, -0.05664634704589844, -0.055199623107910156, -0.053752899169921875, -0.052306175231933594, -0.05085945129394531, -0.04941272735595703, -0.04796600341796875, -0.04651927947998047, -0.04507255554199219, -0.043625831604003906, -0.042179107666015625, -0.040732383728027344, -0.03928565979003906, -0.03783893585205078, -0.0363922119140625, -0.03494548797607422, -0.03349876403808594, -0.032052040100097656, -0.030605316162109375, -0.029158592224121094, -0.027711868286132812, -0.02626514434814453, -0.02481842041015625, -0.02337169647216797, -0.021924972534179688, -0.020478248596191406, -0.019031524658203125, -0.017584800720214844, -0.016138076782226562, -0.014691352844238281, -0.01324462890625, -0.011797904968261719, -0.010351181030273438, -0.008904457092285156, -0.007457733154296875, -0.006011009216308594, -0.0045642852783203125, -0.0031175613403320312, -0.00167083740234375, -0.00022411346435546875, 0.0012226104736328125, 0.0026693344116210938, 0.004116058349609375, 0.005562782287597656, 0.0070095062255859375, 0.008456230163574219, 0.0099029541015625, 0.011349678039550781, 0.012796401977539062, 0.014243125915527344, 0.015689849853515625, 0.017136573791503906, 0.018583297729492188, 0.02003002166748047, 0.02147674560546875, 0.02292346954345703, 0.024370193481445312, 0.025816917419433594, 0.027263641357421875, 0.028710365295410156, 0.030157089233398438, 0.03160381317138672, 0.033050537109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 4.0, 6.0, 7.0, 7.0, 11.0, 12.0, 14.0, 12.0, 25.0, 22.0, 32.0, 40.0, 72.0, 91.0, 156.0, 361.0, 840.0, 2773.0, 12700.0, 84956.0, 639063.0, 268525.0, 30564.0, 5661.0, 1439.0, 527.0, 224.0, 115.0, 68.0, 50.0, 37.0, 20.0, 17.0, 16.0, 16.0, 14.0, 15.0, 11.0, 4.0, 7.0, 8.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.08563232421875, -0.08301734924316406, -0.08040237426757812, -0.07778739929199219, -0.07517242431640625, -0.07255744934082031, -0.06994247436523438, -0.06732749938964844, -0.0647125244140625, -0.06209754943847656, -0.059482574462890625, -0.05686759948730469, -0.05425262451171875, -0.05163764953613281, -0.049022674560546875, -0.04640769958496094, -0.043792724609375, -0.04117774963378906, -0.038562774658203125, -0.03594779968261719, -0.03333282470703125, -0.030717849731445312, -0.028102874755859375, -0.025487899780273438, -0.0228729248046875, -0.020257949829101562, -0.017642974853515625, -0.015027999877929688, -0.01241302490234375, -0.009798049926757812, -0.007183074951171875, -0.0045680999755859375, -0.001953125, 0.0006618499755859375, 0.003276824951171875, 0.0058917999267578125, 0.00850677490234375, 0.011121749877929688, 0.013736724853515625, 0.016351699829101562, 0.0189666748046875, 0.021581649780273438, 0.024196624755859375, 0.026811599731445312, 0.02942657470703125, 0.03204154968261719, 0.034656524658203125, 0.03727149963378906, 0.039886474609375, 0.04250144958496094, 0.045116424560546875, 0.04773139953613281, 0.05034637451171875, 0.05296134948730469, 0.055576324462890625, 0.05819129943847656, 0.0608062744140625, 0.06342124938964844, 0.06603622436523438, 0.06865119934082031, 0.07126617431640625, 0.07388114929199219, 0.07649612426757812, 0.07911109924316406, 0.08172607421875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 8.0, 2.0, 7.0, 7.0, 11.0, 10.0, 14.0, 15.0, 14.0, 12.0, 10.0, 25.0, 27.0, 21.0, 26.0, 31.0, 30.0, 33.0, 46.0, 35.0, 40.0, 41.0, 41.0, 37.0, 44.0, 43.0, 37.0, 42.0, 37.0, 36.0, 37.0, 29.0, 24.0, 23.0, 13.0, 20.0, 15.0, 13.0, 7.0, 9.0, 10.0, 6.0, 5.0, 2.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.056427001953125, -0.05462169647216797, -0.05281639099121094, -0.051011085510253906, -0.049205780029296875, -0.047400474548339844, -0.04559516906738281, -0.04378986358642578, -0.04198455810546875, -0.04017925262451172, -0.03837394714355469, -0.036568641662597656, -0.034763336181640625, -0.032958030700683594, -0.031152725219726562, -0.02934741973876953, -0.0275421142578125, -0.02573680877685547, -0.023931503295898438, -0.022126197814941406, -0.020320892333984375, -0.018515586853027344, -0.016710281372070312, -0.014904975891113281, -0.01309967041015625, -0.011294364929199219, -0.009489059448242188, -0.007683753967285156, -0.005878448486328125, -0.004073143005371094, -0.0022678375244140625, -0.00046253204345703125, 0.0013427734375, 0.0031480789184570312, 0.0049533843994140625, 0.006758689880371094, 0.008563995361328125, 0.010369300842285156, 0.012174606323242188, 0.013979911804199219, 0.01578521728515625, 0.01759052276611328, 0.019395828247070312, 0.021201133728027344, 0.023006439208984375, 0.024811744689941406, 0.026617050170898438, 0.02842235565185547, 0.0302276611328125, 0.03203296661376953, 0.03383827209472656, 0.035643577575683594, 0.037448883056640625, 0.039254188537597656, 0.04105949401855469, 0.04286479949951172, 0.04467010498046875, 0.04647541046142578, 0.04828071594238281, 0.050086021423339844, 0.051891326904296875, 0.053696632385253906, 0.05550193786621094, 0.05730724334716797, 0.059112548828125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 16.0, 19.0, 20.0, 36.0, 89.0, 132.0, 240.0, 397.0, 767.0, 1541.0, 3280.0, 7147.0, 16558.0, 38628.0, 89749.0, 182319.0, 264445.0, 223901.0, 122630.0, 54652.0, 23316.0, 9953.0, 4482.0, 2082.0, 999.0, 479.0, 268.0, 155.0, 95.0, 39.0, 30.0, 26.0, 20.0, 14.0, 8.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007083892822265625, -0.006879746913909912, -0.006675601005554199, -0.006471455097198486, -0.0062673091888427734, -0.0060631632804870605, -0.005859017372131348, -0.005654871463775635, -0.005450725555419922, -0.005246579647064209, -0.005042433738708496, -0.004838287830352783, -0.00463414192199707, -0.004429996013641357, -0.0042258501052856445, -0.004021704196929932, -0.0038175582885742188, -0.003613412380218506, -0.003409266471862793, -0.00320512056350708, -0.003000974655151367, -0.0027968287467956543, -0.0025926828384399414, -0.0023885369300842285, -0.0021843910217285156, -0.0019802451133728027, -0.0017760992050170898, -0.001571953296661377, -0.001367807388305664, -0.0011636614799499512, -0.0009595155715942383, -0.0007553696632385254, -0.0005512237548828125, -0.0003470778465270996, -0.00014293193817138672, 6.121397018432617e-05, 0.00026535987854003906, 0.00046950578689575195, 0.0006736516952514648, 0.0008777976036071777, 0.0010819435119628906, 0.0012860894203186035, 0.0014902353286743164, 0.0016943812370300293, 0.0018985271453857422, 0.002102673053741455, 0.002306818962097168, 0.002510964870452881, 0.0027151107788085938, 0.0029192566871643066, 0.0031234025955200195, 0.0033275485038757324, 0.0035316944122314453, 0.003735840320587158, 0.003939986228942871, 0.004144132137298584, 0.004348278045654297, 0.00455242395401001, 0.004756569862365723, 0.0049607157707214355, 0.0051648616790771484, 0.005369007587432861, 0.005573153495788574, 0.005777299404144287, 0.0059814453125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 10.0, 1.0, 5.0, 4.0, 6.0, 9.0, 21.0, 20.0, 17.0, 20.0, 17.0, 19.0, 53.0, 39.0, 39.0, 43.0, 29.0, 46.0, 83.0, 53.0, 39.0, 46.0, 42.0, 67.0, 42.0, 25.0, 27.0, 27.0, 22.0, 32.0, 19.0, 21.0, 8.0, 12.0, 4.0, 16.0, 8.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1457672119140625e-06, -2.0759180188179016e-06, -2.0060688257217407e-06, -1.93621963262558e-06, -1.866370439529419e-06, -1.796521246433258e-06, -1.7266720533370972e-06, -1.6568228602409363e-06, -1.5869736671447754e-06, -1.5171244740486145e-06, -1.4472752809524536e-06, -1.3774260878562927e-06, -1.3075768947601318e-06, -1.237727701663971e-06, -1.16787850856781e-06, -1.0980293154716492e-06, -1.0281801223754883e-06, -9.583309292793274e-07, -8.884817361831665e-07, -8.186325430870056e-07, -7.487833499908447e-07, -6.789341568946838e-07, -6.09084963798523e-07, -5.392357707023621e-07, -4.6938657760620117e-07, -3.995373845100403e-07, -3.296881914138794e-07, -2.598389983177185e-07, -1.8998980522155762e-07, -1.2014061212539673e-07, -5.029141902923584e-08, 1.955777406692505e-08, 8.940696716308594e-08, 1.5925616025924683e-07, 2.2910535335540771e-07, 2.989545464515686e-07, 3.688037395477295e-07, 4.386529326438904e-07, 5.085021257400513e-07, 5.783513188362122e-07, 6.48200511932373e-07, 7.180497050285339e-07, 7.878988981246948e-07, 8.577480912208557e-07, 9.275972843170166e-07, 9.974464774131775e-07, 1.0672956705093384e-06, 1.1371448636054993e-06, 1.2069940567016602e-06, 1.276843249797821e-06, 1.346692442893982e-06, 1.4165416359901428e-06, 1.4863908290863037e-06, 1.5562400221824646e-06, 1.6260892152786255e-06, 1.6959384083747864e-06, 1.7657876014709473e-06, 1.8356367945671082e-06, 1.905485987663269e-06, 1.97533518075943e-06, 2.045184373855591e-06, 2.1150335669517517e-06, 2.1848827600479126e-06, 2.2547319531440735e-06, 2.3245811462402344e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 9.0, 9.0, 17.0, 16.0, 49.0, 90.0, 189.0, 483.0, 1686.0, 8096.0, 57368.0, 366586.0, 495704.0, 101084.0, 13634.0, 2415.0, 626.0, 245.0, 125.0, 47.0, 28.0, 10.0, 5.0, 5.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012603759765625, -0.012102365493774414, -0.011600971221923828, -0.011099576950073242, -0.010598182678222656, -0.01009678840637207, -0.009595394134521484, -0.009093999862670898, -0.008592605590820312, -0.008091211318969727, -0.007589817047119141, -0.007088422775268555, -0.006587028503417969, -0.006085634231567383, -0.005584239959716797, -0.005082845687866211, -0.004581451416015625, -0.004080057144165039, -0.003578662872314453, -0.003077268600463867, -0.0025758743286132812, -0.0020744800567626953, -0.0015730857849121094, -0.0010716915130615234, -0.0005702972412109375, -6.890296936035156e-05, 0.0004324913024902344, 0.0009338855743408203, 0.0014352798461914062, 0.0019366741180419922, 0.002438068389892578, 0.002939462661743164, 0.00344085693359375, 0.003942251205444336, 0.004443645477294922, 0.004945039749145508, 0.005446434020996094, 0.00594782829284668, 0.006449222564697266, 0.0069506168365478516, 0.0074520111083984375, 0.007953405380249023, 0.00845479965209961, 0.008956193923950195, 0.009457588195800781, 0.009958982467651367, 0.010460376739501953, 0.010961771011352539, 0.011463165283203125, 0.011964559555053711, 0.012465953826904297, 0.012967348098754883, 0.013468742370605469, 0.013970136642456055, 0.01447153091430664, 0.014972925186157227, 0.015474319458007812, 0.0159757137298584, 0.016477108001708984, 0.01697850227355957, 0.017479896545410156, 0.017981290817260742, 0.018482685089111328, 0.018984079360961914, 0.0194854736328125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 6.0, 4.0, 6.0, 9.0, 13.0, 23.0, 23.0, 25.0, 45.0, 34.0, 58.0, 55.0, 75.0, 79.0, 95.0, 79.0, 77.0, 60.0, 62.0, 42.0, 29.0, 40.0, 13.0, 11.0, 10.0, 8.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013916015625, -0.013561844825744629, -0.013207674026489258, -0.012853503227233887, -0.012499332427978516, -0.012145161628723145, -0.011790990829467773, -0.011436820030212402, -0.011082649230957031, -0.01072847843170166, -0.010374307632446289, -0.010020136833190918, -0.009665966033935547, -0.009311795234680176, -0.008957624435424805, -0.008603453636169434, -0.008249282836914062, -0.007895112037658691, -0.00754094123840332, -0.007186770439147949, -0.006832599639892578, -0.006478428840637207, -0.006124258041381836, -0.005770087242126465, -0.005415916442871094, -0.005061745643615723, -0.0047075748443603516, -0.0043534040451049805, -0.003999233245849609, -0.0036450624465942383, -0.003290891647338867, -0.002936720848083496, -0.002582550048828125, -0.002228379249572754, -0.0018742084503173828, -0.0015200376510620117, -0.0011658668518066406, -0.0008116960525512695, -0.00045752525329589844, -0.00010335445404052734, 0.00025081634521484375, 0.0006049871444702148, 0.0009591579437255859, 0.001313328742980957, 0.0016674995422363281, 0.0020216703414916992, 0.0023758411407470703, 0.0027300119400024414, 0.0030841827392578125, 0.0034383535385131836, 0.0037925243377685547, 0.004146695137023926, 0.004500865936279297, 0.004855036735534668, 0.005209207534790039, 0.00556337833404541, 0.005917549133300781, 0.006271719932556152, 0.0066258907318115234, 0.0069800615310668945, 0.007334232330322266, 0.007688403129577637, 0.008042573928833008, 0.008396744728088379, 0.00875091552734375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 11.0, 49.0, 132.0, 370.0, 331.0, 78.0, 22.0, 10.0, 4.0, 1.0], "bins": [-0.8570353388786316, -0.8422336578369141, -0.8274319767951965, -0.812630295753479, -0.7978286147117615, -0.783026933670044, -0.7682251930236816, -0.7534235119819641, -0.7386218309402466, -0.723820149898529, -0.7090184688568115, -0.694216787815094, -0.6794151067733765, -0.6646133661270142, -0.6498117446899414, -0.6350100040435791, -0.6202083826065063, -0.6054067015647888, -0.5906050205230713, -0.5758033394813538, -0.5610016584396362, -0.5461999177932739, -0.5313982963562012, -0.5165965557098389, -0.5017948746681213, -0.4869931936264038, -0.4721915125846863, -0.45738983154296875, -0.44258812069892883, -0.4277864396572113, -0.4129847586154938, -0.39818307757377625, -0.38338136672973633, -0.3685796856880188, -0.35377800464630127, -0.33897632360458374, -0.3241746127605438, -0.3093729317188263, -0.29457125067710876, -0.27976956963539124, -0.2649678587913513, -0.2501661777496338, -0.23536448180675507, -0.22056280076503754, -0.2057611048221588, -0.19095942378044128, -0.17615774273872375, -0.16135606169700623, -0.1465543657541275, -0.13175268471240997, -0.11695098876953125, -0.10214930772781372, -0.0873476192355156, -0.07254593074321747, -0.05774424970149994, -0.04294256120920181, -0.028140872716903687, -0.01333918608725071, 0.0014625005424022675, 0.016264185309410095, 0.03106587380170822, 0.04586756229400635, 0.06066924333572388, 0.075470931828022, 0.09027262032032013]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 7.0, 8.0, 7.0, 16.0, 15.0, 9.0, 17.0, 14.0, 21.0, 17.0, 30.0, 29.0, 32.0, 33.0, 37.0, 34.0, 31.0, 31.0, 34.0, 28.0, 33.0, 43.0, 49.0, 34.0, 38.0, 40.0, 36.0, 34.0, 33.0, 24.0, 26.0, 23.0, 16.0, 16.0, 14.0, 19.0, 10.0, 7.0, 11.0, 6.0, 6.0, 4.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.15890008211135864, -0.15406078100204468, -0.14922146499156952, -0.14438216388225555, -0.1395428478717804, -0.13470354676246643, -0.12986423075199127, -0.1250249296426773, -0.12018562108278275, -0.11534631252288818, -0.11050700396299362, -0.10566769540309906, -0.1008283942937851, -0.09598907828330994, -0.09114977717399597, -0.08631046861410141, -0.08147116005420685, -0.07663185149431229, -0.07179254293441772, -0.06695323437452316, -0.0621139295399189, -0.05727462098002434, -0.052435316145420074, -0.04759600758552551, -0.04275669902563095, -0.03791739046573639, -0.03307808190584183, -0.028238777071237564, -0.023399468511343002, -0.01856015995144844, -0.013720853254199028, -0.008881546556949615, -0.004042237997055054, 0.0007970696315169334, 0.005636377260088921, 0.010475684888660908, 0.015314992517232895, 0.020154301077127457, 0.02499360777437687, 0.029832914471626282, 0.034672223031520844, 0.039511531591415405, 0.04435084015130997, 0.04919014498591423, 0.05402945354580879, 0.058868762105703354, 0.06370806694030762, 0.06854737550020218, 0.07338668406009674, 0.0782259926199913, 0.08306530117988586, 0.08790460973978043, 0.09274391829967499, 0.09758321940898895, 0.10242252796888351, 0.10726183652877808, 0.11210114508867264, 0.1169404536485672, 0.12177976220846176, 0.12661907076835632, 0.1314583718776703, 0.13629768788814545, 0.1411369889974594, 0.14597630500793457, 0.15081560611724854]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 6.0, 9.0, 7.0, 28.0, 32.0, 48.0, 104.0, 148.0, 349.0, 978.0, 4665.0, 30127.0, 714549.0, 3006138.0, 402902.0, 24253.0, 6362.0, 2707.0, 471.0, 171.0, 97.0, 48.0, 20.0, 15.0, 10.0, 9.0, 5.0, 3.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.058013916015625, -0.05622434616088867, -0.054434776306152344, -0.052645206451416016, -0.05085563659667969, -0.04906606674194336, -0.04727649688720703, -0.0454869270324707, -0.043697357177734375, -0.04190778732299805, -0.04011821746826172, -0.03832864761352539, -0.03653907775878906, -0.034749507904052734, -0.032959938049316406, -0.031170368194580078, -0.02938079833984375, -0.027591228485107422, -0.025801658630371094, -0.024012088775634766, -0.022222518920898438, -0.02043294906616211, -0.01864337921142578, -0.016853809356689453, -0.015064239501953125, -0.013274669647216797, -0.011485099792480469, -0.00969552993774414, -0.007905960083007812, -0.006116390228271484, -0.004326820373535156, -0.002537250518798828, -0.0007476806640625, 0.0010418891906738281, 0.0028314590454101562, 0.004621028900146484, 0.0064105987548828125, 0.00820016860961914, 0.009989738464355469, 0.011779308319091797, 0.013568878173828125, 0.015358448028564453, 0.01714801788330078, 0.01893758773803711, 0.020727157592773438, 0.022516727447509766, 0.024306297302246094, 0.026095867156982422, 0.02788543701171875, 0.029675006866455078, 0.031464576721191406, 0.033254146575927734, 0.03504371643066406, 0.03683328628540039, 0.03862285614013672, 0.04041242599487305, 0.042201995849609375, 0.0439915657043457, 0.04578113555908203, 0.04757070541381836, 0.04936027526855469, 0.051149845123291016, 0.052939414978027344, 0.05472898483276367, 0.0565185546875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 11.0, 6.0, 16.0, 17.0, 16.0, 46.0, 46.0, 64.0, 84.0, 84.0, 88.0, 75.0, 79.0, 73.0, 64.0, 56.0, 45.0, 38.0, 25.0, 26.0, 13.0, 7.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06317138671875, -0.061519622802734375, -0.05986785888671875, -0.058216094970703125, -0.0565643310546875, -0.054912567138671875, -0.05326080322265625, -0.051609039306640625, -0.049957275390625, -0.048305511474609375, -0.04665374755859375, -0.045001983642578125, -0.0433502197265625, -0.041698455810546875, -0.04004669189453125, -0.038394927978515625, -0.0367431640625, -0.035091400146484375, -0.03343963623046875, -0.031787872314453125, -0.0301361083984375, -0.028484344482421875, -0.02683258056640625, -0.025180816650390625, -0.023529052734375, -0.021877288818359375, -0.02022552490234375, -0.018573760986328125, -0.0169219970703125, -0.015270233154296875, -0.01361846923828125, -0.011966705322265625, -0.01031494140625, -0.008663177490234375, -0.00701141357421875, -0.005359649658203125, -0.0037078857421875, -0.002056121826171875, -0.00040435791015625, 0.001247406005859375, 0.002899169921875, 0.004550933837890625, 0.00620269775390625, 0.007854461669921875, 0.0095062255859375, 0.011157989501953125, 0.01280975341796875, 0.014461517333984375, 0.01611328125, 0.017765045166015625, 0.01941680908203125, 0.021068572998046875, 0.0227203369140625, 0.024372100830078125, 0.02602386474609375, 0.027675628662109375, 0.029327392578125, 0.030979156494140625, 0.03263092041015625, 0.034282684326171875, 0.0359344482421875, 0.037586212158203125, 0.03923797607421875, 0.040889739990234375, 0.04254150390625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 7.0, 7.0, 13.0, 19.0, 36.0, 67.0, 111.0, 255.0, 553.0, 1553.0, 7216.0, 60789.0, 2064140.0, 1990352.0, 59376.0, 7146.0, 1636.0, 517.0, 212.0, 116.0, 66.0, 24.0, 21.0, 19.0, 14.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0540771484375, -0.052332401275634766, -0.05058765411376953, -0.0488429069519043, -0.04709815979003906, -0.04535341262817383, -0.043608665466308594, -0.04186391830444336, -0.040119171142578125, -0.03837442398071289, -0.036629676818847656, -0.03488492965698242, -0.03314018249511719, -0.03139543533325195, -0.02965068817138672, -0.027905941009521484, -0.02616119384765625, -0.024416446685791016, -0.02267169952392578, -0.020926952362060547, -0.019182205200195312, -0.017437458038330078, -0.015692710876464844, -0.01394796371459961, -0.012203216552734375, -0.01045846939086914, -0.008713722229003906, -0.006968975067138672, -0.0052242279052734375, -0.003479480743408203, -0.0017347335815429688, 1.0013580322265625e-05, 0.0017547607421875, 0.0034995079040527344, 0.005244255065917969, 0.006989002227783203, 0.008733749389648438, 0.010478496551513672, 0.012223243713378906, 0.01396799087524414, 0.015712738037109375, 0.01745748519897461, 0.019202232360839844, 0.020946979522705078, 0.022691726684570312, 0.024436473846435547, 0.02618122100830078, 0.027925968170166016, 0.02967071533203125, 0.031415462493896484, 0.03316020965576172, 0.03490495681762695, 0.03664970397949219, 0.03839445114135742, 0.040139198303222656, 0.04188394546508789, 0.043628692626953125, 0.04537343978881836, 0.047118186950683594, 0.04886293411254883, 0.05060768127441406, 0.0523524284362793, 0.05409717559814453, 0.055841922760009766, 0.057586669921875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 7.0, 14.0, 10.0, 24.0, 24.0, 32.0, 63.0, 123.0, 257.0, 470.0, 765.0, 835.0, 640.0, 396.0, 154.0, 96.0, 50.0, 30.0, 19.0, 17.0, 13.0, 9.0, 9.0, 6.0, 3.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048004150390625, -0.046779632568359375, -0.04555511474609375, -0.044330596923828125, -0.0431060791015625, -0.041881561279296875, -0.04065704345703125, -0.039432525634765625, -0.0382080078125, -0.036983489990234375, -0.03575897216796875, -0.034534454345703125, -0.0333099365234375, -0.032085418701171875, -0.03086090087890625, -0.029636383056640625, -0.028411865234375, -0.027187347412109375, -0.02596282958984375, -0.024738311767578125, -0.0235137939453125, -0.022289276123046875, -0.02106475830078125, -0.019840240478515625, -0.01861572265625, -0.017391204833984375, -0.01616668701171875, -0.014942169189453125, -0.0137176513671875, -0.012493133544921875, -0.01126861572265625, -0.010044097900390625, -0.008819580078125, -0.007595062255859375, -0.00637054443359375, -0.005146026611328125, -0.0039215087890625, -0.002696990966796875, -0.00147247314453125, -0.000247955322265625, 0.0009765625, 0.002201080322265625, 0.00342559814453125, 0.004650115966796875, 0.0058746337890625, 0.007099151611328125, 0.00832366943359375, 0.009548187255859375, 0.010772705078125, 0.011997222900390625, 0.01322174072265625, 0.014446258544921875, 0.0156707763671875, 0.016895294189453125, 0.01811981201171875, 0.019344329833984375, 0.02056884765625, 0.021793365478515625, 0.02301788330078125, 0.024242401123046875, 0.0254669189453125, 0.026691436767578125, 0.02791595458984375, 0.029140472412109375, 0.030364990234375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 10.0, 9.0, 34.0, 61.0, 138.0, 177.0, 230.0, 161.0, 95.0, 45.0, 22.0, 11.0, 7.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.24436144530773163, -0.23857563734054565, -0.23278982937335968, -0.2270040214061737, -0.22121821343898773, -0.21543240547180176, -0.20964659750461578, -0.2038607895374298, -0.19807498157024384, -0.19228917360305786, -0.1865033656358719, -0.1807175576686859, -0.17493174970149994, -0.16914594173431396, -0.163360133767128, -0.15757432579994202, -0.15178851783275604, -0.14600270986557007, -0.1402169018983841, -0.13443109393119812, -0.12864528596401215, -0.12285947799682617, -0.1170736700296402, -0.11128786206245422, -0.10550205409526825, -0.09971624612808228, -0.0939304381608963, -0.08814463019371033, -0.08235882222652435, -0.07657301425933838, -0.0707872062921524, -0.06500139832496643, -0.05921559035778046, -0.05342978239059448, -0.04764397442340851, -0.041858166456222534, -0.03607235848903656, -0.030286550521850586, -0.024500742554664612, -0.018714934587478638, -0.012929126620292664, -0.0071433186531066895, -0.0013575106859207153, 0.004428297281265259, 0.010214105248451233, 0.015999913215637207, 0.02178572118282318, 0.027571529150009155, 0.03335733711719513, 0.039143145084381104, 0.04492895305156708, 0.05071476101875305, 0.056500568985939026, 0.062286376953125, 0.06807218492031097, 0.07385799288749695, 0.07964380085468292, 0.0854296088218689, 0.09121541678905487, 0.09700122475624084, 0.10278703272342682, 0.10857284069061279, 0.11435864865779877, 0.12014445662498474, 0.12593026459217072]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 5.0, 9.0, 11.0, 12.0, 17.0, 12.0, 22.0, 20.0, 23.0, 30.0, 25.0, 32.0, 28.0, 30.0, 29.0, 46.0, 47.0, 40.0, 40.0, 37.0, 43.0, 42.0, 38.0, 33.0, 30.0, 44.0, 25.0, 23.0, 24.0, 21.0, 20.0, 21.0, 18.0, 22.0, 17.0, 13.0, 8.0, 10.0, 2.0, 6.0, 4.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0653415322303772, -0.06312014162540436, -0.06089874356985092, -0.058677349239587784, -0.056455954909324646, -0.05423456057906151, -0.05201316624879837, -0.04979177191853523, -0.047570377588272095, -0.04534898325800896, -0.04312758892774582, -0.04090619459748268, -0.03868480026721954, -0.036463405936956406, -0.03424201160669327, -0.03202061727643013, -0.029799222946166992, -0.027577828615903854, -0.025356434285640717, -0.02313503995537758, -0.02091364562511444, -0.018692251294851303, -0.016470856964588165, -0.014249462634325027, -0.01202806830406189, -0.009806673973798752, -0.007585279643535614, -0.005363885313272476, -0.0031424909830093384, -0.0009210966527462006, 0.0013002976775169373, 0.003521692007780075, 0.005743086338043213, 0.00796448066830635, 0.010185874998569489, 0.012407269328832626, 0.014628663659095764, 0.016850057989358902, 0.01907145231962204, 0.021292846649885178, 0.023514240980148315, 0.025735635310411453, 0.02795702964067459, 0.03017842397093773, 0.03239981830120087, 0.034621212631464005, 0.03684260696172714, 0.03906400129199028, 0.04128539562225342, 0.043506789952516556, 0.045728184282779694, 0.04794957861304283, 0.05017097294330597, 0.05239236727356911, 0.054613761603832245, 0.05683515593409538, 0.05905655026435852, 0.06127794459462166, 0.0634993389248848, 0.06572073698043823, 0.06794212758541107, 0.07016351819038391, 0.07238491624593735, 0.07460631430149078, 0.07682770490646362]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 12.0, 14.0, 31.0, 34.0, 41.0, 75.0, 105.0, 163.0, 212.0, 346.0, 497.0, 778.0, 1587.0, 3298.0, 7674.0, 19451.0, 57789.0, 201247.0, 435772.0, 219641.0, 63162.0, 20965.0, 7978.0, 3580.0, 1617.0, 905.0, 503.0, 347.0, 209.0, 155.0, 95.0, 70.0, 42.0, 44.0, 32.0, 20.0, 21.0, 12.0, 10.0, 7.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041534423828125, -0.04021739959716797, -0.03890037536621094, -0.037583351135253906, -0.036266326904296875, -0.034949302673339844, -0.03363227844238281, -0.03231525421142578, -0.03099822998046875, -0.02968120574951172, -0.028364181518554688, -0.027047157287597656, -0.025730133056640625, -0.024413108825683594, -0.023096084594726562, -0.02177906036376953, -0.0204620361328125, -0.01914501190185547, -0.017827987670898438, -0.016510963439941406, -0.015193939208984375, -0.013876914978027344, -0.012559890747070312, -0.011242866516113281, -0.00992584228515625, -0.008608818054199219, -0.0072917938232421875, -0.005974769592285156, -0.004657745361328125, -0.0033407211303710938, -0.0020236968994140625, -0.0007066726684570312, 0.0006103515625, 0.0019273757934570312, 0.0032444000244140625, 0.004561424255371094, 0.005878448486328125, 0.007195472717285156, 0.008512496948242188, 0.009829521179199219, 0.01114654541015625, 0.012463569641113281, 0.013780593872070312, 0.015097618103027344, 0.016414642333984375, 0.017731666564941406, 0.019048690795898438, 0.02036571502685547, 0.0216827392578125, 0.02299976348876953, 0.024316787719726562, 0.025633811950683594, 0.026950836181640625, 0.028267860412597656, 0.029584884643554688, 0.03090190887451172, 0.03221893310546875, 0.03353595733642578, 0.03485298156738281, 0.036170005798339844, 0.037487030029296875, 0.038804054260253906, 0.04012107849121094, 0.04143810272216797, 0.042755126953125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 5.0, 6.0, 11.0, 9.0, 20.0, 33.0, 35.0, 41.0, 54.0, 79.0, 72.0, 87.0, 83.0, 84.0, 70.0, 68.0, 57.0, 53.0, 36.0, 28.0, 21.0, 10.0, 15.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.06170654296875, -0.06018495559692383, -0.058663368225097656, -0.057141780853271484, -0.05562019348144531, -0.05409860610961914, -0.05257701873779297, -0.0510554313659668, -0.049533843994140625, -0.04801225662231445, -0.04649066925048828, -0.04496908187866211, -0.04344749450683594, -0.041925907135009766, -0.040404319763183594, -0.03888273239135742, -0.03736114501953125, -0.03583955764770508, -0.034317970275878906, -0.032796382904052734, -0.03127479553222656, -0.02975320816040039, -0.02823162078857422, -0.026710033416748047, -0.025188446044921875, -0.023666858673095703, -0.02214527130126953, -0.02062368392944336, -0.019102096557617188, -0.017580509185791016, -0.016058921813964844, -0.014537334442138672, -0.0130157470703125, -0.011494159698486328, -0.009972572326660156, -0.008450984954833984, -0.0069293975830078125, -0.005407810211181641, -0.0038862228393554688, -0.002364635467529297, -0.000843048095703125, 0.0006785392761230469, 0.0022001266479492188, 0.0037217140197753906, 0.0052433013916015625, 0.006764888763427734, 0.008286476135253906, 0.009808063507080078, 0.01132965087890625, 0.012851238250732422, 0.014372825622558594, 0.015894412994384766, 0.017416000366210938, 0.01893758773803711, 0.02045917510986328, 0.021980762481689453, 0.023502349853515625, 0.025023937225341797, 0.02654552459716797, 0.02806711196899414, 0.029588699340820312, 0.031110286712646484, 0.032631874084472656, 0.03415346145629883, 0.035675048828125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 9.0, 5.0, 9.0, 7.0, 11.0, 11.0, 22.0, 14.0, 30.0, 20.0, 26.0, 34.0, 54.0, 104.0, 211.0, 491.0, 1553.0, 7079.0, 50968.0, 546761.0, 398288.0, 35228.0, 5355.0, 1291.0, 395.0, 174.0, 97.0, 57.0, 49.0, 28.0, 34.0, 21.0, 16.0, 18.0, 17.0, 10.0, 10.0, 6.0, 5.0, 8.0, 2.0, 4.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.08648681640625, -0.08385944366455078, -0.08123207092285156, -0.07860469818115234, -0.07597732543945312, -0.0733499526977539, -0.07072257995605469, -0.06809520721435547, -0.06546783447265625, -0.06284046173095703, -0.06021308898925781, -0.057585716247558594, -0.054958343505859375, -0.052330970764160156, -0.04970359802246094, -0.04707622528076172, -0.0444488525390625, -0.04182147979736328, -0.03919410705566406, -0.036566734313964844, -0.033939361572265625, -0.031311988830566406, -0.028684616088867188, -0.02605724334716797, -0.02342987060546875, -0.02080249786376953, -0.018175125122070312, -0.015547752380371094, -0.012920379638671875, -0.010293006896972656, -0.0076656341552734375, -0.005038261413574219, -0.002410888671875, 0.00021648406982421875, 0.0028438568115234375, 0.005471229553222656, 0.008098602294921875, 0.010725975036621094, 0.013353347778320312, 0.01598072052001953, 0.01860809326171875, 0.02123546600341797, 0.023862838745117188, 0.026490211486816406, 0.029117584228515625, 0.031744956970214844, 0.03437232971191406, 0.03699970245361328, 0.0396270751953125, 0.04225444793701172, 0.04488182067871094, 0.047509193420410156, 0.050136566162109375, 0.052763938903808594, 0.05539131164550781, 0.05801868438720703, 0.06064605712890625, 0.06327342987060547, 0.06590080261230469, 0.0685281753540039, 0.07115554809570312, 0.07378292083740234, 0.07641029357910156, 0.07903766632080078, 0.0816650390625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 7.0, 5.0, 2.0, 5.0, 3.0, 11.0, 5.0, 10.0, 17.0, 17.0, 13.0, 18.0, 20.0, 31.0, 36.0, 25.0, 33.0, 30.0, 37.0, 32.0, 41.0, 46.0, 46.0, 52.0, 33.0, 49.0, 40.0, 38.0, 33.0, 28.0, 27.0, 25.0, 25.0, 25.0, 20.0, 19.0, 16.0, 23.0, 10.0, 10.0, 8.0, 9.0, 4.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.062042236328125, -0.060151100158691406, -0.05825996398925781, -0.05636882781982422, -0.054477691650390625, -0.05258655548095703, -0.05069541931152344, -0.048804283142089844, -0.04691314697265625, -0.045022010803222656, -0.04313087463378906, -0.04123973846435547, -0.039348602294921875, -0.03745746612548828, -0.03556632995605469, -0.033675193786621094, -0.0317840576171875, -0.029892921447753906, -0.028001785278320312, -0.02611064910888672, -0.024219512939453125, -0.02232837677001953, -0.020437240600585938, -0.018546104431152344, -0.01665496826171875, -0.014763832092285156, -0.012872695922851562, -0.010981559753417969, -0.009090423583984375, -0.007199287414550781, -0.0053081512451171875, -0.0034170150756835938, -0.00152587890625, 0.00036525726318359375, 0.0022563934326171875, 0.004147529602050781, 0.006038665771484375, 0.007929801940917969, 0.009820938110351562, 0.011712074279785156, 0.01360321044921875, 0.015494346618652344, 0.017385482788085938, 0.01927661895751953, 0.021167755126953125, 0.02305889129638672, 0.024950027465820312, 0.026841163635253906, 0.0287322998046875, 0.030623435974121094, 0.03251457214355469, 0.03440570831298828, 0.036296844482421875, 0.03818798065185547, 0.04007911682128906, 0.041970252990722656, 0.04386138916015625, 0.045752525329589844, 0.04764366149902344, 0.04953479766845703, 0.051425933837890625, 0.05331707000732422, 0.05520820617675781, 0.057099342346191406, 0.058990478515625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 3.0, 5.0, 6.0, 13.0, 18.0, 20.0, 46.0, 64.0, 91.0, 141.0, 218.0, 373.0, 690.0, 1286.0, 2884.0, 6486.0, 15551.0, 40188.0, 106681.0, 242339.0, 313723.0, 191032.0, 77102.0, 28711.0, 11554.0, 4768.0, 2134.0, 1069.0, 522.0, 301.0, 175.0, 113.0, 83.0, 51.0, 23.0, 35.0, 15.0, 10.0, 12.0, 4.0, 7.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007152557373046875, -0.006924271583557129, -0.006695985794067383, -0.006467700004577637, -0.006239414215087891, -0.0060111284255981445, -0.0057828426361083984, -0.005554556846618652, -0.005326271057128906, -0.00509798526763916, -0.004869699478149414, -0.004641413688659668, -0.004413127899169922, -0.004184842109680176, -0.00395655632019043, -0.0037282705307006836, -0.0034999847412109375, -0.0032716989517211914, -0.0030434131622314453, -0.0028151273727416992, -0.002586841583251953, -0.002358555793762207, -0.002130270004272461, -0.0019019842147827148, -0.0016736984252929688, -0.0014454126358032227, -0.0012171268463134766, -0.0009888410568237305, -0.0007605552673339844, -0.0005322694778442383, -0.0003039836883544922, -7.56978988647461e-05, 0.000152587890625, 0.0003808736801147461, 0.0006091594696044922, 0.0008374452590942383, 0.0010657310485839844, 0.0012940168380737305, 0.0015223026275634766, 0.0017505884170532227, 0.0019788742065429688, 0.002207159996032715, 0.002435445785522461, 0.002663731575012207, 0.002892017364501953, 0.0031203031539916992, 0.0033485889434814453, 0.0035768747329711914, 0.0038051605224609375, 0.004033446311950684, 0.00426173210144043, 0.004490017890930176, 0.004718303680419922, 0.004946589469909668, 0.005174875259399414, 0.00540316104888916, 0.005631446838378906, 0.005859732627868652, 0.0060880184173583984, 0.0063163042068481445, 0.006544589996337891, 0.006772875785827637, 0.007001161575317383, 0.007229447364807129, 0.007457733154296875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 6.0, 16.0, 12.0, 12.0, 11.0, 14.0, 16.0, 31.0, 29.0, 31.0, 32.0, 39.0, 34.0, 43.0, 87.0, 52.0, 55.0, 59.0, 28.0, 41.0, 36.0, 35.0, 36.0, 35.0, 33.0, 15.0, 23.0, 37.0, 17.0, 9.0, 9.0, 11.0, 7.0, 5.0, 9.0, 6.0, 6.0, 3.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.7881393432617188e-06, -1.7238780856132507e-06, -1.6596168279647827e-06, -1.5953555703163147e-06, -1.5310943126678467e-06, -1.4668330550193787e-06, -1.4025717973709106e-06, -1.3383105397224426e-06, -1.2740492820739746e-06, -1.2097880244255066e-06, -1.1455267667770386e-06, -1.0812655091285706e-06, -1.0170042514801025e-06, -9.527429938316345e-07, -8.884817361831665e-07, -8.242204785346985e-07, -7.599592208862305e-07, -6.956979632377625e-07, -6.314367055892944e-07, -5.671754479408264e-07, -5.029141902923584e-07, -4.386529326438904e-07, -3.7439167499542236e-07, -3.1013041734695435e-07, -2.4586915969848633e-07, -1.816079020500183e-07, -1.1734664440155029e-07, -5.3085386753082275e-08, 1.1175870895385742e-08, 7.543712854385376e-08, 1.3969838619232178e-07, 2.039596438407898e-07, 2.682209014892578e-07, 3.3248215913772583e-07, 3.9674341678619385e-07, 4.6100467443466187e-07, 5.252659320831299e-07, 5.895271897315979e-07, 6.537884473800659e-07, 7.180497050285339e-07, 7.82310962677002e-07, 8.4657222032547e-07, 9.10833477973938e-07, 9.75094735622406e-07, 1.039355993270874e-06, 1.103617250919342e-06, 1.16787850856781e-06, 1.232139766216278e-06, 1.296401023864746e-06, 1.3606622815132141e-06, 1.4249235391616821e-06, 1.4891847968101501e-06, 1.5534460544586182e-06, 1.6177073121070862e-06, 1.6819685697555542e-06, 1.7462298274040222e-06, 1.8104910850524902e-06, 1.8747523427009583e-06, 1.9390136003494263e-06, 2.0032748579978943e-06, 2.0675361156463623e-06, 2.1317973732948303e-06, 2.1960586309432983e-06, 2.2603198885917664e-06, 2.3245811462402344e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 6.0, 16.0, 23.0, 43.0, 92.0, 168.0, 329.0, 790.0, 3351.0, 36217.0, 557073.0, 423061.0, 23454.0, 2615.0, 748.0, 256.0, 134.0, 82.0, 39.0, 25.0, 16.0, 6.0, 6.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0253143310546875, -0.02458953857421875, -0.02386474609375, -0.02313995361328125, -0.0224151611328125, -0.02169036865234375, -0.020965576171875, -0.02024078369140625, -0.0195159912109375, -0.01879119873046875, -0.01806640625, -0.01734161376953125, -0.0166168212890625, -0.01589202880859375, -0.015167236328125, -0.01444244384765625, -0.0137176513671875, -0.01299285888671875, -0.01226806640625, -0.01154327392578125, -0.0108184814453125, -0.01009368896484375, -0.009368896484375, -0.00864410400390625, -0.0079193115234375, -0.00719451904296875, -0.0064697265625, -0.00574493408203125, -0.0050201416015625, -0.00429534912109375, -0.003570556640625, -0.00284576416015625, -0.0021209716796875, -0.00139617919921875, -0.00067138671875, 5.340576171875e-05, 0.0007781982421875, 0.00150299072265625, 0.002227783203125, 0.00295257568359375, 0.0036773681640625, 0.00440216064453125, 0.005126953125, 0.00585174560546875, 0.0065765380859375, 0.00730133056640625, 0.008026123046875, 0.00875091552734375, 0.0094757080078125, 0.01020050048828125, 0.01092529296875, 0.01165008544921875, 0.0123748779296875, 0.01309967041015625, 0.013824462890625, 0.01454925537109375, 0.0152740478515625, 0.01599884033203125, 0.0167236328125, 0.01744842529296875, 0.0181732177734375, 0.01889801025390625, 0.019622802734375, 0.02034759521484375, 0.0210723876953125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 4.0, 9.0, 9.0, 15.0, 20.0, 52.0, 42.0, 73.0, 75.0, 88.0, 98.0, 92.0, 98.0, 75.0, 70.0, 44.0, 45.0, 24.0, 23.0, 16.0, 10.0, 2.0, 8.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012603759765625, -0.012183785438537598, -0.011763811111450195, -0.011343836784362793, -0.01092386245727539, -0.010503888130187988, -0.010083913803100586, -0.009663939476013184, -0.009243965148925781, -0.008823990821838379, -0.008404016494750977, -0.007984042167663574, -0.007564067840576172, -0.0071440935134887695, -0.006724119186401367, -0.006304144859313965, -0.0058841705322265625, -0.00546419620513916, -0.005044221878051758, -0.0046242475509643555, -0.004204273223876953, -0.0037842988967895508, -0.0033643245697021484, -0.002944350242614746, -0.0025243759155273438, -0.0021044015884399414, -0.001684427261352539, -0.0012644529342651367, -0.0008444786071777344, -0.00042450428009033203, -4.5299530029296875e-06, 0.00041544437408447266, 0.000835418701171875, 0.0012553930282592773, 0.0016753673553466797, 0.002095341682434082, 0.0025153160095214844, 0.0029352903366088867, 0.003355264663696289, 0.0037752389907836914, 0.004195213317871094, 0.004615187644958496, 0.0050351619720458984, 0.005455136299133301, 0.005875110626220703, 0.0062950849533081055, 0.006715059280395508, 0.00713503360748291, 0.0075550079345703125, 0.007974982261657715, 0.008394956588745117, 0.00881493091583252, 0.009234905242919922, 0.009654879570007324, 0.010074853897094727, 0.010494828224182129, 0.010914802551269531, 0.011334776878356934, 0.011754751205444336, 0.012174725532531738, 0.01259469985961914, 0.013014674186706543, 0.013434648513793945, 0.013854622840881348, 0.01427459716796875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 36.0, 645.0, 304.0, 20.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6131685972213745, -1.5801267623901367, -1.5470848083496094, -1.5140429735183716, -1.4810011386871338, -1.4479591846466064, -1.4149173498153687, -1.3818755149841309, -1.3488335609436035, -1.3157917261123657, -1.2827497720718384, -1.2497079372406006, -1.2166661024093628, -1.1836241483688354, -1.1505823135375977, -1.1175404787063599, -1.084498643875122, -1.0514568090438843, -1.018414855003357, -0.9853730201721191, -0.9523311257362366, -0.919289231300354, -0.8862473964691162, -0.8532055020332336, -0.8201636075973511, -0.7871217131614685, -0.7540798783302307, -0.7210379838943481, -0.6879960894584656, -0.654954195022583, -0.6219123601913452, -0.5888704657554626, -0.5558285713195801, -0.5227866768836975, -0.48974481225013733, -0.45670294761657715, -0.4236610531806946, -0.3906191885471344, -0.3575773239135742, -0.32453542947769165, -0.29149356484413147, -0.2584517002105713, -0.22540980577468872, -0.19236794114112854, -0.15932606160640717, -0.1262841820716858, -0.09324231743812561, -0.060200437903404236, -0.02715855836868286, 0.005883317440748215, 0.03892519325017929, 0.07196706533432007, 0.10500894486904144, 0.13805082440376282, 0.171092689037323, 0.20413456857204437, 0.23717644810676575, 0.2702183127403259, 0.3032602071762085, 0.3363020718097687, 0.36934393644332886, 0.4023858308792114, 0.4354276955127716, 0.4684695601463318, 0.5015114545822144]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 4.0, 9.0, 11.0, 11.0, 13.0, 12.0, 17.0, 17.0, 23.0, 16.0, 24.0, 26.0, 26.0, 21.0, 36.0, 42.0, 47.0, 46.0, 47.0, 43.0, 35.0, 36.0, 38.0, 41.0, 32.0, 42.0, 28.0, 35.0, 29.0, 28.0, 18.0, 24.0, 19.0, 18.0, 15.0, 10.0, 13.0, 9.0, 11.0, 5.0, 2.0, 8.0, 3.0, 5.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15021425485610962, -0.14529690146446228, -0.14037956297397614, -0.13546222448349, -0.13054487109184265, -0.1256275177001953, -0.12071017920970917, -0.11579283326864243, -0.11087548732757568, -0.10595814138650894, -0.1010407954454422, -0.09612344950437546, -0.09120610356330872, -0.08628875762224197, -0.08137141168117523, -0.07645406574010849, -0.07153671979904175, -0.066619373857975, -0.061702027916908264, -0.05678468197584152, -0.05186733603477478, -0.04694999009370804, -0.042032644152641296, -0.037115298211574554, -0.03219795227050781, -0.02728060632944107, -0.02236326038837433, -0.017445914447307587, -0.012528568506240845, -0.007611222565174103, -0.002693876624107361, 0.002223469316959381, 0.007140815258026123, 0.012058161199092865, 0.016975507140159607, 0.02189285308122635, 0.02681019902229309, 0.03172754496335983, 0.036644890904426575, 0.04156223684549332, 0.04647958278656006, 0.0513969287276268, 0.05631427466869354, 0.061231620609760284, 0.06614896655082703, 0.07106631249189377, 0.07598365843296051, 0.08090100437402725, 0.085818350315094, 0.09073569625616074, 0.09565304219722748, 0.10057038813829422, 0.10548773407936096, 0.1104050800204277, 0.11532242596149445, 0.12023977190256119, 0.12515711784362793, 0.13007447123527527, 0.1349918097257614, 0.13990914821624756, 0.1448265016078949, 0.14974385499954224, 0.15466119349002838, 0.15957853198051453, 0.16449588537216187]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 7.0, 9.0, 8.0, 18.0, 21.0, 44.0, 49.0, 94.0, 209.0, 1890.0, 26395.0, 2734634.0, 1407310.0, 19444.0, 3473.0, 410.0, 89.0, 68.0, 36.0, 24.0, 13.0, 11.0, 8.0, 8.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.09454345703125, -0.09198284149169922, -0.08942222595214844, -0.08686161041259766, -0.08430099487304688, -0.0817403793334961, -0.07917976379394531, -0.07661914825439453, -0.07405853271484375, -0.07149791717529297, -0.06893730163574219, -0.0663766860961914, -0.06381607055664062, -0.061255455017089844, -0.05869483947753906, -0.05613422393798828, -0.0535736083984375, -0.05101299285888672, -0.04845237731933594, -0.045891761779785156, -0.043331146240234375, -0.040770530700683594, -0.03820991516113281, -0.03564929962158203, -0.03308868408203125, -0.03052806854248047, -0.027967453002929688, -0.025406837463378906, -0.022846221923828125, -0.020285606384277344, -0.017724990844726562, -0.015164375305175781, -0.012603759765625, -0.010043144226074219, -0.0074825286865234375, -0.004921913146972656, -0.002361297607421875, 0.00019931793212890625, 0.0027599334716796875, 0.005320549011230469, 0.00788116455078125, 0.010441780090332031, 0.013002395629882812, 0.015563011169433594, 0.018123626708984375, 0.020684242248535156, 0.023244857788085938, 0.02580547332763672, 0.0283660888671875, 0.03092670440673828, 0.03348731994628906, 0.036047935485839844, 0.038608551025390625, 0.041169166564941406, 0.04372978210449219, 0.04629039764404297, 0.04885101318359375, 0.05141162872314453, 0.05397224426269531, 0.056532859802246094, 0.059093475341796875, 0.061654090881347656, 0.06421470642089844, 0.06677532196044922, 0.0693359375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 5.0, 14.0, 15.0, 18.0, 31.0, 43.0, 48.0, 72.0, 79.0, 78.0, 95.0, 83.0, 84.0, 67.0, 63.0, 60.0, 37.0, 32.0, 29.0, 10.0, 15.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06298828125, -0.06136751174926758, -0.059746742248535156, -0.058125972747802734, -0.05650520324707031, -0.05488443374633789, -0.05326366424560547, -0.05164289474487305, -0.050022125244140625, -0.0484013557434082, -0.04678058624267578, -0.04515981674194336, -0.04353904724121094, -0.041918277740478516, -0.040297508239746094, -0.03867673873901367, -0.03705596923828125, -0.03543519973754883, -0.033814430236816406, -0.032193660736083984, -0.030572891235351562, -0.02895212173461914, -0.02733135223388672, -0.025710582733154297, -0.024089813232421875, -0.022469043731689453, -0.02084827423095703, -0.01922750473022461, -0.017606735229492188, -0.015985965728759766, -0.014365196228027344, -0.012744426727294922, -0.0111236572265625, -0.009502887725830078, -0.007882118225097656, -0.006261348724365234, -0.0046405792236328125, -0.0030198097229003906, -0.0013990402221679688, 0.00022172927856445312, 0.001842498779296875, 0.003463268280029297, 0.005084037780761719, 0.006704807281494141, 0.008325576782226562, 0.009946346282958984, 0.011567115783691406, 0.013187885284423828, 0.01480865478515625, 0.016429424285888672, 0.018050193786621094, 0.019670963287353516, 0.021291732788085938, 0.02291250228881836, 0.02453327178955078, 0.026154041290283203, 0.027774810791015625, 0.029395580291748047, 0.03101634979248047, 0.03263711929321289, 0.03425788879394531, 0.035878658294677734, 0.037499427795410156, 0.03912019729614258, 0.040740966796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 9.0, 19.0, 14.0, 33.0, 57.0, 97.0, 191.0, 293.0, 577.0, 1145.0, 3097.0, 11109.0, 65507.0, 1102961.0, 2810313.0, 170328.0, 20508.0, 4778.0, 1707.0, 683.0, 377.0, 199.0, 111.0, 60.0, 46.0, 23.0, 18.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0305023193359375, -0.02942061424255371, -0.028338909149169922, -0.027257204055786133, -0.026175498962402344, -0.025093793869018555, -0.024012088775634766, -0.022930383682250977, -0.021848678588867188, -0.0207669734954834, -0.01968526840209961, -0.01860356330871582, -0.01752185821533203, -0.016440153121948242, -0.015358448028564453, -0.014276742935180664, -0.013195037841796875, -0.012113332748413086, -0.011031627655029297, -0.009949922561645508, -0.008868217468261719, -0.00778651237487793, -0.006704807281494141, -0.0056231021881103516, -0.0045413970947265625, -0.0034596920013427734, -0.0023779869079589844, -0.0012962818145751953, -0.00021457672119140625, 0.0008671283721923828, 0.0019488334655761719, 0.003030538558959961, 0.00411224365234375, 0.005193948745727539, 0.006275653839111328, 0.007357358932495117, 0.008439064025878906, 0.009520769119262695, 0.010602474212646484, 0.011684179306030273, 0.012765884399414062, 0.013847589492797852, 0.01492929458618164, 0.01601099967956543, 0.01709270477294922, 0.018174409866333008, 0.019256114959716797, 0.020337820053100586, 0.021419525146484375, 0.022501230239868164, 0.023582935333251953, 0.024664640426635742, 0.02574634552001953, 0.02682805061340332, 0.02790975570678711, 0.0289914608001709, 0.030073165893554688, 0.031154870986938477, 0.032236576080322266, 0.033318281173706055, 0.034399986267089844, 0.03548169136047363, 0.03656339645385742, 0.03764510154724121, 0.038726806640625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 4.0, 11.0, 23.0, 24.0, 50.0, 76.0, 146.0, 244.0, 416.0, 702.0, 822.0, 637.0, 424.0, 221.0, 117.0, 60.0, 36.0, 14.0, 10.0, 11.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0330810546875, -0.03223586082458496, -0.03139066696166992, -0.030545473098754883, -0.029700279235839844, -0.028855085372924805, -0.028009891510009766, -0.027164697647094727, -0.026319503784179688, -0.02547430992126465, -0.02462911605834961, -0.02378392219543457, -0.02293872833251953, -0.022093534469604492, -0.021248340606689453, -0.020403146743774414, -0.019557952880859375, -0.018712759017944336, -0.017867565155029297, -0.017022371292114258, -0.01617717742919922, -0.01533198356628418, -0.01448678970336914, -0.013641595840454102, -0.012796401977539062, -0.011951208114624023, -0.011106014251708984, -0.010260820388793945, -0.009415626525878906, -0.008570432662963867, -0.007725238800048828, -0.006880044937133789, -0.00603485107421875, -0.005189657211303711, -0.004344463348388672, -0.003499269485473633, -0.0026540756225585938, -0.0018088817596435547, -0.0009636878967285156, -0.00011849403381347656, 0.0007266998291015625, 0.0015718936920166016, 0.0024170875549316406, 0.0032622814178466797, 0.004107475280761719, 0.004952669143676758, 0.005797863006591797, 0.006643056869506836, 0.007488250732421875, 0.008333444595336914, 0.009178638458251953, 0.010023832321166992, 0.010869026184082031, 0.01171422004699707, 0.01255941390991211, 0.013404607772827148, 0.014249801635742188, 0.015094995498657227, 0.015940189361572266, 0.016785383224487305, 0.017630577087402344, 0.018475770950317383, 0.019320964813232422, 0.02016615867614746, 0.0210113525390625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 14.0, 133.0, 642.0, 198.0, 20.0, 5.0, 0.0, 1.0, 1.0], "bins": [-0.9201670289039612, -0.9041988849639893, -0.8882306814193726, -0.8722624778747559, -0.8562943339347839, -0.840326189994812, -0.8243579864501953, -0.8083897829055786, -0.7924216389656067, -0.7764534950256348, -0.7604852914810181, -0.7445170879364014, -0.7285489439964294, -0.7125808000564575, -0.6966125965118408, -0.6806443929672241, -0.6646762490272522, -0.6487081050872803, -0.6327399015426636, -0.6167716979980469, -0.600803554058075, -0.584835410118103, -0.5688672065734863, -0.5528990030288696, -0.5369308590888977, -0.5209627151489258, -0.5049945116043091, -0.48902633786201477, -0.47305816411972046, -0.45708999037742615, -0.44112181663513184, -0.4251536428928375, -0.4091854989528656, -0.3932173252105713, -0.377249151468277, -0.36128097772598267, -0.34531280398368835, -0.32934463024139404, -0.31337645649909973, -0.2974082827568054, -0.2814401090145111, -0.2654719352722168, -0.24950376152992249, -0.23353558778762817, -0.21756741404533386, -0.20159924030303955, -0.18563106656074524, -0.16966289281845093, -0.15369471907615662, -0.1377265453338623, -0.121758371591568, -0.10579019784927368, -0.08982202410697937, -0.07385385036468506, -0.05788567662239075, -0.041917502880096436, -0.025949321687221527, -0.009981147944927216, 0.005987025797367096, 0.021955199539661407, 0.03792337328195572, 0.05389154702425003, 0.06985972076654434, 0.08582789450883865, 0.10179606825113297]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 11.0, 13.0, 8.0, 13.0, 15.0, 15.0, 19.0, 23.0, 27.0, 34.0, 27.0, 29.0, 36.0, 41.0, 36.0, 39.0, 46.0, 41.0, 48.0, 43.0, 42.0, 39.0, 33.0, 33.0, 34.0, 31.0, 30.0, 31.0, 33.0, 22.0, 17.0, 13.0, 17.0, 15.0, 4.0, 6.0, 11.0, 7.0, 4.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07391500473022461, -0.07149159163236618, -0.06906817853450775, -0.06664475798606873, -0.0642213448882103, -0.06179793179035187, -0.05937451496720314, -0.05695109814405441, -0.054527685046195984, -0.052104271948337555, -0.04968085512518883, -0.0472574383020401, -0.04483402520418167, -0.04241061210632324, -0.039987195283174515, -0.03756377846002579, -0.03514036536216736, -0.03271695226430893, -0.030293535441160202, -0.027870120480656624, -0.025446705520153046, -0.023023290559649467, -0.02059987559914589, -0.01817646063864231, -0.015753045678138733, -0.013329630717635155, -0.010906215757131577, -0.008482800796627998, -0.00605938583612442, -0.003635970875620842, -0.0012125559151172638, 0.0012108590453863144, 0.0036342740058898926, 0.006057688966393471, 0.008481103926897049, 0.010904518887400627, 0.013327933847904205, 0.015751348808407784, 0.01817476376891136, 0.02059817872941494, 0.023021593689918518, 0.025445008650422096, 0.027868423610925674, 0.030291838571429253, 0.03271525353193283, 0.03513866662979126, 0.03756208345293999, 0.039985500276088715, 0.042408913373947144, 0.04483232647180557, 0.0472557432949543, 0.04967916011810303, 0.052102573215961456, 0.054525986313819885, 0.05694940313696861, 0.05937281996011734, 0.06179623305797577, 0.0642196461558342, 0.06664305925369263, 0.06906647980213165, 0.07148989289999008, 0.07391330599784851, 0.07633672654628754, 0.07876013964414597, 0.0811835527420044]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 4.0, 7.0, 5.0, 10.0, 20.0, 13.0, 28.0, 35.0, 54.0, 57.0, 91.0, 137.0, 177.0, 225.0, 336.0, 580.0, 984.0, 1932.0, 4300.0, 10188.0, 26504.0, 78218.0, 248626.0, 405743.0, 179094.0, 56216.0, 19800.0, 7766.0, 3346.0, 1636.0, 879.0, 480.0, 300.0, 195.0, 146.0, 98.0, 76.0, 52.0, 47.0, 39.0, 32.0, 15.0, 17.0, 17.0, 15.0, 5.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.031494140625, -0.03045654296875, -0.0294189453125, -0.02838134765625, -0.02734375, -0.02630615234375, -0.0252685546875, -0.02423095703125, -0.023193359375, -0.02215576171875, -0.0211181640625, -0.02008056640625, -0.01904296875, -0.01800537109375, -0.0169677734375, -0.01593017578125, -0.014892578125, -0.01385498046875, -0.0128173828125, -0.01177978515625, -0.0107421875, -0.00970458984375, -0.0086669921875, -0.00762939453125, -0.006591796875, -0.00555419921875, -0.0045166015625, -0.00347900390625, -0.00244140625, -0.00140380859375, -0.0003662109375, 0.00067138671875, 0.001708984375, 0.00274658203125, 0.0037841796875, 0.00482177734375, 0.005859375, 0.00689697265625, 0.0079345703125, 0.00897216796875, 0.010009765625, 0.01104736328125, 0.0120849609375, 0.01312255859375, 0.01416015625, 0.01519775390625, 0.0162353515625, 0.01727294921875, 0.018310546875, 0.01934814453125, 0.0203857421875, 0.02142333984375, 0.0224609375, 0.02349853515625, 0.0245361328125, 0.02557373046875, 0.026611328125, 0.02764892578125, 0.0286865234375, 0.02972412109375, 0.03076171875, 0.03179931640625, 0.0328369140625, 0.03387451171875, 0.034912109375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 7.0, 6.0, 10.0, 9.0, 16.0, 23.0, 41.0, 45.0, 63.0, 78.0, 89.0, 96.0, 104.0, 90.0, 69.0, 71.0, 56.0, 36.0, 33.0, 32.0, 10.0, 12.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06475830078125, -0.0630197525024414, -0.06128120422363281, -0.05954265594482422, -0.057804107666015625, -0.05606555938720703, -0.05432701110839844, -0.052588462829589844, -0.05084991455078125, -0.049111366271972656, -0.04737281799316406, -0.04563426971435547, -0.043895721435546875, -0.04215717315673828, -0.04041862487792969, -0.038680076599121094, -0.0369415283203125, -0.035202980041503906, -0.03346443176269531, -0.03172588348388672, -0.029987335205078125, -0.02824878692626953, -0.026510238647460938, -0.024771690368652344, -0.02303314208984375, -0.021294593811035156, -0.019556045532226562, -0.01781749725341797, -0.016078948974609375, -0.014340400695800781, -0.012601852416992188, -0.010863304138183594, -0.009124755859375, -0.007386207580566406, -0.0056476593017578125, -0.003909111022949219, -0.002170562744140625, -0.00043201446533203125, 0.0013065338134765625, 0.0030450820922851562, 0.00478363037109375, 0.006522178649902344, 0.008260726928710938, 0.009999275207519531, 0.011737823486328125, 0.013476371765136719, 0.015214920043945312, 0.016953468322753906, 0.0186920166015625, 0.020430564880371094, 0.022169113159179688, 0.02390766143798828, 0.025646209716796875, 0.02738475799560547, 0.029123306274414062, 0.030861854553222656, 0.03260040283203125, 0.034338951110839844, 0.03607749938964844, 0.03781604766845703, 0.039554595947265625, 0.04129314422607422, 0.04303169250488281, 0.044770240783691406, 0.0465087890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 10.0, 7.0, 14.0, 14.0, 15.0, 14.0, 19.0, 30.0, 25.0, 29.0, 31.0, 63.0, 109.0, 215.0, 713.0, 3470.0, 35653.0, 603061.0, 380283.0, 21227.0, 2421.0, 541.0, 205.0, 91.0, 48.0, 40.0, 25.0, 31.0, 27.0, 18.0, 26.0, 13.0, 16.0, 6.0, 6.0, 8.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09893798828125, -0.09601974487304688, -0.09310150146484375, -0.09018325805664062, -0.0872650146484375, -0.08434677124023438, -0.08142852783203125, -0.07851028442382812, -0.075592041015625, -0.07267379760742188, -0.06975555419921875, -0.06683731079101562, -0.0639190673828125, -0.061000823974609375, -0.05808258056640625, -0.055164337158203125, -0.05224609375, -0.049327850341796875, -0.04640960693359375, -0.043491363525390625, -0.0405731201171875, -0.037654876708984375, -0.03473663330078125, -0.031818389892578125, -0.028900146484375, -0.025981903076171875, -0.02306365966796875, -0.020145416259765625, -0.0172271728515625, -0.014308929443359375, -0.01139068603515625, -0.008472442626953125, -0.00555419921875, -0.002635955810546875, 0.00028228759765625, 0.003200531005859375, 0.0061187744140625, 0.009037017822265625, 0.01195526123046875, 0.014873504638671875, 0.017791748046875, 0.020709991455078125, 0.02362823486328125, 0.026546478271484375, 0.0294647216796875, 0.032382965087890625, 0.03530120849609375, 0.038219451904296875, 0.0411376953125, 0.044055938720703125, 0.04697418212890625, 0.049892425537109375, 0.0528106689453125, 0.055728912353515625, 0.05864715576171875, 0.061565399169921875, 0.064483642578125, 0.06740188598632812, 0.07032012939453125, 0.07323837280273438, 0.0761566162109375, 0.07907485961914062, 0.08199310302734375, 0.08491134643554688, 0.08782958984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 6.0, 6.0, 6.0, 17.0, 14.0, 20.0, 24.0, 20.0, 35.0, 26.0, 29.0, 28.0, 25.0, 40.0, 33.0, 38.0, 39.0, 39.0, 39.0, 43.0, 40.0, 50.0, 41.0, 36.0, 39.0, 38.0, 25.0, 22.0, 23.0, 25.0, 25.0, 14.0, 19.0, 13.0, 10.0, 11.0, 11.0, 7.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.060302734375, -0.05832862854003906, -0.056354522705078125, -0.05438041687011719, -0.05240631103515625, -0.05043220520019531, -0.048458099365234375, -0.04648399353027344, -0.0445098876953125, -0.04253578186035156, -0.040561676025390625, -0.03858757019042969, -0.03661346435546875, -0.03463935852050781, -0.032665252685546875, -0.030691146850585938, -0.028717041015625, -0.026742935180664062, -0.024768829345703125, -0.022794723510742188, -0.02082061767578125, -0.018846511840820312, -0.016872406005859375, -0.014898300170898438, -0.0129241943359375, -0.010950088500976562, -0.008975982666015625, -0.0070018768310546875, -0.00502777099609375, -0.0030536651611328125, -0.001079559326171875, 0.0008945465087890625, 0.00286865234375, 0.0048427581787109375, 0.006816864013671875, 0.008790969848632812, 0.01076507568359375, 0.012739181518554688, 0.014713287353515625, 0.016687393188476562, 0.0186614990234375, 0.020635604858398438, 0.022609710693359375, 0.024583816528320312, 0.02655792236328125, 0.028532028198242188, 0.030506134033203125, 0.03248023986816406, 0.034454345703125, 0.03642845153808594, 0.038402557373046875, 0.04037666320800781, 0.04235076904296875, 0.04432487487792969, 0.046298980712890625, 0.04827308654785156, 0.0502471923828125, 0.05222129821777344, 0.054195404052734375, 0.05616950988769531, 0.05814361572265625, 0.06011772155761719, 0.062091827392578125, 0.06406593322753906, 0.0660400390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 9.0, 18.0, 26.0, 25.0, 50.0, 84.0, 142.0, 221.0, 369.0, 641.0, 1161.0, 2115.0, 3998.0, 7687.0, 15550.0, 33332.0, 74075.0, 161998.0, 268978.0, 241164.0, 127554.0, 57096.0, 26174.0, 12500.0, 6259.0, 3251.0, 1739.0, 966.0, 553.0, 312.0, 178.0, 108.0, 82.0, 43.0, 25.0, 21.0, 14.0, 11.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00533294677734375, -0.005175352096557617, -0.005017757415771484, -0.0048601627349853516, -0.004702568054199219, -0.004544973373413086, -0.004387378692626953, -0.00422978401184082, -0.0040721893310546875, -0.003914594650268555, -0.003756999969482422, -0.003599405288696289, -0.0034418106079101562, -0.0032842159271240234, -0.0031266212463378906, -0.002969026565551758, -0.002811431884765625, -0.002653837203979492, -0.0024962425231933594, -0.0023386478424072266, -0.0021810531616210938, -0.002023458480834961, -0.0018658638000488281, -0.0017082691192626953, -0.0015506744384765625, -0.0013930797576904297, -0.0012354850769042969, -0.001077890396118164, -0.0009202957153320312, -0.0007627010345458984, -0.0006051063537597656, -0.0004475116729736328, -0.0002899169921875, -0.0001323223114013672, 2.5272369384765625e-05, 0.00018286705017089844, 0.00034046173095703125, 0.0004980564117431641, 0.0006556510925292969, 0.0008132457733154297, 0.0009708404541015625, 0.0011284351348876953, 0.0012860298156738281, 0.001443624496459961, 0.0016012191772460938, 0.0017588138580322266, 0.0019164085388183594, 0.002074003219604492, 0.002231597900390625, 0.002389192581176758, 0.0025467872619628906, 0.0027043819427490234, 0.0028619766235351562, 0.003019571304321289, 0.003177165985107422, 0.0033347606658935547, 0.0034923553466796875, 0.0036499500274658203, 0.003807544708251953, 0.003965139389038086, 0.004122734069824219, 0.0042803287506103516, 0.004437923431396484, 0.004595518112182617, 0.00475311279296875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 8.0, 6.0, 8.0, 7.0, 18.0, 14.0, 19.0, 29.0, 28.0, 22.0, 28.0, 31.0, 36.0, 50.0, 39.0, 46.0, 34.0, 56.0, 38.0, 48.0, 90.0, 49.0, 41.0, 38.0, 30.0, 24.0, 28.0, 22.0, 24.0, 17.0, 16.0, 8.0, 9.0, 11.0, 4.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8477439880371094e-06, -1.7862766981124878e-06, -1.7248094081878662e-06, -1.6633421182632446e-06, -1.601874828338623e-06, -1.5404075384140015e-06, -1.4789402484893799e-06, -1.4174729585647583e-06, -1.3560056686401367e-06, -1.2945383787155151e-06, -1.2330710887908936e-06, -1.171603798866272e-06, -1.1101365089416504e-06, -1.0486692190170288e-06, -9.872019290924072e-07, -9.257346391677856e-07, -8.642673492431641e-07, -8.028000593185425e-07, -7.413327693939209e-07, -6.798654794692993e-07, -6.183981895446777e-07, -5.569308996200562e-07, -4.954636096954346e-07, -4.33996319770813e-07, -3.725290298461914e-07, -3.110617399215698e-07, -2.4959444999694824e-07, -1.8812716007232666e-07, -1.2665987014770508e-07, -6.51925802230835e-08, -3.725290298461914e-09, 5.774199962615967e-08, 1.1920928955078125e-07, 1.8067657947540283e-07, 2.421438694000244e-07, 3.03611159324646e-07, 3.650784492492676e-07, 4.2654573917388916e-07, 4.880130290985107e-07, 5.494803190231323e-07, 6.109476089477539e-07, 6.724148988723755e-07, 7.338821887969971e-07, 7.953494787216187e-07, 8.568167686462402e-07, 9.182840585708618e-07, 9.797513484954834e-07, 1.041218638420105e-06, 1.1026859283447266e-06, 1.1641532182693481e-06, 1.2256205081939697e-06, 1.2870877981185913e-06, 1.3485550880432129e-06, 1.4100223779678345e-06, 1.471489667892456e-06, 1.5329569578170776e-06, 1.5944242477416992e-06, 1.6558915376663208e-06, 1.7173588275909424e-06, 1.778826117515564e-06, 1.8402934074401855e-06, 1.9017606973648071e-06, 1.9632279872894287e-06, 2.0246952772140503e-06, 2.086162567138672e-06]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 9.0, 9.0, 14.0, 21.0, 27.0, 31.0, 64.0, 134.0, 246.0, 650.0, 1684.0, 5601.0, 21785.0, 108421.0, 444827.0, 365061.0, 76857.0, 16381.0, 4358.0, 1358.0, 516.0, 210.0, 98.0, 57.0, 37.0, 20.0, 20.0, 16.0, 7.0, 9.0, 8.0, 6.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01180267333984375, -0.011473894119262695, -0.01114511489868164, -0.010816335678100586, -0.010487556457519531, -0.010158777236938477, -0.009829998016357422, -0.009501218795776367, -0.009172439575195312, -0.008843660354614258, -0.008514881134033203, -0.008186101913452148, -0.007857322692871094, -0.007528543472290039, -0.007199764251708984, -0.00687098503112793, -0.006542205810546875, -0.00621342658996582, -0.005884647369384766, -0.005555868148803711, -0.005227088928222656, -0.0048983097076416016, -0.004569530487060547, -0.004240751266479492, -0.0039119720458984375, -0.003583192825317383, -0.003254413604736328, -0.0029256343841552734, -0.0025968551635742188, -0.002268075942993164, -0.0019392967224121094, -0.0016105175018310547, -0.00128173828125, -0.0009529590606689453, -0.0006241798400878906, -0.00029540061950683594, 3.337860107421875e-05, 0.00036215782165527344, 0.0006909370422363281, 0.0010197162628173828, 0.0013484954833984375, 0.0016772747039794922, 0.002006053924560547, 0.0023348331451416016, 0.0026636123657226562, 0.002992391586303711, 0.0033211708068847656, 0.0036499500274658203, 0.003978729248046875, 0.00430750846862793, 0.004636287689208984, 0.004965066909790039, 0.005293846130371094, 0.0056226253509521484, 0.005951404571533203, 0.006280183792114258, 0.0066089630126953125, 0.006937742233276367, 0.007266521453857422, 0.0075953006744384766, 0.007924079895019531, 0.008252859115600586, 0.00858163833618164, 0.008910417556762695, 0.00923919677734375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 8.0, 8.0, 10.0, 17.0, 15.0, 12.0, 28.0, 28.0, 30.0, 29.0, 39.0, 43.0, 65.0, 66.0, 60.0, 66.0, 66.0, 59.0, 46.0, 47.0, 42.0, 39.0, 38.0, 26.0, 17.0, 9.0, 17.0, 14.0, 10.0, 11.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0069732666015625, -0.006726980209350586, -0.006480693817138672, -0.006234407424926758, -0.005988121032714844, -0.00574183464050293, -0.005495548248291016, -0.0052492618560791016, -0.0050029754638671875, -0.0047566890716552734, -0.004510402679443359, -0.004264116287231445, -0.004017829895019531, -0.003771543502807617, -0.003525257110595703, -0.003278970718383789, -0.003032684326171875, -0.002786397933959961, -0.002540111541748047, -0.002293825149536133, -0.0020475387573242188, -0.0018012523651123047, -0.0015549659729003906, -0.0013086795806884766, -0.0010623931884765625, -0.0008161067962646484, -0.0005698204040527344, -0.0003235340118408203, -7.724761962890625e-05, 0.0001690387725830078, 0.0004153251647949219, 0.0006616115570068359, 0.00090789794921875, 0.001154184341430664, 0.0014004707336425781, 0.0016467571258544922, 0.0018930435180664062, 0.0021393299102783203, 0.0023856163024902344, 0.0026319026947021484, 0.0028781890869140625, 0.0031244754791259766, 0.0033707618713378906, 0.0036170482635498047, 0.0038633346557617188, 0.004109621047973633, 0.004355907440185547, 0.004602193832397461, 0.004848480224609375, 0.005094766616821289, 0.005341053009033203, 0.005587339401245117, 0.005833625793457031, 0.006079912185668945, 0.006326198577880859, 0.0065724849700927734, 0.0068187713623046875, 0.0070650577545166016, 0.007311344146728516, 0.00755763053894043, 0.007803916931152344, 0.008050203323364258, 0.008296489715576172, 0.008542776107788086, 0.0087890625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 12.0, 17.0, 17.0, 45.0, 94.0, 175.0, 228.0, 160.0, 98.0, 57.0, 42.0, 22.0, 14.0, 5.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1190265566110611, -0.11316927522420883, -0.10731199383735657, -0.1014547049999237, -0.09559742361307144, -0.08974014222621918, -0.08388285338878632, -0.07802557200193405, -0.07216829061508179, -0.06631100922822952, -0.06045372411608696, -0.0545964390039444, -0.04873915761709213, -0.04288187623023987, -0.037024591118097305, -0.031167306005954742, -0.025310024619102478, -0.019452741369605064, -0.01359545812010765, -0.007738174870610237, -0.0018808916211128235, 0.00397639162838459, 0.009833674877882004, 0.015690959990024567, 0.02154824137687683, 0.027405524626374245, 0.03326280787587166, 0.03912009298801422, 0.044977374374866486, 0.05083465576171875, 0.05669194087386131, 0.06254922598600388, 0.06840649247169495, 0.07426377385854721, 0.08012105524539948, 0.08597834408283234, 0.0918356254696846, 0.09769290685653687, 0.10355019569396973, 0.10940747708082199, 0.11526475846767426, 0.12112203985452652, 0.12697932124137878, 0.13283661007881165, 0.1386938989162445, 0.14455117285251617, 0.15040846168994904, 0.1562657356262207, 0.16212302446365356, 0.16798031330108643, 0.1738375872373581, 0.17969487607479095, 0.18555215001106262, 0.19140943884849548, 0.19726672768592834, 0.2031240165233612, 0.20898129045963287, 0.21483857929706573, 0.2206958532333374, 0.22655314207077026, 0.23241043090820312, 0.2382677048444748, 0.24412499368190765, 0.24998226761817932, 0.2558395564556122]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 5.0, 1.0, 9.0, 13.0, 7.0, 9.0, 12.0, 26.0, 24.0, 17.0, 23.0, 24.0, 23.0, 27.0, 28.0, 38.0, 39.0, 44.0, 36.0, 41.0, 30.0, 36.0, 45.0, 42.0, 41.0, 40.0, 40.0, 32.0, 34.0, 32.0, 30.0, 26.0, 36.0, 18.0, 17.0, 7.0, 10.0, 10.0, 11.0, 5.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1458072066307068, -0.14067105948925018, -0.13553489744663239, -0.13039875030517578, -0.12526260316371918, -0.12012644857168198, -0.11499029397964478, -0.10985414683818817, -0.10471799224615097, -0.09958183765411377, -0.09444569051265717, -0.08930953592061996, -0.08417338132858276, -0.07903723418712616, -0.07390107959508896, -0.06876492500305176, -0.06362877786159515, -0.05849262699484825, -0.05335647612810135, -0.04822032153606415, -0.043084170669317245, -0.03794801980257034, -0.03281186521053314, -0.02767571434378624, -0.022539563477039337, -0.017403412610292435, -0.012267259880900383, -0.007131108082830906, -0.001994956284761429, 0.0031411945819854736, 0.008277347311377525, 0.013413500040769577, 0.01854965090751648, 0.023685801774263382, 0.028821954503655434, 0.033958107233047485, 0.03909425809979439, 0.04423040896654129, 0.04936656355857849, 0.054502714425325394, 0.059638865292072296, 0.0647750198841095, 0.0699111670255661, 0.0750473216176033, 0.0801834762096405, 0.0853196233510971, 0.09045577794313431, 0.09559193253517151, 0.10072807967662811, 0.10586423426866531, 0.11100038141012192, 0.11613653600215912, 0.12127268314361572, 0.12640884518623352, 0.13154499232769012, 0.13668113946914673, 0.14181730151176453, 0.14695344865322113, 0.15208961069583893, 0.15722575783729553, 0.16236190497875214, 0.16749805212020874, 0.17263421416282654, 0.17777036130428314, 0.18290650844573975]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 7.0, 13.0, 14.0, 23.0, 30.0, 57.0, 102.0, 316.0, 2322.0, 24708.0, 2484769.0, 1654202.0, 22271.0, 4595.0, 613.0, 87.0, 53.0, 30.0, 28.0, 15.0, 9.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0760498046875, -0.0736703872680664, -0.07129096984863281, -0.06891155242919922, -0.06653213500976562, -0.06415271759033203, -0.06177330017089844, -0.059393882751464844, -0.05701446533203125, -0.054635047912597656, -0.05225563049316406, -0.04987621307373047, -0.047496795654296875, -0.04511737823486328, -0.04273796081542969, -0.040358543395996094, -0.0379791259765625, -0.035599708557128906, -0.03322029113769531, -0.03084087371826172, -0.028461456298828125, -0.02608203887939453, -0.023702621459960938, -0.021323204040527344, -0.01894378662109375, -0.016564369201660156, -0.014184951782226562, -0.011805534362792969, -0.009426116943359375, -0.007046699523925781, -0.0046672821044921875, -0.0022878646850585938, 9.1552734375e-05, 0.0024709701538085938, 0.0048503875732421875, 0.007229804992675781, 0.009609222412109375, 0.011988639831542969, 0.014368057250976562, 0.016747474670410156, 0.01912689208984375, 0.021506309509277344, 0.023885726928710938, 0.02626514434814453, 0.028644561767578125, 0.03102397918701172, 0.03340339660644531, 0.035782814025878906, 0.0381622314453125, 0.040541648864746094, 0.04292106628417969, 0.04530048370361328, 0.047679901123046875, 0.05005931854248047, 0.05243873596191406, 0.054818153381347656, 0.05719757080078125, 0.059576988220214844, 0.06195640563964844, 0.06433582305908203, 0.06671524047851562, 0.06909465789794922, 0.07147407531738281, 0.0738534927368164, 0.07623291015625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 8.0, 19.0, 16.0, 38.0, 36.0, 59.0, 68.0, 88.0, 88.0, 75.0, 101.0, 78.0, 74.0, 68.0, 50.0, 33.0, 29.0, 31.0, 12.0, 9.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058929443359375, -0.05723714828491211, -0.05554485321044922, -0.05385255813598633, -0.05216026306152344, -0.05046796798706055, -0.048775672912597656, -0.047083377838134766, -0.045391082763671875, -0.043698787689208984, -0.042006492614746094, -0.0403141975402832, -0.03862190246582031, -0.03692960739135742, -0.03523731231689453, -0.03354501724243164, -0.03185272216796875, -0.03016042709350586, -0.02846813201904297, -0.026775836944580078, -0.025083541870117188, -0.023391246795654297, -0.021698951721191406, -0.020006656646728516, -0.018314361572265625, -0.016622066497802734, -0.014929771423339844, -0.013237476348876953, -0.011545181274414062, -0.009852886199951172, -0.008160591125488281, -0.006468296051025391, -0.0047760009765625, -0.0030837059020996094, -0.0013914108276367188, 0.0003008842468261719, 0.0019931793212890625, 0.003685474395751953, 0.005377769470214844, 0.007070064544677734, 0.008762359619140625, 0.010454654693603516, 0.012146949768066406, 0.013839244842529297, 0.015531539916992188, 0.017223834991455078, 0.01891613006591797, 0.02060842514038086, 0.02230072021484375, 0.02399301528930664, 0.02568531036376953, 0.027377605438232422, 0.029069900512695312, 0.030762195587158203, 0.032454490661621094, 0.034146785736083984, 0.035839080810546875, 0.037531375885009766, 0.039223670959472656, 0.04091596603393555, 0.04260826110839844, 0.04430055618286133, 0.04599285125732422, 0.04768514633178711, 0.04937744140625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 20.0, 38.0, 54.0, 91.0, 129.0, 238.0, 514.0, 1396.0, 6608.0, 81504.0, 3540940.0, 541698.0, 17014.0, 2594.0, 739.0, 297.0, 150.0, 107.0, 56.0, 42.0, 25.0, 15.0, 8.0, 6.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053955078125, -0.052355289459228516, -0.05075550079345703, -0.04915571212768555, -0.04755592346191406, -0.04595613479614258, -0.044356346130371094, -0.04275655746459961, -0.041156768798828125, -0.03955698013305664, -0.037957191467285156, -0.03635740280151367, -0.03475761413574219, -0.0331578254699707, -0.03155803680419922, -0.029958248138427734, -0.02835845947265625, -0.026758670806884766, -0.02515888214111328, -0.023559093475341797, -0.021959304809570312, -0.020359516143798828, -0.018759727478027344, -0.01715993881225586, -0.015560150146484375, -0.01396036148071289, -0.012360572814941406, -0.010760784149169922, -0.009160995483398438, -0.007561206817626953, -0.005961418151855469, -0.004361629486083984, -0.0027618408203125, -0.0011620521545410156, 0.00043773651123046875, 0.002037525177001953, 0.0036373138427734375, 0.005237102508544922, 0.006836891174316406, 0.00843667984008789, 0.010036468505859375, 0.01163625717163086, 0.013236045837402344, 0.014835834503173828, 0.016435623168945312, 0.018035411834716797, 0.01963520050048828, 0.021234989166259766, 0.02283477783203125, 0.024434566497802734, 0.02603435516357422, 0.027634143829345703, 0.029233932495117188, 0.030833721160888672, 0.032433509826660156, 0.03403329849243164, 0.035633087158203125, 0.03723287582397461, 0.038832664489746094, 0.04043245315551758, 0.04203224182128906, 0.04363203048706055, 0.04523181915283203, 0.046831607818603516, 0.048431396484375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 7.0, 5.0, 12.0, 29.0, 43.0, 135.0, 441.0, 1016.0, 1309.0, 675.0, 251.0, 90.0, 32.0, 8.0, 14.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035186767578125, -0.03389120101928711, -0.03259563446044922, -0.03130006790161133, -0.030004501342773438, -0.028708934783935547, -0.027413368225097656, -0.026117801666259766, -0.024822235107421875, -0.023526668548583984, -0.022231101989746094, -0.020935535430908203, -0.019639968872070312, -0.018344402313232422, -0.01704883575439453, -0.01575326919555664, -0.01445770263671875, -0.01316213607788086, -0.011866569519042969, -0.010571002960205078, -0.009275436401367188, -0.007979869842529297, -0.006684303283691406, -0.005388736724853516, -0.004093170166015625, -0.0027976036071777344, -0.0015020370483398438, -0.00020647048950195312, 0.0010890960693359375, 0.002384662628173828, 0.0036802291870117188, 0.004975795745849609, 0.0062713623046875, 0.007566928863525391, 0.008862495422363281, 0.010158061981201172, 0.011453628540039062, 0.012749195098876953, 0.014044761657714844, 0.015340328216552734, 0.016635894775390625, 0.017931461334228516, 0.019227027893066406, 0.020522594451904297, 0.021818161010742188, 0.023113727569580078, 0.02440929412841797, 0.02570486068725586, 0.02700042724609375, 0.02829599380493164, 0.02959156036376953, 0.030887126922607422, 0.03218269348144531, 0.0334782600402832, 0.034773826599121094, 0.036069393157958984, 0.037364959716796875, 0.038660526275634766, 0.039956092834472656, 0.04125165939331055, 0.04254722595214844, 0.04384279251098633, 0.04513835906982422, 0.04643392562866211, 0.0477294921875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 27.0, 110.0, 363.0, 355.0, 118.0, 21.0, 5.0, 1.0, 3.0], "bins": [-0.4615025818347931, -0.45355406403541565, -0.4456055462360382, -0.43765705823898315, -0.4297085404396057, -0.42176002264022827, -0.41381150484085083, -0.4058629870414734, -0.39791446924209595, -0.3899659514427185, -0.38201743364334106, -0.3740689158439636, -0.36612042784690857, -0.35817191004753113, -0.3502233922481537, -0.34227487444877625, -0.3343263864517212, -0.32637786865234375, -0.3184293508529663, -0.31048083305358887, -0.3025323450565338, -0.29458382725715637, -0.28663530945777893, -0.2786867916584015, -0.27073827385902405, -0.2627897560596466, -0.25484123826026917, -0.24689273536205292, -0.23894421756267548, -0.23099571466445923, -0.2230471968650818, -0.21509867906570435, -0.2071501910686493, -0.19920167326927185, -0.1912531703710556, -0.18330465257167816, -0.17535613477230072, -0.16740763187408447, -0.15945911407470703, -0.1515105962753296, -0.14356207847595215, -0.1356135606765747, -0.12766505777835846, -0.11971653997898102, -0.11176802217960358, -0.10381951183080673, -0.09587100148200989, -0.08792248368263245, -0.0799739807844162, -0.07202547043561935, -0.06407695263624191, -0.05612844228744507, -0.048179928213357925, -0.04023141413927078, -0.03228290379047394, -0.024334389716386795, -0.016385871917009354, -0.008437358774244785, -0.000488845631480217, 0.007459666579961777, 0.01540818065404892, 0.023356694728136063, 0.03130520507693291, 0.03925371915102005, 0.04720223322510719]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 5.0, 6.0, 9.0, 10.0, 10.0, 12.0, 11.0, 22.0, 15.0, 21.0, 26.0, 26.0, 19.0, 35.0, 33.0, 32.0, 46.0, 30.0, 48.0, 39.0, 34.0, 35.0, 48.0, 34.0, 45.0, 37.0, 41.0, 30.0, 34.0, 24.0, 29.0, 21.0, 22.0, 25.0, 13.0, 13.0, 7.0, 12.0, 8.0, 9.0, 11.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04703885316848755, -0.04540310427546501, -0.043767355382442474, -0.04213160648941994, -0.0404958575963974, -0.03886010870337486, -0.037224359810352325, -0.03558861091732979, -0.03395286202430725, -0.032317113131284714, -0.030681364238262177, -0.02904561534523964, -0.027409866452217102, -0.025774117559194565, -0.024138368666172028, -0.02250261977314949, -0.020866870880126953, -0.019231121987104416, -0.01759537309408188, -0.01595962420105934, -0.014323875308036804, -0.012688126415014267, -0.01105237752199173, -0.009416628628969193, -0.007780879735946655, -0.006145130842924118, -0.004509381949901581, -0.0028736330568790436, -0.0012378841638565063, 0.0003978647291660309, 0.002033613622188568, 0.0036693625152111053, 0.005305111408233643, 0.00694086030125618, 0.008576609194278717, 0.010212358087301254, 0.011848106980323792, 0.013483855873346329, 0.015119604766368866, 0.016755353659391403, 0.01839110255241394, 0.020026851445436478, 0.021662600338459015, 0.023298349231481552, 0.02493409812450409, 0.026569847017526627, 0.028205595910549164, 0.0298413448035717, 0.03147709369659424, 0.033112842589616776, 0.03474859148263931, 0.03638434037566185, 0.03802008926868439, 0.039655838161706924, 0.04129158705472946, 0.042927335947752, 0.044563084840774536, 0.04619883373379707, 0.04783458262681961, 0.04947033151984215, 0.051106080412864685, 0.05274182930588722, 0.05437757819890976, 0.0560133270919323, 0.057649075984954834]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 8.0, 9.0, 10.0, 19.0, 28.0, 34.0, 40.0, 53.0, 69.0, 117.0, 161.0, 256.0, 374.0, 643.0, 1004.0, 2025.0, 4346.0, 10901.0, 31719.0, 101208.0, 322877.0, 377703.0, 131051.0, 39719.0, 13339.0, 5249.0, 2345.0, 1160.0, 698.0, 412.0, 266.0, 212.0, 134.0, 96.0, 74.0, 54.0, 42.0, 31.0, 16.0, 14.0, 11.0, 9.0, 6.0, 6.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0310211181640625, -0.030023813247680664, -0.029026508331298828, -0.028029203414916992, -0.027031898498535156, -0.02603459358215332, -0.025037288665771484, -0.02403998374938965, -0.023042678833007812, -0.022045373916625977, -0.02104806900024414, -0.020050764083862305, -0.01905345916748047, -0.018056154251098633, -0.017058849334716797, -0.01606154441833496, -0.015064239501953125, -0.014066934585571289, -0.013069629669189453, -0.012072324752807617, -0.011075019836425781, -0.010077714920043945, -0.00908041000366211, -0.008083105087280273, -0.0070858001708984375, -0.0060884952545166016, -0.005091190338134766, -0.00409388542175293, -0.0030965805053710938, -0.002099275588989258, -0.0011019706726074219, -0.00010466575622558594, 0.00089263916015625, 0.001889944076538086, 0.002887248992919922, 0.003884553909301758, 0.004881858825683594, 0.00587916374206543, 0.006876468658447266, 0.007873773574829102, 0.008871078491210938, 0.009868383407592773, 0.01086568832397461, 0.011862993240356445, 0.012860298156738281, 0.013857603073120117, 0.014854907989501953, 0.01585221290588379, 0.016849517822265625, 0.01784682273864746, 0.018844127655029297, 0.019841432571411133, 0.02083873748779297, 0.021836042404174805, 0.02283334732055664, 0.023830652236938477, 0.024827957153320312, 0.02582526206970215, 0.026822566986083984, 0.02781987190246582, 0.028817176818847656, 0.029814481735229492, 0.030811786651611328, 0.031809091567993164, 0.032806396484375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 8.0, 16.0, 19.0, 30.0, 40.0, 53.0, 70.0, 75.0, 77.0, 99.0, 108.0, 71.0, 81.0, 61.0, 57.0, 42.0, 32.0, 19.0, 16.0, 11.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.065673828125, -0.06399154663085938, -0.06230926513671875, -0.060626983642578125, -0.0589447021484375, -0.057262420654296875, -0.05558013916015625, -0.053897857666015625, -0.052215576171875, -0.050533294677734375, -0.04885101318359375, -0.047168731689453125, -0.0454864501953125, -0.043804168701171875, -0.04212188720703125, -0.040439605712890625, -0.03875732421875, -0.037075042724609375, -0.03539276123046875, -0.033710479736328125, -0.0320281982421875, -0.030345916748046875, -0.02866363525390625, -0.026981353759765625, -0.025299072265625, -0.023616790771484375, -0.02193450927734375, -0.020252227783203125, -0.0185699462890625, -0.016887664794921875, -0.01520538330078125, -0.013523101806640625, -0.0118408203125, -0.010158538818359375, -0.00847625732421875, -0.006793975830078125, -0.0051116943359375, -0.003429412841796875, -0.00174713134765625, -6.4849853515625e-05, 0.001617431640625, 0.003299713134765625, 0.00498199462890625, 0.006664276123046875, 0.0083465576171875, 0.010028839111328125, 0.01171112060546875, 0.013393402099609375, 0.01507568359375, 0.016757965087890625, 0.01844024658203125, 0.020122528076171875, 0.0218048095703125, 0.023487091064453125, 0.02516937255859375, 0.026851654052734375, 0.028533935546875, 0.030216217041015625, 0.03189849853515625, 0.033580780029296875, 0.0352630615234375, 0.036945343017578125, 0.03862762451171875, 0.040309906005859375, 0.0419921875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 12.0, 9.0, 9.0, 9.0, 13.0, 16.0, 9.0, 20.0, 20.0, 29.0, 24.0, 22.0, 28.0, 46.0, 64.0, 117.0, 299.0, 818.0, 4075.0, 30770.0, 407368.0, 554574.0, 43084.0, 5198.0, 1081.0, 341.0, 148.0, 73.0, 49.0, 30.0, 23.0, 18.0, 15.0, 17.0, 15.0, 13.0, 17.0, 10.0, 11.0, 5.0, 9.0, 10.0, 4.0, 12.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0], "bins": [-0.0772705078125, -0.07506752014160156, -0.07286453247070312, -0.07066154479980469, -0.06845855712890625, -0.06625556945800781, -0.06405258178710938, -0.06184959411621094, -0.0596466064453125, -0.05744361877441406, -0.055240631103515625, -0.05303764343261719, -0.05083465576171875, -0.04863166809082031, -0.046428680419921875, -0.04422569274902344, -0.042022705078125, -0.03981971740722656, -0.037616729736328125, -0.03541374206542969, -0.03321075439453125, -0.031007766723632812, -0.028804779052734375, -0.026601791381835938, -0.0243988037109375, -0.022195816040039062, -0.019992828369140625, -0.017789840698242188, -0.01558685302734375, -0.013383865356445312, -0.011180877685546875, -0.008977890014648438, -0.00677490234375, -0.0045719146728515625, -0.002368927001953125, -0.0001659393310546875, 0.00203704833984375, 0.0042400360107421875, 0.006443023681640625, 0.008646011352539062, 0.0108489990234375, 0.013051986694335938, 0.015254974365234375, 0.017457962036132812, 0.01966094970703125, 0.021863937377929688, 0.024066925048828125, 0.026269912719726562, 0.028472900390625, 0.030675888061523438, 0.032878875732421875, 0.03508186340332031, 0.03728485107421875, 0.03948783874511719, 0.041690826416015625, 0.04389381408691406, 0.0460968017578125, 0.04829978942871094, 0.050502777099609375, 0.05270576477050781, 0.05490875244140625, 0.05711174011230469, 0.059314727783203125, 0.06151771545410156, 0.063720703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 6.0, 5.0, 7.0, 5.0, 5.0, 7.0, 8.0, 10.0, 11.0, 11.0, 18.0, 12.0, 14.0, 18.0, 18.0, 15.0, 22.0, 33.0, 21.0, 37.0, 38.0, 37.0, 40.0, 39.0, 31.0, 43.0, 30.0, 48.0, 24.0, 35.0, 33.0, 31.0, 35.0, 22.0, 23.0, 29.0, 27.0, 18.0, 18.0, 21.0, 10.0, 10.0, 14.0, 13.0, 14.0, 7.0, 11.0, 3.0, 7.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0426025390625, -0.04111003875732422, -0.03961753845214844, -0.038125038146972656, -0.036632537841796875, -0.035140037536621094, -0.03364753723144531, -0.03215503692626953, -0.03066253662109375, -0.02917003631591797, -0.027677536010742188, -0.026185035705566406, -0.024692535400390625, -0.023200035095214844, -0.021707534790039062, -0.02021503448486328, -0.0187225341796875, -0.01723003387451172, -0.015737533569335938, -0.014245033264160156, -0.012752532958984375, -0.011260032653808594, -0.009767532348632812, -0.008275032043457031, -0.00678253173828125, -0.005290031433105469, -0.0037975311279296875, -0.0023050308227539062, -0.000812530517578125, 0.0006799697875976562, 0.0021724700927734375, 0.0036649703979492188, 0.005157470703125, 0.006649971008300781, 0.008142471313476562, 0.009634971618652344, 0.011127471923828125, 0.012619972229003906, 0.014112472534179688, 0.015604972839355469, 0.01709747314453125, 0.01858997344970703, 0.020082473754882812, 0.021574974060058594, 0.023067474365234375, 0.024559974670410156, 0.026052474975585938, 0.02754497528076172, 0.0290374755859375, 0.03052997589111328, 0.03202247619628906, 0.033514976501464844, 0.035007476806640625, 0.036499977111816406, 0.03799247741699219, 0.03948497772216797, 0.04097747802734375, 0.04246997833251953, 0.04396247863769531, 0.045454978942871094, 0.046947479248046875, 0.048439979553222656, 0.04993247985839844, 0.05142498016357422, 0.05291748046875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 7.0, 6.0, 14.0, 12.0, 27.0, 44.0, 71.0, 107.0, 151.0, 220.0, 395.0, 832.0, 1416.0, 2815.0, 5834.0, 13423.0, 33945.0, 98807.0, 260171.0, 341201.0, 184017.0, 63951.0, 22782.0, 9433.0, 4185.0, 2103.0, 1106.0, 601.0, 337.0, 189.0, 124.0, 80.0, 52.0, 30.0, 24.0, 11.0, 13.0, 6.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0061798095703125, -0.005994200706481934, -0.005808591842651367, -0.005622982978820801, -0.005437374114990234, -0.005251765251159668, -0.0050661563873291016, -0.004880547523498535, -0.004694938659667969, -0.004509329795837402, -0.004323720932006836, -0.0041381120681762695, -0.003952503204345703, -0.0037668943405151367, -0.0035812854766845703, -0.003395676612854004, -0.0032100677490234375, -0.003024458885192871, -0.0028388500213623047, -0.0026532411575317383, -0.002467632293701172, -0.0022820234298706055, -0.002096414566040039, -0.0019108057022094727, -0.0017251968383789062, -0.0015395879745483398, -0.0013539791107177734, -0.001168370246887207, -0.0009827613830566406, -0.0007971525192260742, -0.0006115436553955078, -0.0004259347915649414, -0.000240325927734375, -5.4717063903808594e-05, 0.0001308917999267578, 0.0003165006637573242, 0.0005021095275878906, 0.000687718391418457, 0.0008733272552490234, 0.0010589361190795898, 0.0012445449829101562, 0.0014301538467407227, 0.001615762710571289, 0.0018013715744018555, 0.001986980438232422, 0.0021725893020629883, 0.0023581981658935547, 0.002543807029724121, 0.0027294158935546875, 0.002915024757385254, 0.0031006336212158203, 0.0032862424850463867, 0.003471851348876953, 0.0036574602127075195, 0.003843069076538086, 0.004028677940368652, 0.004214286804199219, 0.004399895668029785, 0.0045855045318603516, 0.004771113395690918, 0.004956722259521484, 0.005142331123352051, 0.005327939987182617, 0.005513548851013184, 0.00569915771484375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 8.0, 5.0, 6.0, 11.0, 10.0, 9.0, 23.0, 28.0, 30.0, 39.0, 32.0, 40.0, 30.0, 39.0, 38.0, 51.0, 37.0, 56.0, 54.0, 47.0, 47.0, 43.0, 52.0, 25.0, 45.0, 22.0, 27.0, 27.0, 16.0, 14.0, 14.0, 12.0, 11.0, 9.0, 8.0, 7.0, 5.0, 2.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6093254089355469e-06, -1.5506520867347717e-06, -1.4919787645339966e-06, -1.4333054423332214e-06, -1.3746321201324463e-06, -1.3159587979316711e-06, -1.257285475730896e-06, -1.1986121535301208e-06, -1.1399388313293457e-06, -1.0812655091285706e-06, -1.0225921869277954e-06, -9.639188647270203e-07, -9.052455425262451e-07, -8.4657222032547e-07, -7.878988981246948e-07, -7.292255759239197e-07, -6.705522537231445e-07, -6.118789315223694e-07, -5.532056093215942e-07, -4.945322871208191e-07, -4.3585896492004395e-07, -3.771856427192688e-07, -3.1851232051849365e-07, -2.598389983177185e-07, -2.0116567611694336e-07, -1.424923539161682e-07, -8.381903171539307e-08, -2.514570951461792e-08, 3.3527612686157227e-08, 9.220093488693237e-08, 1.5087425708770752e-07, 2.0954757928848267e-07, 2.682209014892578e-07, 3.2689422369003296e-07, 3.855675458908081e-07, 4.4424086809158325e-07, 5.029141902923584e-07, 5.615875124931335e-07, 6.202608346939087e-07, 6.789341568946838e-07, 7.37607479095459e-07, 7.962808012962341e-07, 8.549541234970093e-07, 9.136274456977844e-07, 9.723007678985596e-07, 1.0309740900993347e-06, 1.0896474123001099e-06, 1.148320734500885e-06, 1.2069940567016602e-06, 1.2656673789024353e-06, 1.3243407011032104e-06, 1.3830140233039856e-06, 1.4416873455047607e-06, 1.5003606677055359e-06, 1.559033989906311e-06, 1.6177073121070862e-06, 1.6763806343078613e-06, 1.7350539565086365e-06, 1.7937272787094116e-06, 1.8524006009101868e-06, 1.911073923110962e-06, 1.969747245311737e-06, 2.028420567512512e-06, 2.0870938897132874e-06, 2.1457672119140625e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 3.0, 7.0, 16.0, 21.0, 48.0, 77.0, 127.0, 223.0, 516.0, 1507.0, 5743.0, 34746.0, 280234.0, 585653.0, 118903.0, 15842.0, 3156.0, 922.0, 371.0, 198.0, 95.0, 60.0, 25.0, 16.0, 15.0, 13.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0108642578125, -0.010480284690856934, -0.010096311569213867, -0.0097123384475708, -0.009328365325927734, -0.008944392204284668, -0.008560419082641602, -0.008176445960998535, -0.007792472839355469, -0.007408499717712402, -0.007024526596069336, -0.0066405534744262695, -0.006256580352783203, -0.005872607231140137, -0.00548863410949707, -0.005104660987854004, -0.0047206878662109375, -0.004336714744567871, -0.003952741622924805, -0.0035687685012817383, -0.003184795379638672, -0.0028008222579956055, -0.002416849136352539, -0.0020328760147094727, -0.0016489028930664062, -0.0012649297714233398, -0.0008809566497802734, -0.000496983528137207, -0.00011301040649414062, 0.0002709627151489258, 0.0006549358367919922, 0.0010389089584350586, 0.001422882080078125, 0.0018068552017211914, 0.002190828323364258, 0.0025748014450073242, 0.0029587745666503906, 0.003342747688293457, 0.0037267208099365234, 0.00411069393157959, 0.004494667053222656, 0.004878640174865723, 0.005262613296508789, 0.0056465864181518555, 0.006030559539794922, 0.006414532661437988, 0.006798505783081055, 0.007182478904724121, 0.0075664520263671875, 0.007950425148010254, 0.00833439826965332, 0.008718371391296387, 0.009102344512939453, 0.00948631763458252, 0.009870290756225586, 0.010254263877868652, 0.010638236999511719, 0.011022210121154785, 0.011406183242797852, 0.011790156364440918, 0.012174129486083984, 0.01255810260772705, 0.012942075729370117, 0.013326048851013184, 0.01371002197265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 3.0, 4.0, 6.0, 6.0, 4.0, 6.0, 9.0, 11.0, 13.0, 20.0, 37.0, 41.0, 43.0, 51.0, 72.0, 85.0, 77.0, 79.0, 84.0, 76.0, 51.0, 37.0, 47.0, 28.0, 27.0, 17.0, 18.0, 14.0, 11.0, 10.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007251739501953125, -0.007016599178314209, -0.006781458854675293, -0.006546318531036377, -0.006311178207397461, -0.006076037883758545, -0.005840897560119629, -0.005605757236480713, -0.005370616912841797, -0.005135476589202881, -0.004900336265563965, -0.004665195941925049, -0.004430055618286133, -0.004194915294647217, -0.003959774971008301, -0.0037246346473693848, -0.0034894943237304688, -0.0032543540000915527, -0.0030192136764526367, -0.0027840733528137207, -0.0025489330291748047, -0.0023137927055358887, -0.0020786523818969727, -0.0018435120582580566, -0.0016083717346191406, -0.0013732314109802246, -0.0011380910873413086, -0.0009029507637023926, -0.0006678104400634766, -0.00043267011642456055, -0.00019752979278564453, 3.7610530853271484e-05, 0.0002727508544921875, 0.0005078911781311035, 0.0007430315017700195, 0.0009781718254089355, 0.0012133121490478516, 0.0014484524726867676, 0.0016835927963256836, 0.0019187331199645996, 0.0021538734436035156, 0.0023890137672424316, 0.0026241540908813477, 0.0028592944145202637, 0.0030944347381591797, 0.0033295750617980957, 0.0035647153854370117, 0.0037998557090759277, 0.004034996032714844, 0.00427013635635376, 0.004505276679992676, 0.004740417003631592, 0.004975557327270508, 0.005210697650909424, 0.00544583797454834, 0.005680978298187256, 0.005916118621826172, 0.006151258945465088, 0.006386399269104004, 0.00662153959274292, 0.006856679916381836, 0.007091820240020752, 0.007326960563659668, 0.007562100887298584, 0.0077972412109375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 7.0, 16.0, 34.0, 62.0, 158.0, 224.0, 241.0, 133.0, 66.0, 26.0, 18.0, 9.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2651014029979706, -0.2591797113418579, -0.25325801968574524, -0.24733632802963257, -0.2414146214723587, -0.23549292981624603, -0.22957123816013336, -0.2236495465040207, -0.21772783994674683, -0.21180614829063416, -0.20588445663452148, -0.1999627649784088, -0.19404105842113495, -0.18811936676502228, -0.1821976751089096, -0.17627598345279694, -0.17035429179668427, -0.1644326001405716, -0.15851090848445892, -0.15258920192718506, -0.1466675102710724, -0.14074581861495972, -0.13482412695884705, -0.12890243530273438, -0.12298073619604111, -0.11705904453992844, -0.11113734543323517, -0.1052156537771225, -0.09929396212100983, -0.09337226301431656, -0.08745057135820389, -0.08152887225151062, -0.07560718804597855, -0.06968549638986588, -0.06376379728317261, -0.057842105627059937, -0.05192041024565697, -0.045998714864254, -0.04007702320814133, -0.03415532782673836, -0.028233632445335388, -0.02231193706393242, -0.0163902435451746, -0.010468550026416779, -0.004546854645013809, 0.0013748407363891602, 0.007296532392501831, 0.0132182277739048, 0.01913992315530777, 0.02506161853671074, 0.03098331205546856, 0.03690500557422638, 0.04282670095562935, 0.04874839633703232, 0.05467008799314499, 0.06059178337454796, 0.06651347875595093, 0.0724351704120636, 0.07835686951875687, 0.08427856117486954, 0.0902002602815628, 0.09612195193767548, 0.10204364359378815, 0.10796533524990082, 0.11388703435659409]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 6.0, 4.0, 5.0, 6.0, 9.0, 9.0, 13.0, 19.0, 22.0, 32.0, 23.0, 31.0, 36.0, 44.0, 28.0, 37.0, 39.0, 50.0, 37.0, 53.0, 53.0, 39.0, 53.0, 44.0, 39.0, 39.0, 33.0, 28.0, 32.0, 31.0, 21.0, 12.0, 11.0, 16.0, 10.0, 12.0, 5.0, 4.0, 8.0, 9.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16776782274246216, -0.16294652223587036, -0.15812523663043976, -0.15330393612384796, -0.14848263561725616, -0.14366135001182556, -0.13884004950523376, -0.13401874899864197, -0.12919744849205017, -0.12437615543603897, -0.11955485492944717, -0.11473356187343597, -0.10991226136684418, -0.10509096831083298, -0.10026967525482178, -0.09544837474822998, -0.09062708914279938, -0.08580579608678818, -0.08098449558019638, -0.07616320252418518, -0.07134190201759338, -0.06652060896158218, -0.061699315905570984, -0.056878019124269485, -0.05205672234296799, -0.04723542556166649, -0.04241412878036499, -0.03759283572435379, -0.03277153894305229, -0.027950242161750793, -0.023128947243094444, -0.018307652324438095, -0.013486355543136597, -0.008665059693157673, -0.003843763843178749, 0.0009775320068001747, 0.0057988278567790985, 0.010620124638080597, 0.015441419556736946, 0.020262714475393295, 0.025084011256694794, 0.029905308037996292, 0.03472660481929779, 0.03954789787530899, 0.04436919465661049, 0.04919049143791199, 0.05401178449392319, 0.058833081275224686, 0.06365437805652618, 0.06847567111253738, 0.07329697161912918, 0.07811826467514038, 0.08293956518173218, 0.08776085823774338, 0.09258215129375458, 0.09740345180034637, 0.10222474485635757, 0.10704603791236877, 0.11186733841896057, 0.11668863147497177, 0.12150992453098297, 0.12633122503757477, 0.13115252554416656, 0.13597381114959717, 0.14079511165618896]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 18.0, 15.0, 37.0, 40.0, 59.0, 132.0, 308.0, 1675.0, 7320.0, 33557.0, 703032.0, 3067852.0, 347150.0, 23709.0, 5970.0, 2389.0, 705.0, 128.0, 64.0, 34.0, 27.0, 17.0, 4.0, 4.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.049896240234375, -0.0483555793762207, -0.046814918518066406, -0.04527425765991211, -0.04373359680175781, -0.042192935943603516, -0.04065227508544922, -0.03911161422729492, -0.037570953369140625, -0.03603029251098633, -0.03448963165283203, -0.032948970794677734, -0.03140830993652344, -0.02986764907836914, -0.028326988220214844, -0.026786327362060547, -0.02524566650390625, -0.023705005645751953, -0.022164344787597656, -0.02062368392944336, -0.019083023071289062, -0.017542362213134766, -0.01600170135498047, -0.014461040496826172, -0.012920379638671875, -0.011379718780517578, -0.009839057922363281, -0.008298397064208984, -0.0067577362060546875, -0.005217075347900391, -0.0036764144897460938, -0.002135753631591797, -0.0005950927734375, 0.0009455680847167969, 0.0024862289428710938, 0.004026889801025391, 0.0055675506591796875, 0.007108211517333984, 0.008648872375488281, 0.010189533233642578, 0.011730194091796875, 0.013270854949951172, 0.014811515808105469, 0.016352176666259766, 0.017892837524414062, 0.01943349838256836, 0.020974159240722656, 0.022514820098876953, 0.02405548095703125, 0.025596141815185547, 0.027136802673339844, 0.02867746353149414, 0.030218124389648438, 0.031758785247802734, 0.03329944610595703, 0.03484010696411133, 0.036380767822265625, 0.03792142868041992, 0.03946208953857422, 0.041002750396728516, 0.04254341125488281, 0.04408407211303711, 0.045624732971191406, 0.0471653938293457, 0.0487060546875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 7.0, 17.0, 19.0, 24.0, 33.0, 44.0, 53.0, 77.0, 57.0, 108.0, 78.0, 80.0, 70.0, 91.0, 53.0, 38.0, 50.0, 29.0, 26.0, 16.0, 8.0, 7.0, 6.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.057952880859375, -0.05637216567993164, -0.05479145050048828, -0.05321073532104492, -0.05163002014160156, -0.0500493049621582, -0.048468589782714844, -0.046887874603271484, -0.045307159423828125, -0.043726444244384766, -0.042145729064941406, -0.04056501388549805, -0.03898429870605469, -0.03740358352661133, -0.03582286834716797, -0.03424215316772461, -0.03266143798828125, -0.03108072280883789, -0.02950000762939453, -0.027919292449951172, -0.026338577270507812, -0.024757862091064453, -0.023177146911621094, -0.021596431732177734, -0.020015716552734375, -0.018435001373291016, -0.016854286193847656, -0.015273571014404297, -0.013692855834960938, -0.012112140655517578, -0.010531425476074219, -0.00895071029663086, -0.0073699951171875, -0.005789279937744141, -0.004208564758300781, -0.002627849578857422, -0.0010471343994140625, 0.0005335807800292969, 0.0021142959594726562, 0.0036950111389160156, 0.005275726318359375, 0.006856441497802734, 0.008437156677246094, 0.010017871856689453, 0.011598587036132812, 0.013179302215576172, 0.014760017395019531, 0.01634073257446289, 0.01792144775390625, 0.01950216293334961, 0.02108287811279297, 0.022663593292236328, 0.024244308471679688, 0.025825023651123047, 0.027405738830566406, 0.028986454010009766, 0.030567169189453125, 0.032147884368896484, 0.033728599548339844, 0.0353093147277832, 0.03689002990722656, 0.03847074508666992, 0.04005146026611328, 0.04163217544555664, 0.043212890625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 1.0, 4.0, 11.0, 14.0, 28.0, 17.0, 43.0, 48.0, 82.0, 136.0, 198.0, 384.0, 594.0, 1059.0, 1919.0, 3613.0, 7492.0, 17886.0, 54848.0, 279342.0, 2238958.0, 1364761.0, 158190.0, 38219.0, 13626.0, 6080.0, 2951.0, 1547.0, 876.0, 486.0, 317.0, 180.0, 128.0, 78.0, 56.0, 36.0, 20.0, 10.0, 13.0, 4.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.02130126953125, -0.020610809326171875, -0.01992034912109375, -0.019229888916015625, -0.0185394287109375, -0.017848968505859375, -0.01715850830078125, -0.016468048095703125, -0.015777587890625, -0.015087127685546875, -0.01439666748046875, -0.013706207275390625, -0.0130157470703125, -0.012325286865234375, -0.01163482666015625, -0.010944366455078125, -0.01025390625, -0.009563446044921875, -0.00887298583984375, -0.008182525634765625, -0.0074920654296875, -0.006801605224609375, -0.00611114501953125, -0.005420684814453125, -0.004730224609375, -0.004039764404296875, -0.00334930419921875, -0.002658843994140625, -0.0019683837890625, -0.001277923583984375, -0.00058746337890625, 0.000102996826171875, 0.00079345703125, 0.001483917236328125, 0.00217437744140625, 0.002864837646484375, 0.0035552978515625, 0.004245758056640625, 0.00493621826171875, 0.005626678466796875, 0.006317138671875, 0.007007598876953125, 0.00769805908203125, 0.008388519287109375, 0.0090789794921875, 0.009769439697265625, 0.01045989990234375, 0.011150360107421875, 0.0118408203125, 0.012531280517578125, 0.01322174072265625, 0.013912200927734375, 0.0146026611328125, 0.015293121337890625, 0.01598358154296875, 0.016674041748046875, 0.017364501953125, 0.018054962158203125, 0.01874542236328125, 0.019435882568359375, 0.0201263427734375, 0.020816802978515625, 0.02150726318359375, 0.022197723388671875, 0.02288818359375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 4.0, 10.0, 19.0, 11.0, 16.0, 37.0, 91.0, 184.0, 374.0, 658.0, 849.0, 711.0, 508.0, 257.0, 133.0, 65.0, 36.0, 19.0, 14.0, 13.0, 8.0, 11.0, 8.0, 4.0, 0.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.036865234375, -0.03586101531982422, -0.03485679626464844, -0.033852577209472656, -0.032848358154296875, -0.031844139099121094, -0.030839920043945312, -0.02983570098876953, -0.02883148193359375, -0.02782726287841797, -0.026823043823242188, -0.025818824768066406, -0.024814605712890625, -0.023810386657714844, -0.022806167602539062, -0.02180194854736328, -0.0207977294921875, -0.01979351043701172, -0.018789291381835938, -0.017785072326660156, -0.016780853271484375, -0.015776634216308594, -0.014772415161132812, -0.013768196105957031, -0.01276397705078125, -0.011759757995605469, -0.010755538940429688, -0.009751319885253906, -0.008747100830078125, -0.007742881774902344, -0.0067386627197265625, -0.005734443664550781, -0.004730224609375, -0.0037260055541992188, -0.0027217864990234375, -0.0017175674438476562, -0.000713348388671875, 0.00029087066650390625, 0.0012950897216796875, 0.0022993087768554688, 0.00330352783203125, 0.004307746887207031, 0.0053119659423828125, 0.006316184997558594, 0.007320404052734375, 0.008324623107910156, 0.009328842163085938, 0.010333061218261719, 0.0113372802734375, 0.012341499328613281, 0.013345718383789062, 0.014349937438964844, 0.015354156494140625, 0.016358375549316406, 0.017362594604492188, 0.01836681365966797, 0.01937103271484375, 0.02037525177001953, 0.021379470825195312, 0.022383689880371094, 0.023387908935546875, 0.024392127990722656, 0.025396347045898438, 0.02640056610107422, 0.02740478515625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 31.0, 85.0, 225.0, 313.0, 227.0, 79.0, 31.0, 8.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.43116649985313416, -0.4231215715408325, -0.4150766432285309, -0.40703171491622925, -0.3989867866039276, -0.390941858291626, -0.38289692997932434, -0.3748520016670227, -0.36680710315704346, -0.3587621748447418, -0.3507172465324402, -0.34267231822013855, -0.3346273899078369, -0.3265824615955353, -0.31853753328323364, -0.3104926347732544, -0.30244767665863037, -0.29440274834632874, -0.2863578200340271, -0.27831289172172546, -0.27026796340942383, -0.2622230350971222, -0.25417810678482056, -0.24613319337368011, -0.23808826506137848, -0.23004333674907684, -0.2219984084367752, -0.21395348012447357, -0.20590856671333313, -0.1978636384010315, -0.18981871008872986, -0.18177378177642822, -0.1737288534641266, -0.16568392515182495, -0.15763899683952332, -0.14959406852722168, -0.14154914021492004, -0.1335042119026184, -0.12545929849147797, -0.11741437017917633, -0.10936944931745529, -0.10132452100515366, -0.09327960014343262, -0.08523467183113098, -0.07718974351882935, -0.06914481520652771, -0.06109989061951637, -0.053054966032505035, -0.0450100377202034, -0.036965109407901764, -0.028920184820890427, -0.02087525837123394, -0.012830331921577454, -0.004785403609275818, 0.0032595209777355194, 0.011304445564746857, 0.019349373877048492, 0.02739430032670498, 0.035439226776361465, 0.0434841513633728, 0.05152907967567444, 0.059574007987976074, 0.06761893630027771, 0.07566385716199875, 0.08370878547430038]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 10.0, 7.0, 11.0, 13.0, 16.0, 16.0, 19.0, 25.0, 24.0, 28.0, 41.0, 39.0, 46.0, 38.0, 46.0, 37.0, 48.0, 40.0, 55.0, 47.0, 43.0, 48.0, 41.0, 39.0, 40.0, 31.0, 38.0, 25.0, 9.0, 16.0, 15.0, 11.0, 8.0, 11.0, 3.0, 2.0, 5.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.08533340692520142, -0.08290427923202515, -0.08047515898942947, -0.0780460312962532, -0.07561691105365753, -0.07318778336048126, -0.07075865566730499, -0.06832952797412872, -0.06590040773153305, -0.06347128003835678, -0.06104215979576111, -0.05861303210258484, -0.05618390813469887, -0.0537547841668129, -0.05132565647363663, -0.048896532505750656, -0.046467408537864685, -0.044038284569978714, -0.04160916060209274, -0.03918003290891647, -0.0367509089410305, -0.03432178497314453, -0.03189265727996826, -0.02946353331208229, -0.02703440934419632, -0.02460528537631035, -0.022176159545779228, -0.019747033715248108, -0.017317909747362137, -0.014888784848153591, -0.012459659948945045, -0.010030534118413925, -0.007601410150527954, -0.005172285251319408, -0.0027431603521108627, -0.00031403545290231705, 0.0021150894463062286, 0.004544214345514774, 0.00697333924472332, 0.00940246507525444, 0.011831589043140411, 0.014260713942348957, 0.016689838841557503, 0.019118964672088623, 0.021548088639974594, 0.023977212607860565, 0.026406338438391685, 0.028835464268922806, 0.03126458823680878, 0.03369371220469475, 0.03612283617258072, 0.03855196386575699, 0.04098108783364296, 0.04341021180152893, 0.0458393394947052, 0.04826846346259117, 0.05069758743047714, 0.05312671139836311, 0.055555835366249084, 0.057984963059425354, 0.060414087027311325, 0.0628432109951973, 0.06527233868837357, 0.06770145893096924, 0.07013058662414551]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 10.0, 7.0, 13.0, 15.0, 28.0, 36.0, 54.0, 70.0, 89.0, 146.0, 204.0, 340.0, 425.0, 739.0, 1401.0, 2667.0, 5989.0, 15535.0, 47155.0, 161452.0, 412866.0, 274763.0, 82060.0, 25121.0, 9104.0, 3786.0, 1766.0, 1006.0, 523.0, 360.0, 252.0, 179.0, 109.0, 76.0, 64.0, 34.0, 27.0, 26.0, 15.0, 11.0, 9.0, 13.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03277587890625, -0.03170919418334961, -0.03064250946044922, -0.029575824737548828, -0.028509140014648438, -0.027442455291748047, -0.026375770568847656, -0.025309085845947266, -0.024242401123046875, -0.023175716400146484, -0.022109031677246094, -0.021042346954345703, -0.019975662231445312, -0.018908977508544922, -0.01784229278564453, -0.01677560806274414, -0.01570892333984375, -0.01464223861694336, -0.013575553894042969, -0.012508869171142578, -0.011442184448242188, -0.010375499725341797, -0.009308815002441406, -0.008242130279541016, -0.007175445556640625, -0.006108760833740234, -0.005042076110839844, -0.003975391387939453, -0.0029087066650390625, -0.0018420219421386719, -0.0007753372192382812, 0.0002913475036621094, 0.0013580322265625, 0.0024247169494628906, 0.0034914016723632812, 0.004558086395263672, 0.0056247711181640625, 0.006691455841064453, 0.007758140563964844, 0.008824825286865234, 0.009891510009765625, 0.010958194732666016, 0.012024879455566406, 0.013091564178466797, 0.014158248901367188, 0.015224933624267578, 0.01629161834716797, 0.01735830307006836, 0.01842498779296875, 0.01949167251586914, 0.02055835723876953, 0.021625041961669922, 0.022691726684570312, 0.023758411407470703, 0.024825096130371094, 0.025891780853271484, 0.026958465576171875, 0.028025150299072266, 0.029091835021972656, 0.030158519744873047, 0.031225204467773438, 0.03229188919067383, 0.03335857391357422, 0.03442525863647461, 0.035491943359375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 8.0, 8.0, 9.0, 26.0, 30.0, 34.0, 43.0, 58.0, 76.0, 75.0, 87.0, 82.0, 89.0, 77.0, 68.0, 69.0, 43.0, 39.0, 13.0, 28.0, 14.0, 8.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.057098388671875, -0.05556678771972656, -0.054035186767578125, -0.05250358581542969, -0.05097198486328125, -0.04944038391113281, -0.047908782958984375, -0.04637718200683594, -0.0448455810546875, -0.04331398010253906, -0.041782379150390625, -0.04025077819824219, -0.03871917724609375, -0.03718757629394531, -0.035655975341796875, -0.03412437438964844, -0.0325927734375, -0.031061172485351562, -0.029529571533203125, -0.027997970581054688, -0.02646636962890625, -0.024934768676757812, -0.023403167724609375, -0.021871566772460938, -0.0203399658203125, -0.018808364868164062, -0.017276763916015625, -0.015745162963867188, -0.01421356201171875, -0.012681961059570312, -0.011150360107421875, -0.009618759155273438, -0.008087158203125, -0.0065555572509765625, -0.005023956298828125, -0.0034923553466796875, -0.00196075439453125, -0.0004291534423828125, 0.001102447509765625, 0.0026340484619140625, 0.0041656494140625, 0.0056972503662109375, 0.007228851318359375, 0.008760452270507812, 0.01029205322265625, 0.011823654174804688, 0.013355255126953125, 0.014886856079101562, 0.01641845703125, 0.017950057983398438, 0.019481658935546875, 0.021013259887695312, 0.02254486083984375, 0.024076461791992188, 0.025608062744140625, 0.027139663696289062, 0.0286712646484375, 0.030202865600585938, 0.031734466552734375, 0.03326606750488281, 0.03479766845703125, 0.03632926940917969, 0.037860870361328125, 0.03939247131347656, 0.040924072265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 5.0, 1.0, 7.0, 5.0, 10.0, 14.0, 10.0, 17.0, 18.0, 30.0, 31.0, 41.0, 60.0, 56.0, 107.0, 153.0, 261.0, 516.0, 1005.0, 2010.0, 4935.0, 13740.0, 45521.0, 185273.0, 495550.0, 220351.0, 52653.0, 15944.0, 5536.0, 2279.0, 1032.0, 483.0, 303.0, 173.0, 124.0, 70.0, 58.0, 47.0, 28.0, 20.0, 19.0, 13.0, 7.0, 7.0, 6.0, 5.0, 7.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03570556640625, -0.034455299377441406, -0.03320503234863281, -0.03195476531982422, -0.030704498291015625, -0.02945423126220703, -0.028203964233398438, -0.026953697204589844, -0.02570343017578125, -0.024453163146972656, -0.023202896118164062, -0.02195262908935547, -0.020702362060546875, -0.01945209503173828, -0.018201828002929688, -0.016951560974121094, -0.0157012939453125, -0.014451026916503906, -0.013200759887695312, -0.011950492858886719, -0.010700225830078125, -0.009449958801269531, -0.008199691772460938, -0.006949424743652344, -0.00569915771484375, -0.004448890686035156, -0.0031986236572265625, -0.0019483566284179688, -0.000698089599609375, 0.0005521774291992188, 0.0018024444580078125, 0.0030527114868164062, 0.004302978515625, 0.005553245544433594, 0.0068035125732421875, 0.008053779602050781, 0.009304046630859375, 0.010554313659667969, 0.011804580688476562, 0.013054847717285156, 0.01430511474609375, 0.015555381774902344, 0.016805648803710938, 0.01805591583251953, 0.019306182861328125, 0.02055644989013672, 0.021806716918945312, 0.023056983947753906, 0.0243072509765625, 0.025557518005371094, 0.026807785034179688, 0.02805805206298828, 0.029308319091796875, 0.03055858612060547, 0.03180885314941406, 0.033059120178222656, 0.03430938720703125, 0.035559654235839844, 0.03680992126464844, 0.03806018829345703, 0.039310455322265625, 0.04056072235107422, 0.04181098937988281, 0.043061256408691406, 0.0443115234375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 4.0, 2.0, 7.0, 7.0, 10.0, 14.0, 13.0, 8.0, 15.0, 19.0, 23.0, 24.0, 30.0, 19.0, 31.0, 29.0, 32.0, 42.0, 38.0, 36.0, 37.0, 46.0, 30.0, 35.0, 41.0, 35.0, 26.0, 40.0, 23.0, 25.0, 31.0, 26.0, 20.0, 19.0, 19.0, 24.0, 15.0, 12.0, 19.0, 9.0, 13.0, 10.0, 11.0, 6.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.059417724609375, -0.05767536163330078, -0.05593299865722656, -0.054190635681152344, -0.052448272705078125, -0.050705909729003906, -0.04896354675292969, -0.04722118377685547, -0.04547882080078125, -0.04373645782470703, -0.04199409484863281, -0.040251731872558594, -0.038509368896484375, -0.036767005920410156, -0.03502464294433594, -0.03328227996826172, -0.0315399169921875, -0.02979755401611328, -0.028055191040039062, -0.026312828063964844, -0.024570465087890625, -0.022828102111816406, -0.021085739135742188, -0.01934337615966797, -0.01760101318359375, -0.01585865020751953, -0.014116287231445312, -0.012373924255371094, -0.010631561279296875, -0.008889198303222656, -0.0071468353271484375, -0.005404472351074219, -0.003662109375, -0.0019197463989257812, -0.0001773834228515625, 0.0015649795532226562, 0.003307342529296875, 0.005049705505371094, 0.0067920684814453125, 0.008534431457519531, 0.01027679443359375, 0.012019157409667969, 0.013761520385742188, 0.015503883361816406, 0.017246246337890625, 0.018988609313964844, 0.020730972290039062, 0.02247333526611328, 0.0242156982421875, 0.02595806121826172, 0.027700424194335938, 0.029442787170410156, 0.031185150146484375, 0.032927513122558594, 0.03466987609863281, 0.03641223907470703, 0.03815460205078125, 0.03989696502685547, 0.04163932800292969, 0.043381690979003906, 0.045124053955078125, 0.046866416931152344, 0.04860877990722656, 0.05035114288330078, 0.052093505859375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 6.0, 6.0, 10.0, 12.0, 16.0, 33.0, 39.0, 77.0, 105.0, 178.0, 332.0, 545.0, 950.0, 1813.0, 3490.0, 7010.0, 14243.0, 29800.0, 64136.0, 137515.0, 245042.0, 255004.0, 152120.0, 70852.0, 33294.0, 15690.0, 7734.0, 3907.0, 2023.0, 1099.0, 611.0, 330.0, 187.0, 134.0, 83.0, 44.0, 25.0, 19.0, 14.0, 10.0, 7.0, 7.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0046539306640625, -0.004493832588195801, -0.0043337345123291016, -0.004173636436462402, -0.004013538360595703, -0.003853440284729004, -0.0036933422088623047, -0.0035332441329956055, -0.0033731460571289062, -0.003213047981262207, -0.003052949905395508, -0.0028928518295288086, -0.0027327537536621094, -0.00257265567779541, -0.002412557601928711, -0.0022524595260620117, -0.0020923614501953125, -0.0019322633743286133, -0.001772165298461914, -0.0016120672225952148, -0.0014519691467285156, -0.0012918710708618164, -0.0011317729949951172, -0.000971674919128418, -0.0008115768432617188, -0.0006514787673950195, -0.0004913806915283203, -0.0003312826156616211, -0.00017118453979492188, -1.1086463928222656e-05, 0.00014901161193847656, 0.0003091096878051758, 0.000469207763671875, 0.0006293058395385742, 0.0007894039154052734, 0.0009495019912719727, 0.0011096000671386719, 0.001269698143005371, 0.0014297962188720703, 0.0015898942947387695, 0.0017499923706054688, 0.001910090446472168, 0.002070188522338867, 0.0022302865982055664, 0.0023903846740722656, 0.002550482749938965, 0.002710580825805664, 0.0028706789016723633, 0.0030307769775390625, 0.0031908750534057617, 0.003350973129272461, 0.00351107120513916, 0.0036711692810058594, 0.0038312673568725586, 0.003991365432739258, 0.004151463508605957, 0.004311561584472656, 0.0044716596603393555, 0.004631757736206055, 0.004791855812072754, 0.004951953887939453, 0.005112051963806152, 0.0052721500396728516, 0.005432248115539551, 0.00559234619140625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 4.0, 8.0, 3.0, 9.0, 7.0, 18.0, 14.0, 13.0, 11.0, 11.0, 46.0, 32.0, 33.0, 33.0, 28.0, 84.0, 46.0, 58.0, 38.0, 37.0, 86.0, 31.0, 41.0, 41.0, 36.0, 65.0, 17.0, 27.0, 13.0, 19.0, 32.0, 9.0, 6.0, 13.0, 6.0, 10.0, 3.0, 3.0, 3.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.384185791015625e-06, -2.312473952770233e-06, -2.2407621145248413e-06, -2.1690502762794495e-06, -2.0973384380340576e-06, -2.0256265997886658e-06, -1.953914761543274e-06, -1.882202923297882e-06, -1.8104910850524902e-06, -1.7387792468070984e-06, -1.6670674085617065e-06, -1.5953555703163147e-06, -1.5236437320709229e-06, -1.451931893825531e-06, -1.3802200555801392e-06, -1.3085082173347473e-06, -1.2367963790893555e-06, -1.1650845408439636e-06, -1.0933727025985718e-06, -1.02166086435318e-06, -9.499490261077881e-07, -8.782371878623962e-07, -8.065253496170044e-07, -7.348135113716125e-07, -6.631016731262207e-07, -5.913898348808289e-07, -5.19677996635437e-07, -4.4796615839004517e-07, -3.762543201446533e-07, -3.045424818992615e-07, -2.3283064365386963e-07, -1.6111880540847778e-07, -8.940696716308594e-08, -1.7695128917694092e-08, 5.4016709327697754e-08, 1.257285475730896e-07, 1.9744038581848145e-07, 2.691522240638733e-07, 3.4086406230926514e-07, 4.12575900554657e-07, 4.842877388000488e-07, 5.559995770454407e-07, 6.277114152908325e-07, 6.994232535362244e-07, 7.711350917816162e-07, 8.428469300270081e-07, 9.145587682723999e-07, 9.862706065177917e-07, 1.0579824447631836e-06, 1.1296942830085754e-06, 1.2014061212539673e-06, 1.2731179594993591e-06, 1.344829797744751e-06, 1.4165416359901428e-06, 1.4882534742355347e-06, 1.5599653124809265e-06, 1.6316771507263184e-06, 1.7033889889717102e-06, 1.775100827217102e-06, 1.846812665462494e-06, 1.9185245037078857e-06, 1.9902363419532776e-06, 2.0619481801986694e-06, 2.1336600184440613e-06, 2.205371856689453e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 8.0, 8.0, 11.0, 15.0, 16.0, 28.0, 41.0, 57.0, 89.0, 150.0, 254.0, 456.0, 813.0, 1444.0, 3021.0, 6410.0, 14081.0, 32841.0, 79395.0, 181710.0, 292549.0, 236580.0, 114118.0, 47265.0, 19853.0, 8861.0, 4071.0, 1955.0, 1026.0, 527.0, 368.0, 202.0, 123.0, 71.0, 52.0, 29.0, 19.0, 12.0, 12.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.005405426025390625, -0.005217134952545166, -0.005028843879699707, -0.004840552806854248, -0.004652261734008789, -0.00446397066116333, -0.004275679588317871, -0.004087388515472412, -0.003899097442626953, -0.003710806369781494, -0.003522515296936035, -0.003334224224090576, -0.003145933151245117, -0.002957642078399658, -0.0027693510055541992, -0.0025810599327087402, -0.0023927688598632812, -0.0022044777870178223, -0.0020161867141723633, -0.0018278956413269043, -0.0016396045684814453, -0.0014513134956359863, -0.0012630224227905273, -0.0010747313499450684, -0.0008864402770996094, -0.0006981492042541504, -0.0005098581314086914, -0.0003215670585632324, -0.00013327598571777344, 5.501508712768555e-05, 0.00024330615997314453, 0.0004315972328186035, 0.0006198883056640625, 0.0008081793785095215, 0.0009964704513549805, 0.0011847615242004395, 0.0013730525970458984, 0.0015613436698913574, 0.0017496347427368164, 0.0019379258155822754, 0.0021262168884277344, 0.0023145079612731934, 0.0025027990341186523, 0.0026910901069641113, 0.0028793811798095703, 0.0030676722526550293, 0.0032559633255004883, 0.0034442543983459473, 0.0036325454711914062, 0.0038208365440368652, 0.004009127616882324, 0.004197418689727783, 0.004385709762573242, 0.004574000835418701, 0.00476229190826416, 0.004950582981109619, 0.005138874053955078, 0.005327165126800537, 0.005515456199645996, 0.005703747272491455, 0.005892038345336914, 0.006080329418182373, 0.006268620491027832, 0.006456911563873291, 0.00664520263671875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 9.0, 6.0, 7.0, 11.0, 19.0, 13.0, 21.0, 24.0, 35.0, 36.0, 38.0, 68.0, 80.0, 84.0, 77.0, 67.0, 77.0, 62.0, 55.0, 47.0, 30.0, 28.0, 27.0, 17.0, 14.0, 4.0, 4.0, 8.0, 6.0, 8.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01004791259765625, -0.009718537330627441, -0.009389162063598633, -0.009059786796569824, -0.008730411529541016, -0.008401036262512207, -0.008071660995483398, -0.00774228572845459, -0.007412910461425781, -0.007083535194396973, -0.006754159927368164, -0.0064247846603393555, -0.006095409393310547, -0.005766034126281738, -0.00543665885925293, -0.005107283592224121, -0.0047779083251953125, -0.004448533058166504, -0.004119157791137695, -0.0037897825241088867, -0.003460407257080078, -0.0031310319900512695, -0.002801656723022461, -0.0024722814559936523, -0.0021429061889648438, -0.0018135309219360352, -0.0014841556549072266, -0.001154780387878418, -0.0008254051208496094, -0.0004960298538208008, -0.0001666545867919922, 0.0001627206802368164, 0.000492095947265625, 0.0008214712142944336, 0.0011508464813232422, 0.0014802217483520508, 0.0018095970153808594, 0.002138972282409668, 0.0024683475494384766, 0.002797722816467285, 0.0031270980834960938, 0.0034564733505249023, 0.003785848617553711, 0.0041152238845825195, 0.004444599151611328, 0.004773974418640137, 0.005103349685668945, 0.005432724952697754, 0.0057621002197265625, 0.006091475486755371, 0.00642085075378418, 0.006750226020812988, 0.007079601287841797, 0.0074089765548706055, 0.007738351821899414, 0.008067727088928223, 0.008397102355957031, 0.00872647762298584, 0.009055852890014648, 0.009385228157043457, 0.009714603424072266, 0.010043978691101074, 0.010373353958129883, 0.010702729225158691, 0.0110321044921875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 13.0, 108.0, 572.0, 273.0, 33.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0797185897827148, -1.0588350296020508, -1.0379514694213867, -1.017067790031433, -0.996184229850769, -0.975300669670105, -0.9544170498847961, -0.9335334300994873, -0.9126498699188232, -0.8917663097381592, -0.8708826899528503, -0.8499990701675415, -0.8291155099868774, -0.8082319498062134, -0.7873483300209045, -0.7664647102355957, -0.7455811500549316, -0.7246975898742676, -0.7038139700889587, -0.6829303503036499, -0.6620467901229858, -0.6411632299423218, -0.6202796101570129, -0.5993959903717041, -0.57851243019104, -0.557628870010376, -0.5367452502250671, -0.5158616304397583, -0.49497807025909424, -0.4740944802761078, -0.45321089029312134, -0.4323273003101349, -0.4114437401294708, -0.3905601501464844, -0.3696765601634979, -0.3487929701805115, -0.327909380197525, -0.3070257902145386, -0.2861422002315521, -0.2652586102485657, -0.24437502026557922, -0.22349143028259277, -0.20260784029960632, -0.18172425031661987, -0.16084066033363342, -0.13995707035064697, -0.11907348036766052, -0.09818989038467407, -0.07730630040168762, -0.05642271041870117, -0.03553912043571472, -0.014655530452728271, 0.006228059530258179, 0.02711164951324463, 0.04799523949623108, 0.06887882947921753, 0.08976241946220398, 0.11064600944519043, 0.13152959942817688, 0.15241318941116333, 0.17329677939414978, 0.19418036937713623, 0.21506395936012268, 0.23594754934310913, 0.2568311393260956]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 9.0, 8.0, 8.0, 6.0, 8.0, 15.0, 8.0, 15.0, 18.0, 12.0, 34.0, 22.0, 32.0, 30.0, 30.0, 45.0, 42.0, 26.0, 35.0, 48.0, 35.0, 45.0, 41.0, 47.0, 33.0, 43.0, 37.0, 29.0, 22.0, 32.0, 26.0, 27.0, 13.0, 19.0, 20.0, 17.0, 16.0, 12.0, 7.0, 9.0, 8.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.16096943616867065, -0.15602640807628632, -0.15108337998390198, -0.14614035189151764, -0.1411973237991333, -0.13625429570674896, -0.13131126761436462, -0.1263682246208191, -0.12142520397901535, -0.11648217588663101, -0.11153914779424667, -0.10659611970186234, -0.1016530841588974, -0.09671005606651306, -0.09176702797412872, -0.08682399988174438, -0.08188097178936005, -0.07693794369697571, -0.07199491560459137, -0.06705188751220703, -0.062108855694532394, -0.057165827602148056, -0.05222279578447342, -0.04727976769208908, -0.04233673959970474, -0.037393711507320404, -0.032450683414936066, -0.02750765159726143, -0.02256462350487709, -0.017621595412492752, -0.012678565457463264, -0.007735535502433777, -0.0027925074100494385, 0.0021505216136574745, 0.0070935506373643875, 0.0120365796610713, 0.016979608684778214, 0.021922636777162552, 0.02686566673219204, 0.03180869668722153, 0.036751724779605865, 0.041694752871990204, 0.04663778096437454, 0.05158081278204918, 0.05652384087443352, 0.061466868966817856, 0.06640990078449249, 0.07135292887687683, 0.07629595696926117, 0.08123898506164551, 0.08618201315402985, 0.09112504124641418, 0.09606806933879852, 0.10101109743118286, 0.1059541329741478, 0.11089716106653214, 0.11584018915891647, 0.12078321725130081, 0.12572625279426575, 0.13066928088665009, 0.13561230897903442, 0.14055533707141876, 0.1454983651638031, 0.15044139325618744, 0.15538442134857178]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 11.0, 17.0, 32.0, 48.0, 102.0, 155.0, 546.0, 3545.0, 30313.0, 1595354.0, 2494719.0, 61292.0, 6401.0, 1295.0, 176.0, 110.0, 67.0, 33.0, 22.0, 9.0, 6.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06982421875, -0.06764793395996094, -0.06547164916992188, -0.06329536437988281, -0.06111907958984375, -0.05894279479980469, -0.056766510009765625, -0.05459022521972656, -0.0524139404296875, -0.05023765563964844, -0.048061370849609375, -0.04588508605957031, -0.04370880126953125, -0.04153251647949219, -0.039356231689453125, -0.03717994689941406, -0.035003662109375, -0.03282737731933594, -0.030651092529296875, -0.028474807739257812, -0.02629852294921875, -0.024122238159179688, -0.021945953369140625, -0.019769668579101562, -0.0175933837890625, -0.015417098999023438, -0.013240814208984375, -0.011064529418945312, -0.00888824462890625, -0.0067119598388671875, -0.004535675048828125, -0.0023593902587890625, -0.00018310546875, 0.0019931793212890625, 0.004169464111328125, 0.0063457489013671875, 0.00852203369140625, 0.010698318481445312, 0.012874603271484375, 0.015050888061523438, 0.0172271728515625, 0.019403457641601562, 0.021579742431640625, 0.023756027221679688, 0.02593231201171875, 0.028108596801757812, 0.030284881591796875, 0.03246116638183594, 0.034637451171875, 0.03681373596191406, 0.038990020751953125, 0.04116630554199219, 0.04334259033203125, 0.04551887512207031, 0.047695159912109375, 0.04987144470214844, 0.0520477294921875, 0.05422401428222656, 0.056400299072265625, 0.05857658386230469, 0.06075286865234375, 0.06292915344238281, 0.06510543823242188, 0.06728172302246094, 0.0694580078125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 10.0, 13.0, 14.0, 25.0, 32.0, 52.0, 61.0, 70.0, 91.0, 92.0, 75.0, 100.0, 82.0, 78.0, 55.0, 40.0, 36.0, 24.0, 17.0, 14.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.060821533203125, -0.059103965759277344, -0.05738639831542969, -0.05566883087158203, -0.053951263427734375, -0.05223369598388672, -0.05051612854003906, -0.048798561096191406, -0.04708099365234375, -0.045363426208496094, -0.04364585876464844, -0.04192829132080078, -0.040210723876953125, -0.03849315643310547, -0.03677558898925781, -0.035058021545410156, -0.0333404541015625, -0.031622886657714844, -0.029905319213867188, -0.02818775177001953, -0.026470184326171875, -0.02475261688232422, -0.023035049438476562, -0.021317481994628906, -0.01959991455078125, -0.017882347106933594, -0.016164779663085938, -0.014447212219238281, -0.012729644775390625, -0.011012077331542969, -0.009294509887695312, -0.007576942443847656, -0.005859375, -0.004141807556152344, -0.0024242401123046875, -0.0007066726684570312, 0.001010894775390625, 0.0027284622192382812, 0.0044460296630859375, 0.006163597106933594, 0.00788116455078125, 0.009598731994628906, 0.011316299438476562, 0.013033866882324219, 0.014751434326171875, 0.01646900177001953, 0.018186569213867188, 0.019904136657714844, 0.0216217041015625, 0.023339271545410156, 0.025056838989257812, 0.02677440643310547, 0.028491973876953125, 0.03020954132080078, 0.03192710876464844, 0.033644676208496094, 0.03536224365234375, 0.037079811096191406, 0.03879737854003906, 0.04051494598388672, 0.042232513427734375, 0.04395008087158203, 0.04566764831542969, 0.047385215759277344, 0.049102783203125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 6.0, 8.0, 8.0, 16.0, 17.0, 29.0, 30.0, 43.0, 69.0, 109.0, 171.0, 280.0, 501.0, 981.0, 2188.0, 6711.0, 31021.0, 254010.0, 2883802.0, 922460.0, 72390.0, 12934.0, 3553.0, 1319.0, 656.0, 361.0, 222.0, 127.0, 88.0, 46.0, 44.0, 30.0, 13.0, 9.0, 11.0, 7.0, 3.0, 6.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0310211181640625, -0.029902219772338867, -0.028783321380615234, -0.0276644229888916, -0.02654552459716797, -0.025426626205444336, -0.024307727813720703, -0.02318882942199707, -0.022069931030273438, -0.020951032638549805, -0.019832134246826172, -0.01871323585510254, -0.017594337463378906, -0.016475439071655273, -0.01535654067993164, -0.014237642288208008, -0.013118743896484375, -0.011999845504760742, -0.01088094711303711, -0.009762048721313477, -0.008643150329589844, -0.007524251937866211, -0.006405353546142578, -0.005286455154418945, -0.0041675567626953125, -0.0030486583709716797, -0.0019297599792480469, -0.0008108615875244141, 0.00030803680419921875, 0.0014269351959228516, 0.0025458335876464844, 0.003664731979370117, 0.00478363037109375, 0.005902528762817383, 0.007021427154541016, 0.008140325546264648, 0.009259223937988281, 0.010378122329711914, 0.011497020721435547, 0.01261591911315918, 0.013734817504882812, 0.014853715896606445, 0.015972614288330078, 0.01709151268005371, 0.018210411071777344, 0.019329309463500977, 0.02044820785522461, 0.021567106246948242, 0.022686004638671875, 0.023804903030395508, 0.02492380142211914, 0.026042699813842773, 0.027161598205566406, 0.02828049659729004, 0.029399394989013672, 0.030518293380737305, 0.03163719177246094, 0.03275609016418457, 0.0338749885559082, 0.034993886947631836, 0.03611278533935547, 0.0372316837310791, 0.038350582122802734, 0.03946948051452637, 0.04058837890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 9.0, 21.0, 27.0, 66.0, 190.0, 526.0, 1076.0, 1149.0, 596.0, 232.0, 79.0, 47.0, 20.0, 18.0, 8.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0692138671875, -0.0673980712890625, -0.065582275390625, -0.0637664794921875, -0.06195068359375, -0.0601348876953125, -0.058319091796875, -0.0565032958984375, -0.0546875, -0.0528717041015625, -0.051055908203125, -0.0492401123046875, -0.04742431640625, -0.0456085205078125, -0.043792724609375, -0.0419769287109375, -0.0401611328125, -0.0383453369140625, -0.036529541015625, -0.0347137451171875, -0.03289794921875, -0.0310821533203125, -0.029266357421875, -0.0274505615234375, -0.025634765625, -0.0238189697265625, -0.022003173828125, -0.0201873779296875, -0.01837158203125, -0.0165557861328125, -0.014739990234375, -0.0129241943359375, -0.0111083984375, -0.0092926025390625, -0.007476806640625, -0.0056610107421875, -0.00384521484375, -0.0020294189453125, -0.000213623046875, 0.0016021728515625, 0.00341796875, 0.0052337646484375, 0.007049560546875, 0.0088653564453125, 0.01068115234375, 0.0124969482421875, 0.014312744140625, 0.0161285400390625, 0.0179443359375, 0.0197601318359375, 0.021575927734375, 0.0233917236328125, 0.02520751953125, 0.0270233154296875, 0.028839111328125, 0.0306549072265625, 0.032470703125, 0.0342864990234375, 0.036102294921875, 0.0379180908203125, 0.03973388671875, 0.0415496826171875, 0.043365478515625, 0.0451812744140625, 0.0469970703125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 13.0, 52.0, 120.0, 245.0, 275.0, 192.0, 69.0, 27.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3421699106693268, -0.33349835872650146, -0.32482677698135376, -0.31615522503852844, -0.3074836730957031, -0.2988120913505554, -0.2901405394077301, -0.2814689576625824, -0.2727974057197571, -0.26412585377693176, -0.25545427203178406, -0.24678272008895874, -0.23811115324497223, -0.22943958640098572, -0.2207680344581604, -0.2120964676141739, -0.20342490077018738, -0.19475333392620087, -0.18608176708221436, -0.17741021513938904, -0.16873864829540253, -0.16006708145141602, -0.1513955295085907, -0.1427239626646042, -0.13405239582061768, -0.12538082897663116, -0.11670926958322525, -0.10803771018981934, -0.09936614334583282, -0.09069457650184631, -0.0820230171084404, -0.07335145771503448, -0.06467992067337036, -0.05600835755467415, -0.047336794435977936, -0.03866523131728172, -0.02999366819858551, -0.021322105079889297, -0.012650541961193085, -0.003978978842496872, 0.004692584276199341, 0.013364147394895554, 0.022035710513591766, 0.03070727363228798, 0.03937883675098419, 0.048050399869680405, 0.05672196298837662, 0.06539352238178253, 0.07406508922576904, 0.08273665606975555, 0.09140821546316147, 0.10007977485656738, 0.1087513417005539, 0.1174229085445404, 0.12609446048736572, 0.13476602733135223, 0.14343759417533875, 0.15210916101932526, 0.16078072786331177, 0.16945227980613708, 0.1781238466501236, 0.1867954134941101, 0.19546696543693542, 0.20413853228092194, 0.21281009912490845]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 6.0, 8.0, 8.0, 9.0, 12.0, 15.0, 17.0, 18.0, 27.0, 38.0, 33.0, 43.0, 24.0, 35.0, 46.0, 42.0, 33.0, 52.0, 56.0, 42.0, 56.0, 39.0, 48.0, 31.0, 35.0, 28.0, 29.0, 22.0, 22.0, 14.0, 16.0, 16.0, 18.0, 11.0, 15.0, 7.0, 2.0, 4.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07063698768615723, -0.06799672544002533, -0.06535646319389343, -0.06271620094776154, -0.06007594242691994, -0.05743568018078804, -0.05479542165994644, -0.052155159413814545, -0.04951489716768265, -0.04687463492155075, -0.044234372675418854, -0.041594114154577255, -0.03895385190844536, -0.03631358966231346, -0.03367333114147186, -0.031033068895339966, -0.02839280664920807, -0.025752544403076172, -0.023112284019589424, -0.020472023636102676, -0.01783176138997078, -0.015191500075161457, -0.012551238760352135, -0.009910978376865387, -0.00727071613073349, -0.004630454815924168, -0.0019901935011148453, 0.0006500678136944771, 0.0032903291285037994, 0.005930590443313122, 0.008570851758122444, 0.011211112141609192, 0.013851374387741089, 0.016491636633872986, 0.019131897017359734, 0.02177215740084648, 0.02441241964697838, 0.027052681893110275, 0.029692942276597023, 0.03233320266008377, 0.03497346490621567, 0.037613727152347565, 0.04025398939847946, 0.04289424791932106, 0.04553451016545296, 0.048174772411584854, 0.05081503093242645, 0.05345529317855835, 0.05609555542469025, 0.058735817670822144, 0.06137607991695404, 0.06401634216308594, 0.06665660440921783, 0.06929685920476913, 0.07193712145090103, 0.07457738369703293, 0.07721764594316483, 0.07985790818929672, 0.08249817043542862, 0.08513843268156052, 0.08777868747711182, 0.09041894972324371, 0.09305921196937561, 0.09569947421550751, 0.0983397364616394]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 7.0, 3.0, 11.0, 10.0, 30.0, 34.0, 42.0, 62.0, 106.0, 159.0, 231.0, 370.0, 630.0, 1217.0, 2667.0, 7075.0, 25186.0, 113110.0, 447025.0, 346550.0, 76002.0, 17751.0, 5521.0, 2173.0, 1041.0, 554.0, 350.0, 214.0, 132.0, 80.0, 55.0, 44.0, 31.0, 21.0, 13.0, 11.0, 5.0, 4.0, 8.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.049591064453125, -0.04820871353149414, -0.04682636260986328, -0.04544401168823242, -0.04406166076660156, -0.0426793098449707, -0.041296958923339844, -0.039914608001708984, -0.038532257080078125, -0.037149906158447266, -0.035767555236816406, -0.03438520431518555, -0.03300285339355469, -0.03162050247192383, -0.03023815155029297, -0.02885580062866211, -0.02747344970703125, -0.02609109878540039, -0.02470874786376953, -0.023326396942138672, -0.021944046020507812, -0.020561695098876953, -0.019179344177246094, -0.017796993255615234, -0.016414642333984375, -0.015032291412353516, -0.013649940490722656, -0.012267589569091797, -0.010885238647460938, -0.009502887725830078, -0.008120536804199219, -0.006738185882568359, -0.0053558349609375, -0.003973484039306641, -0.0025911331176757812, -0.0012087821960449219, 0.0001735687255859375, 0.0015559196472167969, 0.0029382705688476562, 0.004320621490478516, 0.005702972412109375, 0.007085323333740234, 0.008467674255371094, 0.009850025177001953, 0.011232376098632812, 0.012614727020263672, 0.013997077941894531, 0.01537942886352539, 0.01676177978515625, 0.01814413070678711, 0.01952648162841797, 0.020908832550048828, 0.022291183471679688, 0.023673534393310547, 0.025055885314941406, 0.026438236236572266, 0.027820587158203125, 0.029202938079833984, 0.030585289001464844, 0.0319676399230957, 0.03334999084472656, 0.03473234176635742, 0.03611469268798828, 0.03749704360961914, 0.03887939453125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 14.0, 26.0, 31.0, 50.0, 53.0, 70.0, 81.0, 87.0, 105.0, 105.0, 70.0, 75.0, 71.0, 45.0, 29.0, 32.0, 19.0, 7.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0709228515625, -0.06921529769897461, -0.06750774383544922, -0.06580018997192383, -0.06409263610839844, -0.06238508224487305, -0.060677528381347656, -0.058969974517822266, -0.057262420654296875, -0.055554866790771484, -0.053847312927246094, -0.0521397590637207, -0.05043220520019531, -0.04872465133666992, -0.04701709747314453, -0.04530954360961914, -0.04360198974609375, -0.04189443588256836, -0.04018688201904297, -0.03847932815551758, -0.03677177429199219, -0.0350642204284668, -0.033356666564941406, -0.031649112701416016, -0.029941558837890625, -0.028234004974365234, -0.026526451110839844, -0.024818897247314453, -0.023111343383789062, -0.021403789520263672, -0.01969623565673828, -0.01798868179321289, -0.0162811279296875, -0.01457357406616211, -0.012866020202636719, -0.011158466339111328, -0.009450912475585938, -0.007743358612060547, -0.006035804748535156, -0.004328250885009766, -0.002620697021484375, -0.0009131431579589844, 0.0007944107055664062, 0.002501964569091797, 0.0042095184326171875, 0.005917072296142578, 0.007624626159667969, 0.00933218002319336, 0.01103973388671875, 0.01274728775024414, 0.014454841613769531, 0.016162395477294922, 0.017869949340820312, 0.019577503204345703, 0.021285057067871094, 0.022992610931396484, 0.024700164794921875, 0.026407718658447266, 0.028115272521972656, 0.029822826385498047, 0.03153038024902344, 0.03323793411254883, 0.03494548797607422, 0.03665304183959961, 0.038360595703125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 8.0, 2.0, 8.0, 12.0, 14.0, 18.0, 28.0, 22.0, 26.0, 48.0, 82.0, 109.0, 205.0, 367.0, 960.0, 3119.0, 13275.0, 72982.0, 468456.0, 411637.0, 61162.0, 11550.0, 2637.0, 938.0, 363.0, 175.0, 107.0, 64.0, 56.0, 30.0, 18.0, 18.0, 15.0, 9.0, 11.0, 8.0, 8.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.052703857421875, -0.05094432830810547, -0.04918479919433594, -0.047425270080566406, -0.045665740966796875, -0.043906211853027344, -0.04214668273925781, -0.04038715362548828, -0.03862762451171875, -0.03686809539794922, -0.03510856628417969, -0.033349037170410156, -0.031589508056640625, -0.029829978942871094, -0.028070449829101562, -0.02631092071533203, -0.0245513916015625, -0.02279186248779297, -0.021032333374023438, -0.019272804260253906, -0.017513275146484375, -0.015753746032714844, -0.013994216918945312, -0.012234687805175781, -0.01047515869140625, -0.008715629577636719, -0.0069561004638671875, -0.005196571350097656, -0.003437042236328125, -0.0016775131225585938, 8.20159912109375e-05, 0.0018415451049804688, 0.00360107421875, 0.005360603332519531, 0.0071201324462890625, 0.008879661560058594, 0.010639190673828125, 0.012398719787597656, 0.014158248901367188, 0.01591777801513672, 0.01767730712890625, 0.01943683624267578, 0.021196365356445312, 0.022955894470214844, 0.024715423583984375, 0.026474952697753906, 0.028234481811523438, 0.02999401092529297, 0.0317535400390625, 0.03351306915283203, 0.03527259826660156, 0.037032127380371094, 0.038791656494140625, 0.040551185607910156, 0.04231071472167969, 0.04407024383544922, 0.04582977294921875, 0.04758930206298828, 0.04934883117675781, 0.051108360290527344, 0.052867889404296875, 0.054627418518066406, 0.05638694763183594, 0.05814647674560547, 0.059906005859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 9.0, 8.0, 13.0, 13.0, 9.0, 14.0, 21.0, 21.0, 25.0, 26.0, 31.0, 15.0, 26.0, 45.0, 43.0, 54.0, 51.0, 42.0, 57.0, 55.0, 38.0, 35.0, 35.0, 38.0, 34.0, 35.0, 33.0, 19.0, 25.0, 20.0, 18.0, 15.0, 20.0, 9.0, 15.0, 4.0, 6.0, 6.0, 5.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06475830078125, -0.06279993057250977, -0.06084156036376953, -0.0588831901550293, -0.05692481994628906, -0.05496644973754883, -0.053008079528808594, -0.05104970932006836, -0.049091339111328125, -0.04713296890258789, -0.045174598693847656, -0.04321622848510742, -0.04125785827636719, -0.03929948806762695, -0.03734111785888672, -0.035382747650146484, -0.03342437744140625, -0.031466007232666016, -0.02950763702392578, -0.027549266815185547, -0.025590896606445312, -0.023632526397705078, -0.021674156188964844, -0.01971578598022461, -0.017757415771484375, -0.01579904556274414, -0.013840675354003906, -0.011882305145263672, -0.009923934936523438, -0.007965564727783203, -0.006007194519042969, -0.004048824310302734, -0.0020904541015625, -0.00013208389282226562, 0.0018262863159179688, 0.003784656524658203, 0.0057430267333984375, 0.007701396942138672, 0.009659767150878906, 0.01161813735961914, 0.013576507568359375, 0.01553487777709961, 0.017493247985839844, 0.019451618194580078, 0.021409988403320312, 0.023368358612060547, 0.02532672882080078, 0.027285099029541016, 0.02924346923828125, 0.031201839447021484, 0.03316020965576172, 0.03511857986450195, 0.03707695007324219, 0.03903532028198242, 0.040993690490722656, 0.04295206069946289, 0.044910430908203125, 0.04686880111694336, 0.048827171325683594, 0.05078554153442383, 0.05274391174316406, 0.0547022819519043, 0.05666065216064453, 0.058619022369384766, 0.060577392578125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 5.0, 5.0, 7.0, 10.0, 10.0, 21.0, 19.0, 34.0, 42.0, 72.0, 114.0, 158.0, 251.0, 412.0, 663.0, 1075.0, 2058.0, 3929.0, 7765.0, 17287.0, 39760.0, 95093.0, 207991.0, 291060.0, 210231.0, 96302.0, 40014.0, 17202.0, 8077.0, 3911.0, 2062.0, 1133.0, 674.0, 395.0, 223.0, 160.0, 82.0, 90.0, 44.0, 27.0, 26.0, 17.0, 16.0, 17.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005405426025390625, -0.005208909511566162, -0.005012392997741699, -0.004815876483917236, -0.0046193599700927734, -0.0044228434562683105, -0.004226326942443848, -0.004029810428619385, -0.003833293914794922, -0.003636777400970459, -0.003440260887145996, -0.003243744373321533, -0.0030472278594970703, -0.0028507113456726074, -0.0026541948318481445, -0.0024576783180236816, -0.0022611618041992188, -0.002064645290374756, -0.001868128776550293, -0.00167161226272583, -0.0014750957489013672, -0.0012785792350769043, -0.0010820627212524414, -0.0008855462074279785, -0.0006890296936035156, -0.0004925131797790527, -0.00029599666595458984, -9.948015213012695e-05, 9.703636169433594e-05, 0.00029355287551879883, 0.0004900693893432617, 0.0006865859031677246, 0.0008831024169921875, 0.0010796189308166504, 0.0012761354446411133, 0.0014726519584655762, 0.001669168472290039, 0.001865684986114502, 0.002062201499938965, 0.0022587180137634277, 0.0024552345275878906, 0.0026517510414123535, 0.0028482675552368164, 0.0030447840690612793, 0.003241300582885742, 0.003437817096710205, 0.003634333610534668, 0.003830850124359131, 0.004027366638183594, 0.004223883152008057, 0.0044203996658325195, 0.004616916179656982, 0.004813432693481445, 0.005009949207305908, 0.005206465721130371, 0.005402982234954834, 0.005599498748779297, 0.00579601526260376, 0.005992531776428223, 0.0061890482902526855, 0.0063855648040771484, 0.006582081317901611, 0.006778597831726074, 0.006975114345550537, 0.007171630859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 6.0, 5.0, 10.0, 6.0, 19.0, 11.0, 11.0, 7.0, 16.0, 18.0, 43.0, 16.0, 32.0, 35.0, 46.0, 41.0, 75.0, 39.0, 52.0, 34.0, 43.0, 81.0, 31.0, 31.0, 36.0, 38.0, 26.0, 50.0, 19.0, 18.0, 14.0, 16.0, 11.0, 25.0, 5.0, 7.0, 6.0, 4.0, 3.0, 7.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.2649765014648438e-06, -2.195127308368683e-06, -2.125278115272522e-06, -2.055428922176361e-06, -1.9855797290802e-06, -1.9157305359840393e-06, -1.8458813428878784e-06, -1.7760321497917175e-06, -1.7061829566955566e-06, -1.6363337635993958e-06, -1.5664845705032349e-06, -1.496635377407074e-06, -1.426786184310913e-06, -1.3569369912147522e-06, -1.2870877981185913e-06, -1.2172386050224304e-06, -1.1473894119262695e-06, -1.0775402188301086e-06, -1.0076910257339478e-06, -9.378418326377869e-07, -8.67992639541626e-07, -7.981434464454651e-07, -7.282942533493042e-07, -6.584450602531433e-07, -5.885958671569824e-07, -5.187466740608215e-07, -4.4889748096466064e-07, -3.7904828786849976e-07, -3.0919909477233887e-07, -2.39349901676178e-07, -1.695007085800171e-07, -9.96515154838562e-08, -2.9802322387695312e-08, 4.0046870708465576e-08, 1.0989606380462646e-07, 1.7974525690078735e-07, 2.4959444999694824e-07, 3.1944364309310913e-07, 3.8929283618927e-07, 4.591420292854309e-07, 5.289912223815918e-07, 5.988404154777527e-07, 6.686896085739136e-07, 7.385388016700745e-07, 8.083879947662354e-07, 8.782371878623962e-07, 9.480863809585571e-07, 1.017935574054718e-06, 1.087784767150879e-06, 1.1576339602470398e-06, 1.2274831533432007e-06, 1.2973323464393616e-06, 1.3671815395355225e-06, 1.4370307326316833e-06, 1.5068799257278442e-06, 1.5767291188240051e-06, 1.646578311920166e-06, 1.716427505016327e-06, 1.7862766981124878e-06, 1.8561258912086487e-06, 1.9259750843048096e-06, 1.9958242774009705e-06, 2.0656734704971313e-06, 2.1355226635932922e-06, 2.205371856689453e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 7.0, 3.0, 8.0, 8.0, 7.0, 21.0, 31.0, 37.0, 57.0, 110.0, 142.0, 223.0, 352.0, 691.0, 1429.0, 3797.0, 12582.0, 56245.0, 289384.0, 495633.0, 147145.0, 28518.0, 7288.0, 2547.0, 1019.0, 499.0, 251.0, 168.0, 127.0, 63.0, 46.0, 32.0, 31.0, 17.0, 10.0, 4.0, 6.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.01251983642578125, -0.012132048606872559, -0.011744260787963867, -0.011356472969055176, -0.010968685150146484, -0.010580897331237793, -0.010193109512329102, -0.00980532169342041, -0.009417533874511719, -0.009029746055603027, -0.008641958236694336, -0.008254170417785645, -0.007866382598876953, -0.007478594779968262, -0.00709080696105957, -0.006703019142150879, -0.0063152313232421875, -0.005927443504333496, -0.005539655685424805, -0.005151867866516113, -0.004764080047607422, -0.0043762922286987305, -0.003988504409790039, -0.0036007165908813477, -0.0032129287719726562, -0.002825140953063965, -0.0024373531341552734, -0.002049565315246582, -0.0016617774963378906, -0.0012739896774291992, -0.0008862018585205078, -0.0004984140396118164, -0.000110626220703125, 0.0002771615982055664, 0.0006649494171142578, 0.0010527372360229492, 0.0014405250549316406, 0.001828312873840332, 0.0022161006927490234, 0.002603888511657715, 0.0029916763305664062, 0.0033794641494750977, 0.003767251968383789, 0.0041550397872924805, 0.004542827606201172, 0.004930615425109863, 0.005318403244018555, 0.005706191062927246, 0.0060939788818359375, 0.006481766700744629, 0.00686955451965332, 0.007257342338562012, 0.007645130157470703, 0.008032917976379395, 0.008420705795288086, 0.008808493614196777, 0.009196281433105469, 0.00958406925201416, 0.009971857070922852, 0.010359644889831543, 0.010747432708740234, 0.011135220527648926, 0.011523008346557617, 0.011910796165466309, 0.012298583984375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 11.0, 8.0, 13.0, 20.0, 26.0, 45.0, 60.0, 64.0, 86.0, 116.0, 116.0, 105.0, 84.0, 53.0, 44.0, 39.0, 27.0, 24.0, 11.0, 13.0, 7.0, 5.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013580322265625, -0.013158679008483887, -0.012737035751342773, -0.01231539249420166, -0.011893749237060547, -0.011472105979919434, -0.01105046272277832, -0.010628819465637207, -0.010207176208496094, -0.00978553295135498, -0.009363889694213867, -0.008942246437072754, -0.00852060317993164, -0.008098959922790527, -0.007677316665649414, -0.007255673408508301, -0.0068340301513671875, -0.006412386894226074, -0.005990743637084961, -0.005569100379943848, -0.005147457122802734, -0.004725813865661621, -0.004304170608520508, -0.0038825273513793945, -0.0034608840942382812, -0.003039240837097168, -0.0026175975799560547, -0.0021959543228149414, -0.0017743110656738281, -0.0013526678085327148, -0.0009310245513916016, -0.0005093812942504883, -8.7738037109375e-05, 0.0003339052200317383, 0.0007555484771728516, 0.0011771917343139648, 0.0015988349914550781, 0.0020204782485961914, 0.0024421215057373047, 0.002863764762878418, 0.0032854080200195312, 0.0037070512771606445, 0.004128694534301758, 0.004550337791442871, 0.004971981048583984, 0.005393624305725098, 0.005815267562866211, 0.006236910820007324, 0.0066585540771484375, 0.007080197334289551, 0.007501840591430664, 0.007923483848571777, 0.00834512710571289, 0.008766770362854004, 0.009188413619995117, 0.00961005687713623, 0.010031700134277344, 0.010453343391418457, 0.01087498664855957, 0.011296629905700684, 0.011718273162841797, 0.01213991641998291, 0.012561559677124023, 0.012983202934265137, 0.01340484619140625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 7.0, 11.0, 31.0, 179.0, 390.0, 296.0, 65.0, 20.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.7190210223197937, -0.7056674957275391, -0.6923139691352844, -0.6789604425430298, -0.6656069159507751, -0.6522533893585205, -0.6388998627662659, -0.6255463361740112, -0.6121928095817566, -0.598839282989502, -0.5854857563972473, -0.5721322298049927, -0.558778703212738, -0.5454251766204834, -0.5320716500282288, -0.5187181234359741, -0.5053645968437195, -0.49201107025146484, -0.4786575436592102, -0.46530401706695557, -0.4519504904747009, -0.4385969638824463, -0.42524343729019165, -0.411889910697937, -0.39853635430336, -0.38518282771110535, -0.3718293011188507, -0.35847577452659607, -0.34512224793434143, -0.3317687213420868, -0.31841519474983215, -0.3050616681575775, -0.2917081117630005, -0.27835458517074585, -0.2650010585784912, -0.2516475319862366, -0.23829400539398193, -0.2249404788017273, -0.21158695220947266, -0.19823342561721802, -0.18487989902496338, -0.17152637243270874, -0.1581728458404541, -0.14481931924819946, -0.13146579265594482, -0.11811225861310959, -0.10475873202085495, -0.09140520542860031, -0.07805168628692627, -0.06469815969467163, -0.05134463310241699, -0.037991102784872055, -0.024637576192617416, -0.01128404587507248, 0.0020694807171821594, 0.015423007309436798, 0.028776533901691437, 0.042130060493946075, 0.055483587086200714, 0.06883712112903595, 0.08219064772129059, 0.09554417431354523, 0.10889770090579987, 0.1222512274980545, 0.13560475409030914]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 5.0, 7.0, 8.0, 10.0, 4.0, 12.0, 12.0, 15.0, 14.0, 15.0, 19.0, 19.0, 41.0, 24.0, 23.0, 38.0, 33.0, 22.0, 33.0, 35.0, 37.0, 44.0, 35.0, 44.0, 41.0, 41.0, 35.0, 28.0, 31.0, 31.0, 23.0, 25.0, 25.0, 29.0, 19.0, 26.0, 17.0, 11.0, 13.0, 8.0, 5.0, 8.0, 4.0, 7.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1282963752746582, -0.12428830564022064, -0.12028024345636368, -0.11627217382192612, -0.11226411163806915, -0.10825604200363159, -0.10424797236919403, -0.10023990273475647, -0.0962318405508995, -0.09222377091646194, -0.08821570873260498, -0.08420763909816742, -0.08019956946372986, -0.0761915072798729, -0.07218343764543533, -0.06817537546157837, -0.06416730582714081, -0.060159239917993546, -0.05615117400884628, -0.05214310437440872, -0.04813503846526146, -0.0441269725561142, -0.040118902921676636, -0.03611083701252937, -0.03210277110338211, -0.028094705194234848, -0.024086637422442436, -0.020078569650650024, -0.016070503741502762, -0.0120624378323555, -0.008054370060563087, -0.004046302288770676, -3.8236379623413086e-05, 0.003969830460846424, 0.007977897301316261, 0.011985964141786098, 0.015994030982255936, 0.020002096891403198, 0.02401016466319561, 0.028018232434988022, 0.032026298344135284, 0.03603436425328255, 0.04004243016242981, 0.04405049979686737, 0.04805856570601463, 0.052066631615161896, 0.05607470124959946, 0.06008276715874672, 0.06409083306789398, 0.06809890270233154, 0.07210696488618851, 0.07611503452062607, 0.08012309670448303, 0.0841311663389206, 0.08813923597335815, 0.09214730560779572, 0.09615536779165268, 0.10016343742609024, 0.1041714996099472, 0.10817956924438477, 0.11218763887882233, 0.11619570106267929, 0.12020377069711685, 0.12421183288097382, 0.12821990251541138]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 4.0, 7.0, 12.0, 12.0, 21.0, 31.0, 49.0, 96.0, 150.0, 322.0, 974.0, 4042.0, 16826.0, 179348.0, 2417110.0, 1476915.0, 79294.0, 12156.0, 4730.0, 1515.0, 345.0, 129.0, 67.0, 45.0, 26.0, 18.0, 11.0, 10.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048126220703125, -0.04656696319580078, -0.04500770568847656, -0.043448448181152344, -0.041889190673828125, -0.040329933166503906, -0.03877067565917969, -0.03721141815185547, -0.03565216064453125, -0.03409290313720703, -0.03253364562988281, -0.030974388122558594, -0.029415130615234375, -0.027855873107910156, -0.026296615600585938, -0.02473735809326172, -0.0231781005859375, -0.02161884307861328, -0.020059585571289062, -0.018500328063964844, -0.016941070556640625, -0.015381813049316406, -0.013822555541992188, -0.012263298034667969, -0.01070404052734375, -0.009144783020019531, -0.0075855255126953125, -0.006026268005371094, -0.004467010498046875, -0.0029077529907226562, -0.0013484954833984375, 0.00021076202392578125, 0.00177001953125, 0.0033292770385742188, 0.0048885345458984375, 0.006447792053222656, 0.008007049560546875, 0.009566307067871094, 0.011125564575195312, 0.012684822082519531, 0.01424407958984375, 0.01580333709716797, 0.017362594604492188, 0.018921852111816406, 0.020481109619140625, 0.022040367126464844, 0.023599624633789062, 0.02515888214111328, 0.0267181396484375, 0.02827739715576172, 0.029836654663085938, 0.031395912170410156, 0.032955169677734375, 0.034514427185058594, 0.03607368469238281, 0.03763294219970703, 0.03919219970703125, 0.04075145721435547, 0.04231071472167969, 0.043869972229003906, 0.045429229736328125, 0.046988487243652344, 0.04854774475097656, 0.05010700225830078, 0.051666259765625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 5.0, 11.0, 12.0, 23.0, 31.0, 52.0, 70.0, 64.0, 95.0, 92.0, 97.0, 88.0, 91.0, 73.0, 49.0, 46.0, 36.0, 28.0, 10.0, 11.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062164306640625, -0.06045961380004883, -0.058754920959472656, -0.057050228118896484, -0.05534553527832031, -0.05364084243774414, -0.05193614959716797, -0.0502314567565918, -0.048526763916015625, -0.04682207107543945, -0.04511737823486328, -0.04341268539428711, -0.04170799255371094, -0.040003299713134766, -0.038298606872558594, -0.03659391403198242, -0.03488922119140625, -0.03318452835083008, -0.031479835510253906, -0.029775142669677734, -0.028070449829101562, -0.02636575698852539, -0.02466106414794922, -0.022956371307373047, -0.021251678466796875, -0.019546985626220703, -0.01784229278564453, -0.01613759994506836, -0.014432907104492188, -0.012728214263916016, -0.011023521423339844, -0.009318828582763672, -0.0076141357421875, -0.005909442901611328, -0.004204750061035156, -0.0025000572204589844, -0.0007953643798828125, 0.0009093284606933594, 0.0026140213012695312, 0.004318714141845703, 0.006023406982421875, 0.007728099822998047, 0.009432792663574219, 0.01113748550415039, 0.012842178344726562, 0.014546871185302734, 0.016251564025878906, 0.017956256866455078, 0.01966094970703125, 0.021365642547607422, 0.023070335388183594, 0.024775028228759766, 0.026479721069335938, 0.02818441390991211, 0.02988910675048828, 0.03159379959106445, 0.033298492431640625, 0.0350031852722168, 0.03670787811279297, 0.03841257095336914, 0.04011726379394531, 0.041821956634521484, 0.043526649475097656, 0.04523134231567383, 0.04693603515625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 4.0, 7.0, 14.0, 18.0, 24.0, 31.0, 50.0, 61.0, 114.0, 167.0, 287.0, 439.0, 823.0, 1623.0, 3573.0, 9690.0, 32653.0, 156135.0, 1654685.0, 2080366.0, 196084.0, 38436.0, 11091.0, 3981.0, 1711.0, 935.0, 543.0, 258.0, 199.0, 104.0, 61.0, 44.0, 18.0, 17.0, 14.0, 9.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0273284912109375, -0.026354551315307617, -0.025380611419677734, -0.02440667152404785, -0.02343273162841797, -0.022458791732788086, -0.021484851837158203, -0.02051091194152832, -0.019536972045898438, -0.018563032150268555, -0.017589092254638672, -0.01661515235900879, -0.015641212463378906, -0.014667272567749023, -0.01369333267211914, -0.012719392776489258, -0.011745452880859375, -0.010771512985229492, -0.00979757308959961, -0.008823633193969727, -0.007849693298339844, -0.006875753402709961, -0.005901813507080078, -0.004927873611450195, -0.0039539337158203125, -0.0029799938201904297, -0.002006053924560547, -0.001032114028930664, -5.817413330078125e-05, 0.0009157657623291016, 0.0018897056579589844, 0.002863645553588867, 0.00383758544921875, 0.004811525344848633, 0.005785465240478516, 0.0067594051361083984, 0.007733345031738281, 0.008707284927368164, 0.009681224822998047, 0.01065516471862793, 0.011629104614257812, 0.012603044509887695, 0.013576984405517578, 0.014550924301147461, 0.015524864196777344, 0.016498804092407227, 0.01747274398803711, 0.018446683883666992, 0.019420623779296875, 0.020394563674926758, 0.02136850357055664, 0.022342443466186523, 0.023316383361816406, 0.02429032325744629, 0.025264263153076172, 0.026238203048706055, 0.027212142944335938, 0.02818608283996582, 0.029160022735595703, 0.030133962631225586, 0.03110790252685547, 0.03208184242248535, 0.033055782318115234, 0.03402972221374512, 0.035003662109375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 1.0, 3.0, 4.0, 8.0, 17.0, 19.0, 36.0, 37.0, 92.0, 218.0, 510.0, 883.0, 947.0, 655.0, 316.0, 133.0, 62.0, 34.0, 32.0, 21.0, 14.0, 11.0, 3.0, 1.0, 6.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050689697265625, -0.04932975769042969, -0.047969818115234375, -0.04660987854003906, -0.04524993896484375, -0.04388999938964844, -0.042530059814453125, -0.04117012023925781, -0.0398101806640625, -0.03845024108886719, -0.037090301513671875, -0.03573036193847656, -0.03437042236328125, -0.03301048278808594, -0.031650543212890625, -0.030290603637695312, -0.0289306640625, -0.027570724487304688, -0.026210784912109375, -0.024850845336914062, -0.02349090576171875, -0.022130966186523438, -0.020771026611328125, -0.019411087036132812, -0.0180511474609375, -0.016691207885742188, -0.015331268310546875, -0.013971328735351562, -0.01261138916015625, -0.011251449584960938, -0.009891510009765625, -0.008531570434570312, -0.007171630859375, -0.0058116912841796875, -0.004451751708984375, -0.0030918121337890625, -0.00173187255859375, -0.0003719329833984375, 0.000988006591796875, 0.0023479461669921875, 0.0037078857421875, 0.0050678253173828125, 0.006427764892578125, 0.0077877044677734375, 0.00914764404296875, 0.010507583618164062, 0.011867523193359375, 0.013227462768554688, 0.01458740234375, 0.015947341918945312, 0.017307281494140625, 0.018667221069335938, 0.02002716064453125, 0.021387100219726562, 0.022747039794921875, 0.024106979370117188, 0.0254669189453125, 0.026826858520507812, 0.028186798095703125, 0.029546737670898438, 0.03090667724609375, 0.03226661682128906, 0.033626556396484375, 0.03498649597167969, 0.036346435546875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 9.0, 16.0, 36.0, 48.0, 86.0, 99.0, 130.0, 171.0, 134.0, 107.0, 66.0, 41.0, 22.0, 14.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23338447511196136, -0.22848081588745117, -0.22357714176177979, -0.2186734825372696, -0.2137698233127594, -0.2088661640882492, -0.20396248996257782, -0.19905883073806763, -0.19415517151355743, -0.18925151228904724, -0.18434783816337585, -0.17944417893886566, -0.17454051971435547, -0.16963686048984528, -0.1647331863641739, -0.1598295271396637, -0.1549258530139923, -0.15002219378948212, -0.14511851966381073, -0.14021486043930054, -0.13531120121479034, -0.13040754199028015, -0.12550386786460876, -0.12060020864009857, -0.11569654941558838, -0.11079288274049759, -0.1058892235159874, -0.1009855568408966, -0.09608189761638641, -0.09117823094129562, -0.08627456426620483, -0.08137090504169464, -0.07646725326776505, -0.07156358659267426, -0.06665992736816406, -0.06175626069307327, -0.05685260146856308, -0.05194893479347229, -0.0470452718436718, -0.04214160889387131, -0.037237945944070816, -0.032334282994270325, -0.027430620044469833, -0.022526955232024193, -0.0176232922822237, -0.01271962933242321, -0.00781596451997757, -0.0029123015701770782, 0.001991361379623413, 0.006895024795085192, 0.01179868821054697, 0.016702352091670036, 0.021606015041470528, 0.02650967799127102, 0.03141334280371666, 0.03631700575351715, 0.04122066870331764, 0.046124331653118134, 0.051027994602918625, 0.055931657552719116, 0.060835324227809906, 0.0657389834523201, 0.07064265012741089, 0.07554630935192108, 0.08044997602701187]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 9.0, 10.0, 7.0, 13.0, 16.0, 16.0, 17.0, 20.0, 25.0, 23.0, 20.0, 27.0, 29.0, 36.0, 44.0, 29.0, 32.0, 40.0, 32.0, 40.0, 30.0, 42.0, 46.0, 46.0, 41.0, 23.0, 32.0, 30.0, 32.0, 17.0, 24.0, 20.0, 15.0, 17.0, 19.0, 12.0, 17.0, 5.0, 7.0, 6.0, 9.0, 1.0, 2.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06870484352111816, -0.06636084616184235, -0.06401685625314713, -0.06167285889387131, -0.05932886525988579, -0.05698487162590027, -0.05464087426662445, -0.05229688063263893, -0.04995288699865341, -0.04760889336466789, -0.04526489973068237, -0.042920902371406555, -0.040576908737421036, -0.038232915103435516, -0.0358889177441597, -0.03354492411017418, -0.03120093047618866, -0.02885693684220314, -0.02651294134557247, -0.024168945848941803, -0.021824952214956284, -0.019480958580970764, -0.017136963084340096, -0.014792967587709427, -0.012448973953723907, -0.010104979388415813, -0.007760984823107719, -0.005416990257799625, -0.0030729956924915314, -0.0007290011271834373, 0.0016149934381246567, 0.003958988934755325, 0.006302982568740845, 0.008646977134048939, 0.010990971699357033, 0.013334966264665127, 0.01567896082997322, 0.01802295446395874, 0.02036694996058941, 0.022710945457220078, 0.025054939091205597, 0.027398932725191116, 0.029742928221821785, 0.032086923718452454, 0.03443091735243797, 0.03677491098642349, 0.03911890834569931, 0.04146290197968483, 0.04380689561367035, 0.04615088924765587, 0.04849488288164139, 0.050838880240917206, 0.053182873874902725, 0.055526867508888245, 0.05787086486816406, 0.06021485850214958, 0.0625588521361351, 0.06490284949541092, 0.06724683940410614, 0.06959083676338196, 0.07193483412265778, 0.074278824031353, 0.07662282139062881, 0.07896681129932404, 0.08131080865859985]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 3.0, 9.0, 4.0, 18.0, 20.0, 32.0, 37.0, 45.0, 76.0, 127.0, 188.0, 313.0, 563.0, 957.0, 2280.0, 5419.0, 16300.0, 58555.0, 241849.0, 473796.0, 182518.0, 43985.0, 13012.0, 4452.0, 1815.0, 834.0, 463.0, 297.0, 185.0, 117.0, 77.0, 65.0, 37.0, 32.0, 19.0, 17.0, 14.0, 4.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.035675048828125, -0.03446149826049805, -0.033247947692871094, -0.03203439712524414, -0.030820846557617188, -0.029607295989990234, -0.02839374542236328, -0.027180194854736328, -0.025966644287109375, -0.024753093719482422, -0.02353954315185547, -0.022325992584228516, -0.021112442016601562, -0.01989889144897461, -0.018685340881347656, -0.017471790313720703, -0.01625823974609375, -0.015044689178466797, -0.013831138610839844, -0.01261758804321289, -0.011404037475585938, -0.010190486907958984, -0.008976936340332031, -0.007763385772705078, -0.006549835205078125, -0.005336284637451172, -0.004122734069824219, -0.0029091835021972656, -0.0016956329345703125, -0.0004820823669433594, 0.0007314682006835938, 0.0019450187683105469, 0.0031585693359375, 0.004372119903564453, 0.005585670471191406, 0.006799221038818359, 0.008012771606445312, 0.009226322174072266, 0.010439872741699219, 0.011653423309326172, 0.012866973876953125, 0.014080524444580078, 0.015294075012207031, 0.016507625579833984, 0.017721176147460938, 0.01893472671508789, 0.020148277282714844, 0.021361827850341797, 0.02257537841796875, 0.023788928985595703, 0.025002479553222656, 0.02621603012084961, 0.027429580688476562, 0.028643131256103516, 0.02985668182373047, 0.031070232391357422, 0.032283782958984375, 0.03349733352661133, 0.03471088409423828, 0.035924434661865234, 0.03713798522949219, 0.03835153579711914, 0.039565086364746094, 0.04077863693237305, 0.0419921875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 8.0, 10.0, 21.0, 32.0, 29.0, 45.0, 67.0, 75.0, 98.0, 98.0, 90.0, 84.0, 73.0, 64.0, 68.0, 45.0, 30.0, 24.0, 17.0, 10.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06524658203125, -0.06362676620483398, -0.06200695037841797, -0.06038713455200195, -0.05876731872558594, -0.05714750289916992, -0.055527687072753906, -0.05390787124633789, -0.052288055419921875, -0.05066823959350586, -0.049048423767089844, -0.04742860794067383, -0.04580879211425781, -0.0441889762878418, -0.04256916046142578, -0.040949344635009766, -0.03932952880859375, -0.037709712982177734, -0.03608989715576172, -0.0344700813293457, -0.03285026550292969, -0.031230449676513672, -0.029610633850097656, -0.02799081802368164, -0.026371002197265625, -0.02475118637084961, -0.023131370544433594, -0.021511554718017578, -0.019891738891601562, -0.018271923065185547, -0.01665210723876953, -0.015032291412353516, -0.0134124755859375, -0.011792659759521484, -0.010172843933105469, -0.008553028106689453, -0.0069332122802734375, -0.005313396453857422, -0.0036935806274414062, -0.0020737648010253906, -0.000453948974609375, 0.0011658668518066406, 0.0027856826782226562, 0.004405498504638672, 0.0060253143310546875, 0.007645130157470703, 0.009264945983886719, 0.010884761810302734, 0.01250457763671875, 0.014124393463134766, 0.01574420928955078, 0.017364025115966797, 0.018983840942382812, 0.020603656768798828, 0.022223472595214844, 0.02384328842163086, 0.025463104248046875, 0.02708292007446289, 0.028702735900878906, 0.030322551727294922, 0.03194236755371094, 0.03356218338012695, 0.03518199920654297, 0.036801815032958984, 0.038421630859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 6.0, 7.0, 15.0, 12.0, 22.0, 32.0, 39.0, 45.0, 57.0, 100.0, 132.0, 216.0, 282.0, 480.0, 833.0, 1485.0, 2706.0, 5302.0, 10468.0, 21373.0, 46361.0, 107544.0, 235513.0, 300242.0, 174041.0, 75161.0, 33321.0, 15908.0, 7692.0, 3920.0, 2173.0, 1142.0, 688.0, 408.0, 275.0, 150.0, 115.0, 78.0, 50.0, 38.0, 38.0, 23.0, 20.0, 17.0, 8.0, 5.0, 9.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0239105224609375, -0.023169994354248047, -0.022429466247558594, -0.02168893814086914, -0.020948410034179688, -0.020207881927490234, -0.01946735382080078, -0.018726825714111328, -0.017986297607421875, -0.017245769500732422, -0.01650524139404297, -0.015764713287353516, -0.015024185180664062, -0.01428365707397461, -0.013543128967285156, -0.012802600860595703, -0.01206207275390625, -0.011321544647216797, -0.010581016540527344, -0.00984048843383789, -0.009099960327148438, -0.008359432220458984, -0.007618904113769531, -0.006878376007080078, -0.006137847900390625, -0.005397319793701172, -0.004656791687011719, -0.003916263580322266, -0.0031757354736328125, -0.0024352073669433594, -0.0016946792602539062, -0.0009541511535644531, -0.000213623046875, 0.0005269050598144531, 0.0012674331665039062, 0.0020079612731933594, 0.0027484893798828125, 0.0034890174865722656, 0.004229545593261719, 0.004970073699951172, 0.005710601806640625, 0.006451129913330078, 0.007191658020019531, 0.007932186126708984, 0.008672714233398438, 0.00941324234008789, 0.010153770446777344, 0.010894298553466797, 0.01163482666015625, 0.012375354766845703, 0.013115882873535156, 0.01385641098022461, 0.014596939086914062, 0.015337467193603516, 0.01607799530029297, 0.016818523406982422, 0.017559051513671875, 0.018299579620361328, 0.01904010772705078, 0.019780635833740234, 0.020521163940429688, 0.02126169204711914, 0.022002220153808594, 0.022742748260498047, 0.0234832763671875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 4.0, 9.0, 3.0, 6.0, 7.0, 9.0, 13.0, 17.0, 17.0, 28.0, 18.0, 19.0, 22.0, 38.0, 33.0, 29.0, 36.0, 32.0, 44.0, 49.0, 59.0, 39.0, 37.0, 42.0, 35.0, 41.0, 40.0, 31.0, 31.0, 26.0, 28.0, 18.0, 21.0, 20.0, 23.0, 15.0, 10.0, 7.0, 10.0, 8.0, 7.0, 5.0, 5.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.058807373046875, -0.05710029602050781, -0.055393218994140625, -0.05368614196777344, -0.05197906494140625, -0.05027198791503906, -0.048564910888671875, -0.04685783386230469, -0.0451507568359375, -0.04344367980957031, -0.041736602783203125, -0.04002952575683594, -0.03832244873046875, -0.03661537170410156, -0.034908294677734375, -0.03320121765136719, -0.031494140625, -0.029787063598632812, -0.028079986572265625, -0.026372909545898438, -0.02466583251953125, -0.022958755493164062, -0.021251678466796875, -0.019544601440429688, -0.0178375244140625, -0.016130447387695312, -0.014423370361328125, -0.012716293334960938, -0.01100921630859375, -0.009302139282226562, -0.007595062255859375, -0.0058879852294921875, -0.004180908203125, -0.0024738311767578125, -0.000766754150390625, 0.0009403228759765625, 0.00264739990234375, 0.0043544769287109375, 0.006061553955078125, 0.0077686309814453125, 0.0094757080078125, 0.011182785034179688, 0.012889862060546875, 0.014596939086914062, 0.01630401611328125, 0.018011093139648438, 0.019718170166015625, 0.021425247192382812, 0.02313232421875, 0.024839401245117188, 0.026546478271484375, 0.028253555297851562, 0.02996063232421875, 0.03166770935058594, 0.033374786376953125, 0.03508186340332031, 0.0367889404296875, 0.03849601745605469, 0.040203094482421875, 0.04191017150878906, 0.04361724853515625, 0.04532432556152344, 0.047031402587890625, 0.04873847961425781, 0.050445556640625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 13.0, 9.0, 23.0, 42.0, 44.0, 84.0, 123.0, 179.0, 299.0, 456.0, 775.0, 1268.0, 2206.0, 3853.0, 7137.0, 13261.0, 25864.0, 50197.0, 95608.0, 158816.0, 205558.0, 192237.0, 132689.0, 75186.0, 39079.0, 20010.0, 10448.0, 5495.0, 3100.0, 1827.0, 972.0, 623.0, 375.0, 246.0, 152.0, 95.0, 67.0, 45.0, 35.0, 23.0, 14.0, 8.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00431060791015625, -0.004175066947937012, -0.0040395259857177734, -0.003903985023498535, -0.003768444061279297, -0.0036329030990600586, -0.0034973621368408203, -0.003361821174621582, -0.0032262802124023438, -0.0030907392501831055, -0.002955198287963867, -0.002819657325744629, -0.0026841163635253906, -0.0025485754013061523, -0.002413034439086914, -0.0022774934768676758, -0.0021419525146484375, -0.0020064115524291992, -0.001870870590209961, -0.0017353296279907227, -0.0015997886657714844, -0.001464247703552246, -0.0013287067413330078, -0.0011931657791137695, -0.0010576248168945312, -0.000922083854675293, -0.0007865428924560547, -0.0006510019302368164, -0.0005154609680175781, -0.00037992000579833984, -0.00024437904357910156, -0.00010883808135986328, 2.6702880859375e-05, 0.00016224384307861328, 0.00029778480529785156, 0.00043332576751708984, 0.0005688667297363281, 0.0007044076919555664, 0.0008399486541748047, 0.000975489616394043, 0.0011110305786132812, 0.0012465715408325195, 0.0013821125030517578, 0.001517653465270996, 0.0016531944274902344, 0.0017887353897094727, 0.001924276351928711, 0.0020598173141479492, 0.0021953582763671875, 0.0023308992385864258, 0.002466440200805664, 0.0026019811630249023, 0.0027375221252441406, 0.002873063087463379, 0.003008604049682617, 0.0031441450119018555, 0.0032796859741210938, 0.003415226936340332, 0.0035507678985595703, 0.0036863088607788086, 0.003821849822998047, 0.003957390785217285, 0.0040929317474365234, 0.004228472709655762, 0.004364013671875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 0.0, 2.0, 6.0, 4.0, 8.0, 7.0, 12.0, 4.0, 28.0, 12.0, 20.0, 43.0, 31.0, 30.0, 72.0, 41.0, 41.0, 82.0, 48.0, 38.0, 80.0, 43.0, 34.0, 76.0, 27.0, 50.0, 24.0, 18.0, 40.0, 15.0, 9.0, 19.0, 9.0, 4.0, 14.0, 4.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2649765014648438e-06, -2.1848827600479126e-06, -2.1047890186309814e-06, -2.0246952772140503e-06, -1.944601535797119e-06, -1.864507794380188e-06, -1.7844140529632568e-06, -1.7043203115463257e-06, -1.6242265701293945e-06, -1.5441328287124634e-06, -1.4640390872955322e-06, -1.383945345878601e-06, -1.30385160446167e-06, -1.2237578630447388e-06, -1.1436641216278076e-06, -1.0635703802108765e-06, -9.834766387939453e-07, -9.033828973770142e-07, -8.23289155960083e-07, -7.431954145431519e-07, -6.631016731262207e-07, -5.830079317092896e-07, -5.029141902923584e-07, -4.2282044887542725e-07, -3.427267074584961e-07, -2.6263296604156494e-07, -1.825392246246338e-07, -1.0244548320770264e-07, -2.2351741790771484e-08, 5.774199962615967e-08, 1.3783574104309082e-07, 2.1792948246002197e-07, 2.980232238769531e-07, 3.781169652938843e-07, 4.5821070671081543e-07, 5.383044481277466e-07, 6.183981895446777e-07, 6.984919309616089e-07, 7.7858567237854e-07, 8.586794137954712e-07, 9.387731552124023e-07, 1.0188668966293335e-06, 1.0989606380462646e-06, 1.1790543794631958e-06, 1.259148120880127e-06, 1.339241862297058e-06, 1.4193356037139893e-06, 1.4994293451309204e-06, 1.5795230865478516e-06, 1.6596168279647827e-06, 1.7397105693817139e-06, 1.819804310798645e-06, 1.8998980522155762e-06, 1.9799917936325073e-06, 2.0600855350494385e-06, 2.1401792764663696e-06, 2.2202730178833008e-06, 2.300366759300232e-06, 2.380460500717163e-06, 2.4605542421340942e-06, 2.5406479835510254e-06, 2.6207417249679565e-06, 2.7008354663848877e-06, 2.780929207801819e-06, 2.86102294921875e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 6.0, 5.0, 11.0, 8.0, 16.0, 17.0, 34.0, 48.0, 90.0, 142.0, 255.0, 445.0, 830.0, 1559.0, 3281.0, 7335.0, 17287.0, 41797.0, 101349.0, 208000.0, 279978.0, 209307.0, 102384.0, 42586.0, 17565.0, 7449.0, 3308.0, 1560.0, 820.0, 461.0, 236.0, 148.0, 81.0, 44.0, 39.0, 25.0, 19.0, 9.0, 9.0, 12.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00588226318359375, -0.005689442157745361, -0.005496621131896973, -0.005303800106048584, -0.005110979080200195, -0.004918158054351807, -0.004725337028503418, -0.004532516002655029, -0.004339694976806641, -0.004146873950958252, -0.003954052925109863, -0.0037612318992614746, -0.003568410873413086, -0.0033755898475646973, -0.0031827688217163086, -0.00298994779586792, -0.0027971267700195312, -0.0026043057441711426, -0.002411484718322754, -0.0022186636924743652, -0.0020258426666259766, -0.0018330216407775879, -0.0016402006149291992, -0.0014473795890808105, -0.0012545585632324219, -0.0010617375373840332, -0.0008689165115356445, -0.0006760954856872559, -0.0004832744598388672, -0.0002904534339904785, -9.763240814208984e-05, 9.518861770629883e-05, 0.0002880096435546875, 0.00048083066940307617, 0.0006736516952514648, 0.0008664727210998535, 0.0010592937469482422, 0.0012521147727966309, 0.0014449357986450195, 0.0016377568244934082, 0.0018305778503417969, 0.0020233988761901855, 0.0022162199020385742, 0.002409040927886963, 0.0026018619537353516, 0.0027946829795837402, 0.002987504005432129, 0.0031803250312805176, 0.0033731460571289062, 0.003565967082977295, 0.0037587881088256836, 0.003951609134674072, 0.004144430160522461, 0.00433725118637085, 0.004530072212219238, 0.004722893238067627, 0.004915714263916016, 0.005108535289764404, 0.005301356315612793, 0.005494177341461182, 0.00568699836730957, 0.005879819393157959, 0.006072640419006348, 0.006265461444854736, 0.006458282470703125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 1.0, 3.0, 6.0, 4.0, 7.0, 5.0, 10.0, 22.0, 16.0, 33.0, 41.0, 47.0, 53.0, 62.0, 77.0, 62.0, 56.0, 78.0, 87.0, 57.0, 46.0, 47.0, 37.0, 34.0, 25.0, 22.0, 20.0, 5.0, 18.0, 12.0, 6.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00795745849609375, -0.007674098014831543, -0.007390737533569336, -0.007107377052307129, -0.006824016571044922, -0.006540656089782715, -0.006257295608520508, -0.005973935127258301, -0.005690574645996094, -0.005407214164733887, -0.00512385368347168, -0.004840493202209473, -0.004557132720947266, -0.004273772239685059, -0.0039904117584228516, -0.0037070512771606445, -0.0034236907958984375, -0.0031403303146362305, -0.0028569698333740234, -0.0025736093521118164, -0.0022902488708496094, -0.0020068883895874023, -0.0017235279083251953, -0.0014401674270629883, -0.0011568069458007812, -0.0008734464645385742, -0.0005900859832763672, -0.00030672550201416016, -2.3365020751953125e-05, 0.0002599954605102539, 0.0005433559417724609, 0.000826716423034668, 0.001110076904296875, 0.001393437385559082, 0.001676797866821289, 0.001960158348083496, 0.002243518829345703, 0.00252687931060791, 0.002810239791870117, 0.0030936002731323242, 0.0033769607543945312, 0.0036603212356567383, 0.003943681716918945, 0.004227042198181152, 0.004510402679443359, 0.004793763160705566, 0.0050771236419677734, 0.0053604841232299805, 0.0056438446044921875, 0.0059272050857543945, 0.0062105655670166016, 0.006493926048278809, 0.006777286529541016, 0.007060647010803223, 0.00734400749206543, 0.007627367973327637, 0.007910728454589844, 0.00819408893585205, 0.008477449417114258, 0.008760809898376465, 0.009044170379638672, 0.009327530860900879, 0.009610891342163086, 0.009894251823425293, 0.0101776123046875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 22.0, 49.0, 132.0, 269.0, 258.0, 154.0, 63.0, 31.0, 11.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27737826108932495, -0.2692928910255432, -0.2612074911594391, -0.25312212109565735, -0.2450367510318756, -0.23695136606693268, -0.22886598110198975, -0.220780611038208, -0.21269522607326508, -0.20460984110832214, -0.1965244710445404, -0.18843908607959747, -0.18035370111465454, -0.1722683310508728, -0.16418294608592987, -0.15609756112098694, -0.1480121910572052, -0.13992680609226227, -0.13184143602848053, -0.1237560510635376, -0.11567067354917526, -0.10758529603481293, -0.09949991106987, -0.09141453355550766, -0.08332915604114532, -0.07524377852678299, -0.06715840101242065, -0.05907301604747772, -0.05098763853311539, -0.04290226101875305, -0.03481687977910042, -0.026731498539447784, -0.018646135926246643, -0.010560756549239159, -0.002475377172231674, 0.00561000220477581, 0.013695381581783295, 0.02178075909614563, 0.029866140335798264, 0.0379515215754509, 0.04603689908981323, 0.05412227660417557, 0.0622076578438282, 0.07029303908348083, 0.07837841659784317, 0.0864637941122055, 0.09454917907714844, 0.10263455659151077, 0.11071993410587311, 0.11880531162023544, 0.12689068913459778, 0.1349760740995407, 0.14306145906448364, 0.15114682912826538, 0.1592322140932083, 0.16731759905815125, 0.17540296912193298, 0.18348835408687592, 0.19157372415065765, 0.19965910911560059, 0.20774447917938232, 0.21582986414432526, 0.2239152491092682, 0.23200061917304993, 0.24008600413799286]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 3.0, 8.0, 7.0, 10.0, 10.0, 10.0, 16.0, 17.0, 20.0, 22.0, 29.0, 28.0, 33.0, 36.0, 26.0, 30.0, 38.0, 36.0, 37.0, 35.0, 35.0, 42.0, 34.0, 45.0, 31.0, 44.0, 35.0, 39.0, 26.0, 32.0, 28.0, 24.0, 19.0, 21.0, 17.0, 12.0, 17.0, 11.0, 7.0, 9.0, 4.0, 3.0, 7.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.1458343267440796, -0.14177799224853516, -0.13772164285182953, -0.1336653083562851, -0.12960895895957947, -0.12555262446403503, -0.12149628251791, -0.11743994057178497, -0.11338359862565994, -0.10932725667953491, -0.10527091473340988, -0.10121457278728485, -0.09715823829174042, -0.09310188889503479, -0.08904555439949036, -0.08498921245336533, -0.0809328705072403, -0.07687652856111526, -0.07282018661499023, -0.0687638446688652, -0.06470750272274017, -0.06065116450190544, -0.05659482628107071, -0.05253848433494568, -0.04848214238882065, -0.04442580044269562, -0.04036945849657059, -0.036313120275735855, -0.032256778329610825, -0.028200436383485794, -0.024144096300005913, -0.02008775621652603, -0.016031414270401, -0.011975073255598545, -0.00791873224079609, -0.0038623912259936333, 0.00019394978880882263, 0.004250291734933853, 0.008306631818413734, 0.012362971901893616, 0.016419313848018646, 0.020475655794143677, 0.024531995877623558, 0.02858833596110344, 0.03264467790722847, 0.0367010198533535, 0.04075735807418823, 0.04481370002031326, 0.04887004196643829, 0.052926383912563324, 0.056982725858688354, 0.06103906407952309, 0.06509540975093842, 0.06915174424648285, 0.07320808619260788, 0.07726442813873291, 0.08132077008485794, 0.08537711203098297, 0.089433453977108, 0.09348979592323303, 0.09754613041877747, 0.1016024798154831, 0.10565881431102753, 0.10971515625715256, 0.11377149820327759]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 3.0, 8.0, 6.0, 24.0, 36.0, 57.0, 103.0, 149.0, 258.0, 436.0, 925.0, 5090.0, 18634.0, 176764.0, 2313336.0, 1575777.0, 82357.0, 12866.0, 5216.0, 1323.0, 350.0, 214.0, 134.0, 83.0, 58.0, 22.0, 21.0, 9.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059478759765625, -0.057773590087890625, -0.05606842041015625, -0.054363250732421875, -0.0526580810546875, -0.050952911376953125, -0.04924774169921875, -0.047542572021484375, -0.04583740234375, -0.044132232666015625, -0.04242706298828125, -0.040721893310546875, -0.0390167236328125, -0.037311553955078125, -0.03560638427734375, -0.033901214599609375, -0.032196044921875, -0.030490875244140625, -0.02878570556640625, -0.027080535888671875, -0.0253753662109375, -0.023670196533203125, -0.02196502685546875, -0.020259857177734375, -0.0185546875, -0.016849517822265625, -0.01514434814453125, -0.013439178466796875, -0.0117340087890625, -0.010028839111328125, -0.00832366943359375, -0.006618499755859375, -0.004913330078125, -0.003208160400390625, -0.00150299072265625, 0.000202178955078125, 0.0019073486328125, 0.003612518310546875, 0.00531768798828125, 0.007022857666015625, 0.00872802734375, 0.010433197021484375, 0.01213836669921875, 0.013843536376953125, 0.0155487060546875, 0.017253875732421875, 0.01895904541015625, 0.020664215087890625, 0.022369384765625, 0.024074554443359375, 0.02577972412109375, 0.027484893798828125, 0.0291900634765625, 0.030895233154296875, 0.03260040283203125, 0.034305572509765625, 0.0360107421875, 0.037715911865234375, 0.03942108154296875, 0.041126251220703125, 0.0428314208984375, 0.044536590576171875, 0.04624176025390625, 0.047946929931640625, 0.049652099609375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 18.0, 23.0, 34.0, 36.0, 50.0, 76.0, 82.0, 85.0, 92.0, 92.0, 87.0, 70.0, 52.0, 57.0, 44.0, 34.0, 18.0, 19.0, 10.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.057281494140625, -0.05568885803222656, -0.054096221923828125, -0.05250358581542969, -0.05091094970703125, -0.04931831359863281, -0.047725677490234375, -0.04613304138183594, -0.0445404052734375, -0.04294776916503906, -0.041355133056640625, -0.03976249694824219, -0.03816986083984375, -0.03657722473144531, -0.034984588623046875, -0.03339195251464844, -0.03179931640625, -0.030206680297851562, -0.028614044189453125, -0.027021408081054688, -0.02542877197265625, -0.023836135864257812, -0.022243499755859375, -0.020650863647460938, -0.0190582275390625, -0.017465591430664062, -0.015872955322265625, -0.014280319213867188, -0.01268768310546875, -0.011095046997070312, -0.009502410888671875, -0.007909774780273438, -0.006317138671875, -0.0047245025634765625, -0.003131866455078125, -0.0015392303466796875, 5.340576171875e-05, 0.0016460418701171875, 0.003238677978515625, 0.0048313140869140625, 0.0064239501953125, 0.008016586303710938, 0.009609222412109375, 0.011201858520507812, 0.01279449462890625, 0.014387130737304688, 0.015979766845703125, 0.017572402954101562, 0.0191650390625, 0.020757675170898438, 0.022350311279296875, 0.023942947387695312, 0.02553558349609375, 0.027128219604492188, 0.028720855712890625, 0.030313491821289062, 0.0319061279296875, 0.03349876403808594, 0.035091400146484375, 0.03668403625488281, 0.03827667236328125, 0.03986930847167969, 0.041461944580078125, 0.04305458068847656, 0.044647216796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 11.0, 11.0, 25.0, 11.0, 22.0, 45.0, 77.0, 97.0, 143.0, 246.0, 394.0, 761.0, 1753.0, 3757.0, 10230.0, 33696.0, 147384.0, 1353279.0, 2312105.0, 255263.0, 50824.0, 14564.0, 5123.0, 2169.0, 987.0, 501.0, 258.0, 164.0, 144.0, 65.0, 51.0, 30.0, 28.0, 17.0, 15.0, 7.0, 6.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03460693359375, -0.03362226486206055, -0.032637596130371094, -0.03165292739868164, -0.030668258666992188, -0.029683589935302734, -0.02869892120361328, -0.027714252471923828, -0.026729583740234375, -0.025744915008544922, -0.02476024627685547, -0.023775577545166016, -0.022790908813476562, -0.02180624008178711, -0.020821571350097656, -0.019836902618408203, -0.01885223388671875, -0.017867565155029297, -0.016882896423339844, -0.01589822769165039, -0.014913558959960938, -0.013928890228271484, -0.012944221496582031, -0.011959552764892578, -0.010974884033203125, -0.009990215301513672, -0.009005546569824219, -0.008020877838134766, -0.0070362091064453125, -0.006051540374755859, -0.005066871643066406, -0.004082202911376953, -0.0030975341796875, -0.002112865447998047, -0.0011281967163085938, -0.00014352798461914062, 0.0008411407470703125, 0.0018258094787597656, 0.0028104782104492188, 0.003795146942138672, 0.004779815673828125, 0.005764484405517578, 0.006749153137207031, 0.007733821868896484, 0.008718490600585938, 0.00970315933227539, 0.010687828063964844, 0.011672496795654297, 0.01265716552734375, 0.013641834259033203, 0.014626502990722656, 0.01561117172241211, 0.016595840454101562, 0.017580509185791016, 0.01856517791748047, 0.019549846649169922, 0.020534515380859375, 0.021519184112548828, 0.02250385284423828, 0.023488521575927734, 0.024473190307617188, 0.02545785903930664, 0.026442527770996094, 0.027427196502685547, 0.028411865234375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 7.0, 7.0, 17.0, 20.0, 27.0, 46.0, 81.0, 178.0, 467.0, 853.0, 1001.0, 686.0, 325.0, 134.0, 72.0, 42.0, 31.0, 19.0, 17.0, 14.0, 9.0, 7.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0572509765625, -0.05552959442138672, -0.05380821228027344, -0.052086830139160156, -0.050365447998046875, -0.048644065856933594, -0.04692268371582031, -0.04520130157470703, -0.04347991943359375, -0.04175853729248047, -0.04003715515136719, -0.038315773010253906, -0.036594390869140625, -0.034873008728027344, -0.03315162658691406, -0.03143024444580078, -0.0297088623046875, -0.02798748016357422, -0.026266098022460938, -0.024544715881347656, -0.022823333740234375, -0.021101951599121094, -0.019380569458007812, -0.01765918731689453, -0.01593780517578125, -0.014216423034667969, -0.012495040893554688, -0.010773658752441406, -0.009052276611328125, -0.007330894470214844, -0.0056095123291015625, -0.0038881301879882812, -0.002166748046875, -0.00044536590576171875, 0.0012760162353515625, 0.0029973983764648438, 0.004718780517578125, 0.006440162658691406, 0.008161544799804688, 0.009882926940917969, 0.01160430908203125, 0.013325691223144531, 0.015047073364257812, 0.016768455505371094, 0.018489837646484375, 0.020211219787597656, 0.021932601928710938, 0.02365398406982422, 0.0253753662109375, 0.02709674835205078, 0.028818130493164062, 0.030539512634277344, 0.032260894775390625, 0.033982276916503906, 0.03570365905761719, 0.03742504119873047, 0.03914642333984375, 0.04086780548095703, 0.04258918762207031, 0.044310569763183594, 0.046031951904296875, 0.047753334045410156, 0.04947471618652344, 0.05119609832763672, 0.05291748046875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 14.0, 97.0, 349.0, 393.0, 123.0, 23.0, 8.0, 5.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7296496033668518, -0.7122619152069092, -0.6948742270469666, -0.6774865388870239, -0.6600988507270813, -0.6427111625671387, -0.6253235340118408, -0.6079358458518982, -0.5905481576919556, -0.5731604695320129, -0.5557727813720703, -0.5383850932121277, -0.5209974050521851, -0.5036097764968872, -0.4862220585346222, -0.46883437037467957, -0.45144668221473694, -0.4340589940547943, -0.4166713058948517, -0.39928364753723145, -0.3818959593772888, -0.3645082712173462, -0.34712058305740356, -0.32973289489746094, -0.3123452067375183, -0.2949575185775757, -0.27756983041763306, -0.26018214225769043, -0.2427944839000702, -0.22540679574012756, -0.20801910758018494, -0.1906314194202423, -0.17324373126029968, -0.15585604310035706, -0.13846836984157562, -0.121080681681633, -0.10369300097227097, -0.08630532026290894, -0.06891763210296631, -0.05152995139360428, -0.03414227068424225, -0.01675458811223507, 0.00063309445977211, 0.01802077889442444, 0.03540845960378647, 0.0527961403131485, 0.07018382847309113, 0.08757150918245316, 0.10495918989181519, 0.12234687060117722, 0.13973455131053925, 0.15712223947048187, 0.1745099127292633, 0.19189760088920593, 0.20928528904914856, 0.2266729772090912, 0.24406065046787262, 0.26144832372665405, 0.2788360118865967, 0.2962237000465393, 0.31361138820648193, 0.33099907636642456, 0.3483867645263672, 0.3657744228839874, 0.38316211104393005]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 7.0, 8.0, 14.0, 16.0, 20.0, 22.0, 18.0, 26.0, 36.0, 29.0, 41.0, 35.0, 49.0, 41.0, 49.0, 32.0, 45.0, 37.0, 40.0, 46.0, 27.0, 40.0, 40.0, 49.0, 42.0, 30.0, 23.0, 25.0, 19.0, 21.0, 15.0, 14.0, 12.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.11659586429595947, -0.11305682361125946, -0.10951777547597885, -0.10597872734069824, -0.10243968665599823, -0.09890064597129822, -0.09536159783601761, -0.091822549700737, -0.08828350901603699, -0.08474446833133698, -0.08120542019605637, -0.07766637206077576, -0.07412733137607574, -0.07058829069137573, -0.06704924255609512, -0.06351019442081451, -0.0599711537361145, -0.05643210932612419, -0.05289306491613388, -0.04935402050614357, -0.04581497609615326, -0.04227593168616295, -0.03873688727617264, -0.03519784286618233, -0.03165879845619202, -0.028119754046201706, -0.024580709636211395, -0.021041665226221085, -0.017502620816230774, -0.013963576406240463, -0.010424531996250153, -0.006885487586259842, -0.0033464431762695312, 0.00019260123372077942, 0.00373164564371109, 0.007270690053701401, 0.010809734463691711, 0.014348778873682022, 0.017887823283672333, 0.021426867693662643, 0.024965912103652954, 0.028504956513643265, 0.032044000923633575, 0.035583045333623886, 0.0391220897436142, 0.04266113415360451, 0.04620017856359482, 0.04973922297358513, 0.05327826738357544, 0.05681731179356575, 0.06035635620355606, 0.06389540433883667, 0.06743444502353668, 0.0709734857082367, 0.0745125338435173, 0.07805158197879791, 0.08159062266349792, 0.08512966334819794, 0.08866871148347855, 0.09220775961875916, 0.09574680030345917, 0.09928584098815918, 0.10282488912343979, 0.1063639372587204, 0.10990297794342041]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 7.0, 13.0, 11.0, 10.0, 33.0, 16.0, 39.0, 49.0, 46.0, 89.0, 104.0, 129.0, 210.0, 302.0, 427.0, 644.0, 1107.0, 2136.0, 4793.0, 12574.0, 34991.0, 102239.0, 276714.0, 358606.0, 163699.0, 55748.0, 19293.0, 7369.0, 3138.0, 1482.0, 820.0, 509.0, 341.0, 248.0, 149.0, 122.0, 86.0, 65.0, 53.0, 38.0, 31.0, 22.0, 9.0, 11.0, 12.0, 6.0, 5.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.033172607421875, -0.032074928283691406, -0.030977249145507812, -0.02987957000732422, -0.028781890869140625, -0.02768421173095703, -0.026586532592773438, -0.025488853454589844, -0.02439117431640625, -0.023293495178222656, -0.022195816040039062, -0.02109813690185547, -0.020000457763671875, -0.01890277862548828, -0.017805099487304688, -0.016707420349121094, -0.0156097412109375, -0.014512062072753906, -0.013414382934570312, -0.012316703796386719, -0.011219024658203125, -0.010121345520019531, -0.009023666381835938, -0.007925987243652344, -0.00682830810546875, -0.005730628967285156, -0.0046329498291015625, -0.0035352706909179688, -0.002437591552734375, -0.0013399124145507812, -0.0002422332763671875, 0.0008554458618164062, 0.001953125, 0.0030508041381835938, 0.0041484832763671875, 0.005246162414550781, 0.006343841552734375, 0.007441520690917969, 0.008539199829101562, 0.009636878967285156, 0.01073455810546875, 0.011832237243652344, 0.012929916381835938, 0.014027595520019531, 0.015125274658203125, 0.01622295379638672, 0.017320632934570312, 0.018418312072753906, 0.0195159912109375, 0.020613670349121094, 0.021711349487304688, 0.02280902862548828, 0.023906707763671875, 0.02500438690185547, 0.026102066040039062, 0.027199745178222656, 0.02829742431640625, 0.029395103454589844, 0.030492782592773438, 0.03159046173095703, 0.032688140869140625, 0.03378582000732422, 0.03488349914550781, 0.035981178283691406, 0.037078857421875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 7.0, 8.0, 17.0, 35.0, 37.0, 60.0, 69.0, 63.0, 108.0, 97.0, 94.0, 87.0, 78.0, 78.0, 44.0, 36.0, 21.0, 24.0, 16.0, 6.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0615234375, -0.0599064826965332, -0.058289527893066406, -0.05667257308959961, -0.05505561828613281, -0.053438663482666016, -0.05182170867919922, -0.05020475387573242, -0.048587799072265625, -0.04697084426879883, -0.04535388946533203, -0.043736934661865234, -0.04211997985839844, -0.04050302505493164, -0.038886070251464844, -0.03726911544799805, -0.03565216064453125, -0.03403520584106445, -0.032418251037597656, -0.03080129623413086, -0.029184341430664062, -0.027567386627197266, -0.02595043182373047, -0.024333477020263672, -0.022716522216796875, -0.021099567413330078, -0.01948261260986328, -0.017865657806396484, -0.016248703002929688, -0.01463174819946289, -0.013014793395996094, -0.011397838592529297, -0.0097808837890625, -0.008163928985595703, -0.006546974182128906, -0.004930019378662109, -0.0033130645751953125, -0.0016961097717285156, -7.915496826171875e-05, 0.0015377998352050781, 0.003154754638671875, 0.004771709442138672, 0.006388664245605469, 0.008005619049072266, 0.009622573852539062, 0.01123952865600586, 0.012856483459472656, 0.014473438262939453, 0.01609039306640625, 0.017707347869873047, 0.019324302673339844, 0.02094125747680664, 0.022558212280273438, 0.024175167083740234, 0.02579212188720703, 0.027409076690673828, 0.029026031494140625, 0.030642986297607422, 0.03225994110107422, 0.033876895904541016, 0.03549385070800781, 0.03711080551147461, 0.038727760314941406, 0.0403447151184082, 0.041961669921875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 14.0, 18.0, 14.0, 26.0, 33.0, 75.0, 106.0, 125.0, 154.0, 234.0, 437.0, 663.0, 1260.0, 2418.0, 5206.0, 11845.0, 29596.0, 78471.0, 215976.0, 372659.0, 205393.0, 74023.0, 28164.0, 11345.0, 4782.0, 2442.0, 1199.0, 681.0, 384.0, 257.0, 172.0, 121.0, 70.0, 54.0, 44.0, 33.0, 19.0, 7.0, 10.0, 11.0, 7.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0411376953125, -0.03997802734375, -0.038818359375, -0.03765869140625, -0.0364990234375, -0.03533935546875, -0.0341796875, -0.03302001953125, -0.0318603515625, -0.03070068359375, -0.029541015625, -0.02838134765625, -0.0272216796875, -0.02606201171875, -0.02490234375, -0.02374267578125, -0.0225830078125, -0.02142333984375, -0.020263671875, -0.01910400390625, -0.0179443359375, -0.01678466796875, -0.015625, -0.01446533203125, -0.0133056640625, -0.01214599609375, -0.010986328125, -0.00982666015625, -0.0086669921875, -0.00750732421875, -0.00634765625, -0.00518798828125, -0.0040283203125, -0.00286865234375, -0.001708984375, -0.00054931640625, 0.0006103515625, 0.00177001953125, 0.0029296875, 0.00408935546875, 0.0052490234375, 0.00640869140625, 0.007568359375, 0.00872802734375, 0.0098876953125, 0.01104736328125, 0.01220703125, 0.01336669921875, 0.0145263671875, 0.01568603515625, 0.016845703125, 0.01800537109375, 0.0191650390625, 0.02032470703125, 0.021484375, 0.02264404296875, 0.0238037109375, 0.02496337890625, 0.026123046875, 0.02728271484375, 0.0284423828125, 0.02960205078125, 0.03076171875, 0.03192138671875, 0.0330810546875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 16.0, 9.0, 9.0, 17.0, 22.0, 24.0, 21.0, 24.0, 32.0, 29.0, 32.0, 29.0, 38.0, 40.0, 56.0, 32.0, 44.0, 44.0, 43.0, 39.0, 44.0, 41.0, 40.0, 35.0, 21.0, 30.0, 23.0, 19.0, 24.0, 18.0, 16.0, 13.0, 7.0, 13.0, 6.0, 6.0, 5.0, 5.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0662841796875, -0.06424999237060547, -0.06221580505371094, -0.060181617736816406, -0.058147430419921875, -0.056113243103027344, -0.05407905578613281, -0.05204486846923828, -0.05001068115234375, -0.04797649383544922, -0.04594230651855469, -0.043908119201660156, -0.041873931884765625, -0.039839744567871094, -0.03780555725097656, -0.03577136993408203, -0.0337371826171875, -0.03170299530029297, -0.029668807983398438, -0.027634620666503906, -0.025600433349609375, -0.023566246032714844, -0.021532058715820312, -0.01949787139892578, -0.01746368408203125, -0.015429496765136719, -0.013395309448242188, -0.011361122131347656, -0.009326934814453125, -0.007292747497558594, -0.0052585601806640625, -0.0032243728637695312, -0.001190185546875, 0.0008440017700195312, 0.0028781890869140625, 0.004912376403808594, 0.006946563720703125, 0.008980751037597656, 0.011014938354492188, 0.013049125671386719, 0.01508331298828125, 0.01711750030517578, 0.019151687622070312, 0.021185874938964844, 0.023220062255859375, 0.025254249572753906, 0.027288436889648438, 0.02932262420654297, 0.0313568115234375, 0.03339099884033203, 0.03542518615722656, 0.037459373474121094, 0.039493560791015625, 0.041527748107910156, 0.04356193542480469, 0.04559612274169922, 0.04763031005859375, 0.04966449737548828, 0.05169868469238281, 0.053732872009277344, 0.055767059326171875, 0.057801246643066406, 0.05983543395996094, 0.06186962127685547, 0.06390380859375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 7.0, 13.0, 21.0, 26.0, 41.0, 53.0, 101.0, 111.0, 202.0, 312.0, 521.0, 907.0, 1616.0, 2936.0, 5414.0, 10414.0, 20585.0, 41335.0, 85932.0, 178429.0, 270599.0, 214218.0, 109579.0, 51928.0, 25356.0, 12859.0, 6768.0, 3461.0, 1956.0, 1148.0, 610.0, 414.0, 216.0, 156.0, 104.0, 65.0, 42.0, 32.0, 18.0, 10.0, 11.0, 7.0, 1.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00762939453125, -0.007388412952423096, -0.007147431373596191, -0.006906449794769287, -0.006665468215942383, -0.0064244866371154785, -0.006183505058288574, -0.00594252347946167, -0.005701541900634766, -0.005460560321807861, -0.005219578742980957, -0.004978597164154053, -0.0047376155853271484, -0.004496634006500244, -0.00425565242767334, -0.0040146708488464355, -0.0037736892700195312, -0.003532707691192627, -0.0032917261123657227, -0.0030507445335388184, -0.002809762954711914, -0.0025687813758850098, -0.0023277997970581055, -0.002086818218231201, -0.0018458366394042969, -0.0016048550605773926, -0.0013638734817504883, -0.001122891902923584, -0.0008819103240966797, -0.0006409287452697754, -0.0003999471664428711, -0.0001589655876159668, 8.20159912109375e-05, 0.0003229975700378418, 0.0005639791488647461, 0.0008049607276916504, 0.0010459423065185547, 0.001286923885345459, 0.0015279054641723633, 0.0017688870429992676, 0.002009868621826172, 0.002250850200653076, 0.0024918317794799805, 0.0027328133583068848, 0.002973794937133789, 0.0032147765159606934, 0.0034557580947875977, 0.003696739673614502, 0.003937721252441406, 0.0041787028312683105, 0.004419684410095215, 0.004660665988922119, 0.0049016475677490234, 0.005142629146575928, 0.005383610725402832, 0.005624592304229736, 0.005865573883056641, 0.006106555461883545, 0.006347537040710449, 0.0065885186195373535, 0.006829500198364258, 0.007070481777191162, 0.007311463356018066, 0.007552444934844971, 0.007793426513671875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 2.0, 6.0, 6.0, 7.0, 10.0, 3.0, 8.0, 7.0, 22.0, 16.0, 12.0, 40.0, 22.0, 42.0, 58.0, 25.0, 76.0, 39.0, 85.0, 38.0, 84.0, 69.0, 34.0, 65.0, 27.0, 47.0, 31.0, 21.0, 21.0, 11.0, 18.0, 11.0, 6.0, 11.0, 6.0, 6.0, 7.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9802322387695312e-06, -2.8852373361587524e-06, -2.7902424335479736e-06, -2.695247530937195e-06, -2.600252628326416e-06, -2.505257725715637e-06, -2.4102628231048584e-06, -2.3152679204940796e-06, -2.2202730178833008e-06, -2.125278115272522e-06, -2.030283212661743e-06, -1.9352883100509644e-06, -1.8402934074401855e-06, -1.7452985048294067e-06, -1.650303602218628e-06, -1.5553086996078491e-06, -1.4603137969970703e-06, -1.3653188943862915e-06, -1.2703239917755127e-06, -1.1753290891647339e-06, -1.080334186553955e-06, -9.853392839431763e-07, -8.903443813323975e-07, -7.953494787216187e-07, -7.003545761108398e-07, -6.05359673500061e-07, -5.103647708892822e-07, -4.153698682785034e-07, -3.203749656677246e-07, -2.253800630569458e-07, -1.30385160446167e-07, -3.5390257835388184e-08, 5.960464477539063e-08, 1.5459954738616943e-07, 2.4959444999694824e-07, 3.4458935260772705e-07, 4.3958425521850586e-07, 5.345791578292847e-07, 6.295740604400635e-07, 7.245689630508423e-07, 8.195638656616211e-07, 9.145587682723999e-07, 1.0095536708831787e-06, 1.1045485734939575e-06, 1.1995434761047363e-06, 1.2945383787155151e-06, 1.389533281326294e-06, 1.4845281839370728e-06, 1.5795230865478516e-06, 1.6745179891586304e-06, 1.7695128917694092e-06, 1.864507794380188e-06, 1.959502696990967e-06, 2.0544975996017456e-06, 2.1494925022125244e-06, 2.2444874048233032e-06, 2.339482307434082e-06, 2.434477210044861e-06, 2.5294721126556396e-06, 2.6244670152664185e-06, 2.7194619178771973e-06, 2.814456820487976e-06, 2.909451723098755e-06, 3.0044466257095337e-06, 3.0994415283203125e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 8.0, 14.0, 25.0, 35.0, 52.0, 84.0, 138.0, 236.0, 408.0, 740.0, 1468.0, 3127.0, 7558.0, 18445.0, 48472.0, 134681.0, 316948.0, 309807.0, 128125.0, 46750.0, 17714.0, 7483.0, 2976.0, 1509.0, 730.0, 391.0, 213.0, 159.0, 85.0, 63.0, 43.0, 17.0, 14.0, 12.0, 7.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0096588134765625, -0.009325504302978516, -0.008992195129394531, -0.008658885955810547, -0.008325576782226562, -0.007992267608642578, -0.007658958435058594, -0.007325649261474609, -0.006992340087890625, -0.006659030914306641, -0.006325721740722656, -0.005992412567138672, -0.0056591033935546875, -0.005325794219970703, -0.004992485046386719, -0.004659175872802734, -0.00432586669921875, -0.003992557525634766, -0.0036592483520507812, -0.003325939178466797, -0.0029926300048828125, -0.002659320831298828, -0.0023260116577148438, -0.0019927024841308594, -0.001659393310546875, -0.0013260841369628906, -0.0009927749633789062, -0.0006594657897949219, -0.0003261566162109375, 7.152557373046875e-06, 0.00034046173095703125, 0.0006737709045410156, 0.001007080078125, 0.0013403892517089844, 0.0016736984252929688, 0.002007007598876953, 0.0023403167724609375, 0.002673625946044922, 0.0030069351196289062, 0.0033402442932128906, 0.003673553466796875, 0.004006862640380859, 0.004340171813964844, 0.004673480987548828, 0.0050067901611328125, 0.005340099334716797, 0.005673408508300781, 0.006006717681884766, 0.00634002685546875, 0.006673336029052734, 0.007006645202636719, 0.007339954376220703, 0.0076732635498046875, 0.008006572723388672, 0.008339881896972656, 0.00867319107055664, 0.009006500244140625, 0.00933980941772461, 0.009673118591308594, 0.010006427764892578, 0.010339736938476562, 0.010673046112060547, 0.011006355285644531, 0.011339664459228516, 0.0116729736328125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 6.0, 3.0, 7.0, 6.0, 2.0, 8.0, 17.0, 21.0, 27.0, 42.0, 38.0, 49.0, 75.0, 81.0, 93.0, 81.0, 99.0, 70.0, 59.0, 49.0, 47.0, 36.0, 19.0, 19.0, 14.0, 9.0, 9.0, 2.0, 4.0, 4.0, 2.0, 0.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01317596435546875, -0.012691855430603027, -0.012207746505737305, -0.011723637580871582, -0.01123952865600586, -0.010755419731140137, -0.010271310806274414, -0.009787201881408691, -0.009303092956542969, -0.008818984031677246, -0.008334875106811523, -0.0078507661819458, -0.007366657257080078, -0.0068825483322143555, -0.006398439407348633, -0.00591433048248291, -0.0054302215576171875, -0.004946112632751465, -0.004462003707885742, -0.0039778947830200195, -0.003493785858154297, -0.0030096769332885742, -0.0025255680084228516, -0.002041459083557129, -0.0015573501586914062, -0.0010732412338256836, -0.0005891323089599609, -0.00010502338409423828, 0.0003790855407714844, 0.000863194465637207, 0.0013473033905029297, 0.0018314123153686523, 0.002315521240234375, 0.0027996301651000977, 0.0032837390899658203, 0.003767848014831543, 0.004251956939697266, 0.004736065864562988, 0.005220174789428711, 0.005704283714294434, 0.006188392639160156, 0.006672501564025879, 0.0071566104888916016, 0.007640719413757324, 0.008124828338623047, 0.00860893726348877, 0.009093046188354492, 0.009577155113220215, 0.010061264038085938, 0.01054537296295166, 0.011029481887817383, 0.011513590812683105, 0.011997699737548828, 0.01248180866241455, 0.012965917587280273, 0.013450026512145996, 0.013934135437011719, 0.014418244361877441, 0.014902353286743164, 0.015386462211608887, 0.01587057113647461, 0.016354680061340332, 0.016838788986206055, 0.017322897911071777, 0.0178070068359375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 5.0, 8.0, 11.0, 30.0, 51.0, 86.0, 134.0, 170.0, 177.0, 133.0, 85.0, 43.0, 25.0, 15.0, 10.0, 6.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.207394078373909, -0.2006072700023651, -0.19382047653198242, -0.18703366816043854, -0.18024685978889465, -0.17346005141735077, -0.16667324304580688, -0.1598864495754242, -0.1530996412038803, -0.14631283283233643, -0.13952603936195374, -0.13273923099040985, -0.12595242261886597, -0.11916561424732208, -0.1123788133263588, -0.10559201240539551, -0.09880520403385162, -0.09201839566230774, -0.08523159474134445, -0.07844479382038116, -0.07165798544883728, -0.0648711770772934, -0.05808437615633011, -0.05129757151007652, -0.04451076686382294, -0.03772396221756935, -0.030937157571315765, -0.02415035292506218, -0.017363548278808594, -0.010576743632555008, -0.003789938986301422, 0.0029968656599521637, 0.00978367030620575, 0.016570474952459335, 0.02335727959871292, 0.030144084244966507, 0.03693088889122009, 0.04371769353747368, 0.050504498183727264, 0.05729130282998085, 0.06407810747623444, 0.07086491584777832, 0.07765171676874161, 0.0844385176897049, 0.09122532606124878, 0.09801213443279266, 0.10479893535375595, 0.11158573627471924, 0.11837254464626312, 0.125159353017807, 0.1319461464881897, 0.13873295485973358, 0.14551976323127747, 0.15230657160282135, 0.15909337997436523, 0.16588017344474792, 0.1726669818162918, 0.1794537901878357, 0.18624058365821838, 0.19302739202976227, 0.19981420040130615, 0.20660100877285004, 0.21338781714439392, 0.2201746106147766, 0.2269614189863205]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 1.0, 4.0, 4.0, 6.0, 6.0, 8.0, 16.0, 14.0, 16.0, 14.0, 24.0, 14.0, 23.0, 23.0, 29.0, 29.0, 26.0, 34.0, 39.0, 34.0, 41.0, 36.0, 34.0, 55.0, 41.0, 46.0, 40.0, 38.0, 40.0, 42.0, 24.0, 23.0, 23.0, 21.0, 19.0, 16.0, 17.0, 19.0, 10.0, 12.0, 8.0, 6.0, 9.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.1774510145187378, -0.17206040024757385, -0.1666697859764099, -0.16127917170524597, -0.15588855743408203, -0.15049795806407928, -0.14510734379291534, -0.1397167295217514, -0.13432611525058746, -0.12893550097942352, -0.12354488670825958, -0.11815427988767624, -0.1127636656165123, -0.10737305134534836, -0.10198244452476501, -0.09659183025360107, -0.09120121598243713, -0.0858106017112732, -0.08041998744010925, -0.07502938061952591, -0.06963876634836197, -0.06424815207719803, -0.05885754153132439, -0.053466930985450745, -0.048076316714286804, -0.042685702443122864, -0.03729509189724922, -0.03190448135137558, -0.02651386708021164, -0.021123254671692848, -0.015732642263174057, -0.010342031717300415, -0.004951417446136475, 0.0004391949623823166, 0.005829807370901108, 0.011220419779419899, 0.01661103218793869, 0.02200164459645748, 0.027392257004976273, 0.032782867550849915, 0.038173481822013855, 0.043564096093177795, 0.04895470663905144, 0.05434531718492508, 0.05973593145608902, 0.06512654572725296, 0.0705171525478363, 0.07590776681900024, 0.08129838109016418, 0.08668899536132812, 0.09207960963249207, 0.09747021645307541, 0.10286083072423935, 0.10825144499540329, 0.11364205181598663, 0.11903266608715057, 0.12442328035831451, 0.12981389462947845, 0.1352045089006424, 0.14059512317180634, 0.14598572254180908, 0.15137633681297302, 0.15676695108413696, 0.1621575653553009, 0.16754817962646484]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 13.0, 22.0, 27.0, 43.0, 50.0, 105.0, 150.0, 288.0, 597.0, 1960.0, 4587.0, 16639.0, 150571.0, 1670487.0, 2041192.0, 265407.0, 30006.0, 8809.0, 2218.0, 534.0, 233.0, 156.0, 77.0, 46.0, 25.0, 10.0, 6.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045867919921875, -0.0442352294921875, -0.0426025390625, -0.0409698486328125, -0.039337158203125, -0.0377044677734375, -0.03607177734375, -0.0344390869140625, -0.032806396484375, -0.0311737060546875, -0.029541015625, -0.0279083251953125, -0.026275634765625, -0.0246429443359375, -0.02301025390625, -0.0213775634765625, -0.019744873046875, -0.0181121826171875, -0.0164794921875, -0.0148468017578125, -0.013214111328125, -0.0115814208984375, -0.00994873046875, -0.0083160400390625, -0.006683349609375, -0.0050506591796875, -0.00341796875, -0.0017852783203125, -0.000152587890625, 0.0014801025390625, 0.00311279296875, 0.0047454833984375, 0.006378173828125, 0.0080108642578125, 0.0096435546875, 0.0112762451171875, 0.012908935546875, 0.0145416259765625, 0.01617431640625, 0.0178070068359375, 0.019439697265625, 0.0210723876953125, 0.022705078125, 0.0243377685546875, 0.025970458984375, 0.0276031494140625, 0.02923583984375, 0.0308685302734375, 0.032501220703125, 0.0341339111328125, 0.0357666015625, 0.0373992919921875, 0.039031982421875, 0.0406646728515625, 0.04229736328125, 0.0439300537109375, 0.045562744140625, 0.0471954345703125, 0.048828125, 0.0504608154296875, 0.052093505859375, 0.0537261962890625, 0.05535888671875, 0.0569915771484375, 0.058624267578125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 13.0, 5.0, 19.0, 27.0, 30.0, 37.0, 50.0, 77.0, 68.0, 79.0, 83.0, 91.0, 75.0, 80.0, 64.0, 48.0, 52.0, 37.0, 24.0, 14.0, 6.0, 5.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054534912109375, -0.05282163619995117, -0.051108360290527344, -0.049395084381103516, -0.04768180847167969, -0.04596853256225586, -0.04425525665283203, -0.0425419807434082, -0.040828704833984375, -0.03911542892456055, -0.03740215301513672, -0.03568887710571289, -0.03397560119628906, -0.032262325286865234, -0.030549049377441406, -0.028835773468017578, -0.02712249755859375, -0.025409221649169922, -0.023695945739746094, -0.021982669830322266, -0.020269393920898438, -0.01855611801147461, -0.01684284210205078, -0.015129566192626953, -0.013416290283203125, -0.011703014373779297, -0.009989738464355469, -0.00827646255493164, -0.0065631866455078125, -0.004849910736083984, -0.0031366348266601562, -0.0014233589172363281, 0.0002899169921875, 0.002003192901611328, 0.0037164688110351562, 0.005429744720458984, 0.0071430206298828125, 0.00885629653930664, 0.010569572448730469, 0.012282848358154297, 0.013996124267578125, 0.015709400177001953, 0.01742267608642578, 0.01913595199584961, 0.020849227905273438, 0.022562503814697266, 0.024275779724121094, 0.025989055633544922, 0.02770233154296875, 0.029415607452392578, 0.031128883361816406, 0.032842159271240234, 0.03455543518066406, 0.03626871109008789, 0.03798198699951172, 0.03969526290893555, 0.041408538818359375, 0.0431218147277832, 0.04483509063720703, 0.04654836654663086, 0.04826164245605469, 0.049974918365478516, 0.051688194274902344, 0.05340147018432617, 0.05511474609375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 4.0, 7.0, 11.0, 19.0, 29.0, 38.0, 58.0, 87.0, 146.0, 210.0, 344.0, 484.0, 830.0, 1500.0, 2626.0, 5125.0, 10902.0, 25484.0, 68898.0, 240156.0, 1289508.0, 1968206.0, 411654.0, 102085.0, 35789.0, 14901.0, 6652.0, 3627.0, 1861.0, 1138.0, 661.0, 436.0, 265.0, 191.0, 122.0, 58.0, 58.0, 28.0, 26.0, 13.0, 14.0, 6.0, 4.0, 3.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02581787109375, -0.024989604949951172, -0.024161338806152344, -0.023333072662353516, -0.022504806518554688, -0.02167654037475586, -0.02084827423095703, -0.020020008087158203, -0.019191741943359375, -0.018363475799560547, -0.01753520965576172, -0.01670694351196289, -0.015878677368164062, -0.015050411224365234, -0.014222145080566406, -0.013393878936767578, -0.01256561279296875, -0.011737346649169922, -0.010909080505371094, -0.010080814361572266, -0.009252548217773438, -0.00842428207397461, -0.007596015930175781, -0.006767749786376953, -0.005939483642578125, -0.005111217498779297, -0.004282951354980469, -0.0034546852111816406, -0.0026264190673828125, -0.0017981529235839844, -0.0009698867797851562, -0.00014162063598632812, 0.0006866455078125, 0.0015149116516113281, 0.0023431777954101562, 0.0031714439392089844, 0.0039997100830078125, 0.004827976226806641, 0.005656242370605469, 0.006484508514404297, 0.007312774658203125, 0.008141040802001953, 0.008969306945800781, 0.00979757308959961, 0.010625839233398438, 0.011454105377197266, 0.012282371520996094, 0.013110637664794922, 0.01393890380859375, 0.014767169952392578, 0.015595436096191406, 0.016423702239990234, 0.017251968383789062, 0.01808023452758789, 0.01890850067138672, 0.019736766815185547, 0.020565032958984375, 0.021393299102783203, 0.02222156524658203, 0.02304983139038086, 0.023878097534179688, 0.024706363677978516, 0.025534629821777344, 0.026362895965576172, 0.027191162109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 8.0, 8.0, 7.0, 13.0, 13.0, 22.0, 25.0, 38.0, 52.0, 78.0, 139.0, 234.0, 405.0, 558.0, 687.0, 561.0, 426.0, 261.0, 149.0, 87.0, 68.0, 42.0, 41.0, 28.0, 16.0, 13.0, 21.0, 20.0, 8.0, 9.0, 4.0, 7.0, 4.0, 5.0, 7.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.043853759765625, -0.042467594146728516, -0.04108142852783203, -0.03969526290893555, -0.03830909729003906, -0.03692293167114258, -0.035536766052246094, -0.03415060043334961, -0.032764434814453125, -0.03137826919555664, -0.029992103576660156, -0.028605937957763672, -0.027219772338867188, -0.025833606719970703, -0.02444744110107422, -0.023061275482177734, -0.02167510986328125, -0.020288944244384766, -0.01890277862548828, -0.017516613006591797, -0.016130447387695312, -0.014744281768798828, -0.013358116149902344, -0.01197195053100586, -0.010585784912109375, -0.00919961929321289, -0.007813453674316406, -0.006427288055419922, -0.0050411224365234375, -0.003654956817626953, -0.0022687911987304688, -0.0008826255798339844, 0.0005035400390625, 0.0018897056579589844, 0.0032758712768554688, 0.004662036895751953, 0.0060482025146484375, 0.007434368133544922, 0.008820533752441406, 0.01020669937133789, 0.011592864990234375, 0.01297903060913086, 0.014365196228027344, 0.015751361846923828, 0.017137527465820312, 0.018523693084716797, 0.01990985870361328, 0.021296024322509766, 0.02268218994140625, 0.024068355560302734, 0.02545452117919922, 0.026840686798095703, 0.028226852416992188, 0.029613018035888672, 0.030999183654785156, 0.03238534927368164, 0.033771514892578125, 0.03515768051147461, 0.036543846130371094, 0.03793001174926758, 0.03931617736816406, 0.04070234298706055, 0.04208850860595703, 0.043474674224853516, 0.04486083984375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 16.0, 20.0, 74.0, 138.0, 238.0, 218.0, 168.0, 81.0, 25.0, 11.0, 8.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4074813425540924, -0.39605218172073364, -0.3846230208873749, -0.3731938600540161, -0.36176466941833496, -0.3503355085849762, -0.33890634775161743, -0.32747718691825867, -0.3160480260848999, -0.30461886525154114, -0.2931897044181824, -0.2817605137825012, -0.27033135294914246, -0.2589021921157837, -0.24747303128242493, -0.23604387044906616, -0.224614679813385, -0.21318551898002625, -0.2017563432455063, -0.19032718241214752, -0.17889800667762756, -0.1674688458442688, -0.15603968501091003, -0.14461052417755127, -0.1331813484430313, -0.12175218015909195, -0.11032301187515259, -0.09889385104179382, -0.08746468275785446, -0.0760355144739151, -0.06460635364055634, -0.053177185356616974, -0.041747987270355225, -0.030318820849061012, -0.0188896544277668, -0.007460489869117737, 0.003968678414821625, 0.015397846698760986, 0.02682700753211975, 0.03825617581605911, 0.049685344099998474, 0.061114512383937836, 0.0725436806678772, 0.08397284150123596, 0.09540200978517532, 0.10683117806911469, 0.11826033890247345, 0.1296895146369934, 0.14111867547035217, 0.15254783630371094, 0.1639770120382309, 0.17540617287158966, 0.18683534860610962, 0.19826450943946838, 0.20969367027282715, 0.2211228311061859, 0.23255200684070587, 0.24398116767406464, 0.2554103434085846, 0.26683950424194336, 0.2782686650753021, 0.2896978259086609, 0.30112701654434204, 0.3125561773777008, 0.32398533821105957]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 7.0, 11.0, 11.0, 7.0, 9.0, 11.0, 16.0, 14.0, 22.0, 18.0, 19.0, 26.0, 24.0, 31.0, 23.0, 33.0, 41.0, 56.0, 38.0, 46.0, 36.0, 46.0, 42.0, 38.0, 39.0, 41.0, 37.0, 21.0, 27.0, 31.0, 26.0, 20.0, 22.0, 21.0, 22.0, 16.0, 10.0, 9.0, 5.0, 3.0, 8.0, 8.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1263020634651184, -0.12204372882843018, -0.11778539419174194, -0.11352705955505371, -0.10926872491836548, -0.10501039028167725, -0.10075204819440842, -0.09649371355772018, -0.09223537892103195, -0.08797704428434372, -0.08371870964765549, -0.07946037501096725, -0.07520203292369843, -0.07094369828701019, -0.06668536365032196, -0.06242702901363373, -0.058168694376945496, -0.05391035974025726, -0.04965202510356903, -0.0453936867415905, -0.04113535210490227, -0.036877017468214035, -0.032618679106235504, -0.02836034446954727, -0.02410200983285904, -0.019843675196170807, -0.015585338696837425, -0.011327003128826618, -0.007068667560815811, -0.0028103329241275787, 0.001448003575205803, 0.005706340074539185, 0.009964674711227417, 0.014223010279238224, 0.01848134584724903, 0.022739682346582413, 0.026998016983270645, 0.03125635161995888, 0.03551468998193741, 0.03977302461862564, 0.04403135925531387, 0.048289693892002106, 0.05254802852869034, 0.05680636689066887, 0.0610647015273571, 0.06532303988933563, 0.06958137452602386, 0.0738397091627121, 0.07809804379940033, 0.08235637843608856, 0.0866147130727768, 0.09087304770946503, 0.09513138234615326, 0.09938971698284149, 0.10364805907011032, 0.10790639370679855, 0.11216472834348679, 0.11642306298017502, 0.12068139761686325, 0.12493973225355148, 0.1291980743408203, 0.13345640897750854, 0.13771474361419678, 0.141973078250885, 0.14623141288757324]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 4.0, 10.0, 13.0, 14.0, 17.0, 25.0, 43.0, 70.0, 79.0, 124.0, 155.0, 224.0, 395.0, 641.0, 1227.0, 2353.0, 5262.0, 13603.0, 37699.0, 115854.0, 335931.0, 347653.0, 122189.0, 39808.0, 14154.0, 5537.0, 2432.0, 1156.0, 632.0, 395.0, 254.0, 189.0, 115.0, 91.0, 61.0, 46.0, 29.0, 25.0, 10.0, 5.0, 9.0, 6.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.042083740234375, -0.04076957702636719, -0.039455413818359375, -0.03814125061035156, -0.03682708740234375, -0.03551292419433594, -0.034198760986328125, -0.03288459777832031, -0.0315704345703125, -0.030256271362304688, -0.028942108154296875, -0.027627944946289062, -0.02631378173828125, -0.024999618530273438, -0.023685455322265625, -0.022371292114257812, -0.02105712890625, -0.019742965698242188, -0.018428802490234375, -0.017114639282226562, -0.01580047607421875, -0.014486312866210938, -0.013172149658203125, -0.011857986450195312, -0.0105438232421875, -0.009229660034179688, -0.007915496826171875, -0.0066013336181640625, -0.00528717041015625, -0.0039730072021484375, -0.002658843994140625, -0.0013446807861328125, -3.0517578125e-05, 0.0012836456298828125, 0.002597808837890625, 0.0039119720458984375, 0.00522613525390625, 0.0065402984619140625, 0.007854461669921875, 0.009168624877929688, 0.0104827880859375, 0.011796951293945312, 0.013111114501953125, 0.014425277709960938, 0.01573944091796875, 0.017053604125976562, 0.018367767333984375, 0.019681930541992188, 0.02099609375, 0.022310256958007812, 0.023624420166015625, 0.024938583374023438, 0.02625274658203125, 0.027566909790039062, 0.028881072998046875, 0.030195236206054688, 0.0315093994140625, 0.03282356262207031, 0.034137725830078125, 0.03545188903808594, 0.03676605224609375, 0.03808021545410156, 0.039394378662109375, 0.04070854187011719, 0.042022705078125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 4.0, 15.0, 18.0, 21.0, 30.0, 35.0, 52.0, 59.0, 80.0, 104.0, 86.0, 82.0, 85.0, 78.0, 68.0, 51.0, 25.0, 31.0, 25.0, 10.0, 12.0, 6.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.057403564453125, -0.055922508239746094, -0.05444145202636719, -0.05296039581298828, -0.051479339599609375, -0.04999828338623047, -0.04851722717285156, -0.047036170959472656, -0.04555511474609375, -0.044074058532714844, -0.04259300231933594, -0.04111194610595703, -0.039630889892578125, -0.03814983367919922, -0.03666877746582031, -0.035187721252441406, -0.0337066650390625, -0.032225608825683594, -0.030744552612304688, -0.02926349639892578, -0.027782440185546875, -0.02630138397216797, -0.024820327758789062, -0.023339271545410156, -0.02185821533203125, -0.020377159118652344, -0.018896102905273438, -0.01741504669189453, -0.015933990478515625, -0.014452934265136719, -0.012971878051757812, -0.011490821838378906, -0.010009765625, -0.008528709411621094, -0.0070476531982421875, -0.005566596984863281, -0.004085540771484375, -0.0026044845581054688, -0.0011234283447265625, 0.00035762786865234375, 0.00183868408203125, 0.0033197402954101562, 0.0048007965087890625, 0.006281852722167969, 0.007762908935546875, 0.009243965148925781, 0.010725021362304688, 0.012206077575683594, 0.0136871337890625, 0.015168190002441406, 0.016649246215820312, 0.01813030242919922, 0.019611358642578125, 0.02109241485595703, 0.022573471069335938, 0.024054527282714844, 0.02553558349609375, 0.027016639709472656, 0.028497695922851562, 0.02997875213623047, 0.031459808349609375, 0.03294086456298828, 0.03442192077636719, 0.035902976989746094, 0.037384033203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 8.0, 10.0, 10.0, 18.0, 27.0, 44.0, 57.0, 82.0, 106.0, 147.0, 204.0, 335.0, 494.0, 804.0, 1541.0, 3133.0, 7003.0, 17860.0, 49576.0, 147191.0, 373776.0, 290308.0, 98073.0, 34277.0, 12625.0, 5280.0, 2365.0, 1194.0, 670.0, 448.0, 249.0, 171.0, 132.0, 84.0, 71.0, 47.0, 41.0, 24.0, 18.0, 16.0, 9.0, 11.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.040252685546875, -0.03894662857055664, -0.03764057159423828, -0.03633451461791992, -0.03502845764160156, -0.0337224006652832, -0.032416343688964844, -0.031110286712646484, -0.029804229736328125, -0.028498172760009766, -0.027192115783691406, -0.025886058807373047, -0.024580001831054688, -0.023273944854736328, -0.02196788787841797, -0.02066183090209961, -0.01935577392578125, -0.01804971694946289, -0.01674365997314453, -0.015437602996826172, -0.014131546020507812, -0.012825489044189453, -0.011519432067871094, -0.010213375091552734, -0.008907318115234375, -0.007601261138916016, -0.006295204162597656, -0.004989147186279297, -0.0036830902099609375, -0.002377033233642578, -0.0010709762573242188, 0.00023508071899414062, 0.0015411376953125, 0.0028471946716308594, 0.004153251647949219, 0.005459308624267578, 0.0067653656005859375, 0.008071422576904297, 0.009377479553222656, 0.010683536529541016, 0.011989593505859375, 0.013295650482177734, 0.014601707458496094, 0.015907764434814453, 0.017213821411132812, 0.018519878387451172, 0.01982593536376953, 0.02113199234008789, 0.02243804931640625, 0.02374410629272461, 0.02505016326904297, 0.026356220245361328, 0.027662277221679688, 0.028968334197998047, 0.030274391174316406, 0.031580448150634766, 0.032886505126953125, 0.034192562103271484, 0.035498619079589844, 0.0368046760559082, 0.03811073303222656, 0.03941679000854492, 0.04072284698486328, 0.04202890396118164, 0.0433349609375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 5.0, 11.0, 7.0, 11.0, 13.0, 10.0, 16.0, 26.0, 25.0, 34.0, 32.0, 32.0, 37.0, 44.0, 35.0, 54.0, 45.0, 56.0, 47.0, 52.0, 41.0, 46.0, 51.0, 38.0, 38.0, 29.0, 24.0, 25.0, 17.0, 22.0, 17.0, 13.0, 9.0, 11.0, 10.0, 9.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07476806640625, -0.07240676879882812, -0.07004547119140625, -0.06768417358398438, -0.0653228759765625, -0.06296157836914062, -0.06060028076171875, -0.058238983154296875, -0.055877685546875, -0.053516387939453125, -0.05115509033203125, -0.048793792724609375, -0.0464324951171875, -0.044071197509765625, -0.04170989990234375, -0.039348602294921875, -0.0369873046875, -0.034626007080078125, -0.03226470947265625, -0.029903411865234375, -0.0275421142578125, -0.025180816650390625, -0.02281951904296875, -0.020458221435546875, -0.018096923828125, -0.015735626220703125, -0.01337432861328125, -0.011013031005859375, -0.0086517333984375, -0.006290435791015625, -0.00392913818359375, -0.001567840576171875, 0.00079345703125, 0.003154754638671875, 0.00551605224609375, 0.007877349853515625, 0.0102386474609375, 0.012599945068359375, 0.01496124267578125, 0.017322540283203125, 0.019683837890625, 0.022045135498046875, 0.02440643310546875, 0.026767730712890625, 0.0291290283203125, 0.031490325927734375, 0.03385162353515625, 0.036212921142578125, 0.03857421875, 0.040935516357421875, 0.04329681396484375, 0.045658111572265625, 0.0480194091796875, 0.050380706787109375, 0.05274200439453125, 0.055103302001953125, 0.057464599609375, 0.059825897216796875, 0.06218719482421875, 0.06454849243164062, 0.0669097900390625, 0.06927108764648438, 0.07163238525390625, 0.07399368286132812, 0.07635498046875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 8.0, 15.0, 9.0, 19.0, 28.0, 41.0, 58.0, 91.0, 140.0, 170.0, 236.0, 383.0, 587.0, 889.0, 1378.0, 2340.0, 4432.0, 10249.0, 26074.0, 77846.0, 249272.0, 418055.0, 167373.0, 53700.0, 18581.0, 7496.0, 3674.0, 1959.0, 1231.0, 708.0, 480.0, 343.0, 208.0, 148.0, 98.0, 70.0, 54.0, 31.0, 29.0, 11.0, 12.0, 7.0, 12.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01424407958984375, -0.013803482055664062, -0.013362884521484375, -0.012922286987304688, -0.012481689453125, -0.012041091918945312, -0.011600494384765625, -0.011159896850585938, -0.01071929931640625, -0.010278701782226562, -0.009838104248046875, -0.009397506713867188, -0.0089569091796875, -0.008516311645507812, -0.008075714111328125, -0.0076351165771484375, -0.00719451904296875, -0.0067539215087890625, -0.006313323974609375, -0.0058727264404296875, -0.00543212890625, -0.0049915313720703125, -0.004550933837890625, -0.0041103363037109375, -0.00366973876953125, -0.0032291412353515625, -0.002788543701171875, -0.0023479461669921875, -0.0019073486328125, -0.0014667510986328125, -0.001026153564453125, -0.0005855560302734375, -0.00014495849609375, 0.0002956390380859375, 0.000736236572265625, 0.0011768341064453125, 0.001617431640625, 0.0020580291748046875, 0.002498626708984375, 0.0029392242431640625, 0.00337982177734375, 0.0038204193115234375, 0.004261016845703125, 0.0047016143798828125, 0.0051422119140625, 0.0055828094482421875, 0.006023406982421875, 0.0064640045166015625, 0.00690460205078125, 0.0073451995849609375, 0.007785797119140625, 0.008226394653320312, 0.0086669921875, 0.009107589721679688, 0.009548187255859375, 0.009988784790039062, 0.01042938232421875, 0.010869979858398438, 0.011310577392578125, 0.011751174926757812, 0.0121917724609375, 0.012632369995117188, 0.013072967529296875, 0.013513565063476562, 0.01395416259765625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 7.0, 9.0, 14.0, 26.0, 49.0, 91.0, 117.0, 142.0, 172.0, 117.0, 106.0, 59.0, 31.0, 20.0, 15.0, 12.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.702278137207031e-06, -8.440576493740082e-06, -8.178874850273132e-06, -7.917173206806183e-06, -7.655471563339233e-06, -7.393769919872284e-06, -7.1320682764053345e-06, -6.870366632938385e-06, -6.6086649894714355e-06, -6.346963346004486e-06, -6.085261702537537e-06, -5.823560059070587e-06, -5.561858415603638e-06, -5.300156772136688e-06, -5.038455128669739e-06, -4.776753485202789e-06, -4.51505184173584e-06, -4.25335019826889e-06, -3.991648554801941e-06, -3.7299469113349915e-06, -3.468245267868042e-06, -3.2065436244010925e-06, -2.944841980934143e-06, -2.6831403374671936e-06, -2.421438694000244e-06, -2.1597370505332947e-06, -1.8980354070663452e-06, -1.6363337635993958e-06, -1.3746321201324463e-06, -1.1129304766654968e-06, -8.512288331985474e-07, -5.895271897315979e-07, -3.2782554626464844e-07, -6.612390279769897e-08, 1.955777406692505e-07, 4.5727938413619995e-07, 7.189810276031494e-07, 9.806826710700989e-07, 1.2423843145370483e-06, 1.5040859580039978e-06, 1.7657876014709473e-06, 2.0274892449378967e-06, 2.289190888404846e-06, 2.5508925318717957e-06, 2.812594175338745e-06, 3.0742958188056946e-06, 3.335997462272644e-06, 3.5976991057395935e-06, 3.859400749206543e-06, 4.1211023926734924e-06, 4.382804036140442e-06, 4.644505679607391e-06, 4.906207323074341e-06, 5.16790896654129e-06, 5.42961061000824e-06, 5.691312253475189e-06, 5.953013896942139e-06, 6.214715540409088e-06, 6.476417183876038e-06, 6.738118827342987e-06, 6.9998204708099365e-06, 7.261522114276886e-06, 7.5232237577438354e-06, 7.784925401210785e-06, 8.046627044677734e-06]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 8.0, 9.0, 19.0, 19.0, 30.0, 45.0, 72.0, 103.0, 181.0, 245.0, 414.0, 690.0, 1187.0, 2277.0, 4927.0, 13816.0, 44989.0, 160639.0, 456905.0, 257224.0, 70282.0, 20641.0, 7222.0, 2880.0, 1515.0, 846.0, 511.0, 283.0, 196.0, 133.0, 78.0, 52.0, 38.0, 31.0, 13.0, 10.0, 11.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0159759521484375, -0.015501618385314941, -0.015027284622192383, -0.014552950859069824, -0.014078617095947266, -0.013604283332824707, -0.013129949569702148, -0.01265561580657959, -0.012181282043457031, -0.011706948280334473, -0.011232614517211914, -0.010758280754089355, -0.010283946990966797, -0.009809613227844238, -0.00933527946472168, -0.008860945701599121, -0.008386611938476562, -0.007912278175354004, -0.007437944412231445, -0.006963610649108887, -0.006489276885986328, -0.0060149431228637695, -0.005540609359741211, -0.005066275596618652, -0.004591941833496094, -0.004117608070373535, -0.0036432743072509766, -0.003168940544128418, -0.0026946067810058594, -0.0022202730178833008, -0.0017459392547607422, -0.0012716054916381836, -0.000797271728515625, -0.0003229379653930664, 0.0001513957977294922, 0.0006257295608520508, 0.0011000633239746094, 0.001574397087097168, 0.0020487308502197266, 0.002523064613342285, 0.0029973983764648438, 0.0034717321395874023, 0.003946065902709961, 0.0044203996658325195, 0.004894733428955078, 0.005369067192077637, 0.005843400955200195, 0.006317734718322754, 0.0067920684814453125, 0.007266402244567871, 0.00774073600769043, 0.008215069770812988, 0.008689403533935547, 0.009163737297058105, 0.009638071060180664, 0.010112404823303223, 0.010586738586425781, 0.01106107234954834, 0.011535406112670898, 0.012009739875793457, 0.012484073638916016, 0.012958407402038574, 0.013432741165161133, 0.013907074928283691, 0.01438140869140625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 14.0, 9.0, 16.0, 26.0, 26.0, 26.0, 41.0, 59.0, 62.0, 94.0, 105.0, 122.0, 82.0, 103.0, 55.0, 35.0, 34.0, 23.0, 22.0, 11.0, 9.0, 8.0, 5.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0173187255859375, -0.01674342155456543, -0.01616811752319336, -0.015592813491821289, -0.015017509460449219, -0.014442205429077148, -0.013866901397705078, -0.013291597366333008, -0.012716293334960938, -0.012140989303588867, -0.011565685272216797, -0.010990381240844727, -0.010415077209472656, -0.009839773178100586, -0.009264469146728516, -0.008689165115356445, -0.008113861083984375, -0.007538557052612305, -0.006963253021240234, -0.006387948989868164, -0.005812644958496094, -0.0052373409271240234, -0.004662036895751953, -0.004086732864379883, -0.0035114288330078125, -0.002936124801635742, -0.002360820770263672, -0.0017855167388916016, -0.0012102127075195312, -0.0006349086761474609, -5.9604644775390625e-05, 0.0005156993865966797, 0.00109100341796875, 0.0016663074493408203, 0.0022416114807128906, 0.002816915512084961, 0.0033922195434570312, 0.0039675235748291016, 0.004542827606201172, 0.005118131637573242, 0.0056934356689453125, 0.006268739700317383, 0.006844043731689453, 0.0074193477630615234, 0.007994651794433594, 0.008569955825805664, 0.009145259857177734, 0.009720563888549805, 0.010295867919921875, 0.010871171951293945, 0.011446475982666016, 0.012021780014038086, 0.012597084045410156, 0.013172388076782227, 0.013747692108154297, 0.014322996139526367, 0.014898300170898438, 0.015473604202270508, 0.016048908233642578, 0.01662421226501465, 0.01719951629638672, 0.01777482032775879, 0.01835012435913086, 0.01892542839050293, 0.019500732421875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 20.0, 18.0, 47.0, 82.0, 123.0, 164.0, 174.0, 156.0, 100.0, 51.0, 28.0, 11.0, 5.0, 6.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.3411496877670288, -0.33350932598114014, -0.32586896419525146, -0.3182285726070404, -0.31058821082115173, -0.30294784903526306, -0.2953074872493744, -0.2876671254634857, -0.28002673387527466, -0.272386372089386, -0.2647460103034973, -0.25710561871528625, -0.24946525692939758, -0.2418248951435089, -0.23418453335762024, -0.22654417157173157, -0.2189038097858429, -0.21126344799995422, -0.20362307131290436, -0.19598270952701569, -0.18834233283996582, -0.18070197105407715, -0.17306160926818848, -0.1654212474822998, -0.15778087079524994, -0.15014050900936127, -0.1425001323223114, -0.13485977053642273, -0.12721940875053406, -0.11957903206348419, -0.11193867027759552, -0.10429830104112625, -0.09665794670581818, -0.08901757746934891, -0.08137720823287964, -0.07373684644699097, -0.0660964772105217, -0.05845610797405243, -0.05081574246287346, -0.04317537695169449, -0.03553500771522522, -0.0278946403414011, -0.02025427296757698, -0.012613905593752861, -0.0049735382199287415, 0.0026668310165405273, 0.010307196527719498, 0.017947562038898468, 0.025587931275367737, 0.033228300511837006, 0.040868666023015976, 0.048509031534194946, 0.056149400770664215, 0.06378977000713348, 0.07143013179302216, 0.07907050102949142, 0.0867108702659607, 0.09435123950242996, 0.10199160873889923, 0.1096319705247879, 0.11727233976125717, 0.12491270899772644, 0.1325530707836151, 0.14019343256950378, 0.14783380925655365]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 6.0, 2.0, 4.0, 7.0, 4.0, 7.0, 11.0, 8.0, 12.0, 19.0, 12.0, 9.0, 20.0, 22.0, 25.0, 21.0, 30.0, 28.0, 27.0, 34.0, 38.0, 29.0, 33.0, 44.0, 34.0, 38.0, 41.0, 41.0, 39.0, 39.0, 29.0, 33.0, 28.0, 28.0, 27.0, 24.0, 19.0, 21.0, 19.0, 20.0, 21.0, 8.0, 15.0, 8.0, 6.0, 2.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13038122653961182, -0.12594418227672577, -0.12150715291500092, -0.11707011610269547, -0.11263307929039001, -0.10819603502750397, -0.10375899821519852, -0.09932196140289307, -0.09488492459058762, -0.09044788777828217, -0.08601085096597672, -0.08157381415367126, -0.07713676989078522, -0.07269974052906036, -0.06826269626617432, -0.06382565945386887, -0.059388622641563416, -0.054951585829257965, -0.050514549016952515, -0.046077508479356766, -0.041640471667051315, -0.037203434854745865, -0.032766394317150116, -0.028329357504844666, -0.023892320692539215, -0.019455283880233765, -0.015018245205283165, -0.01058120746165514, -0.006144169718027115, -0.0017071329057216644, 0.0027299057692289352, 0.007166944444179535, 0.011603981256484985, 0.016041018068790436, 0.020478056743741035, 0.024915095418691635, 0.029352132230997086, 0.033789169043302536, 0.038226209580898285, 0.042663246393203735, 0.047100283205509186, 0.051537320017814636, 0.05597435683012009, 0.060411397367715836, 0.06484843790531158, 0.06928546726703644, 0.07372251152992249, 0.07815954834222794, 0.08259658515453339, 0.08703362196683884, 0.09147065877914429, 0.09590769559144974, 0.10034473240375519, 0.10478177666664124, 0.10921881347894669, 0.11365585029125214, 0.11809288710355759, 0.12252992391586304, 0.12696696817874908, 0.13140399754047394, 0.13584104180335999, 0.14027807116508484, 0.1447151154279709, 0.14915215969085693, 0.1535891890525818]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 10.0, 11.0, 16.0, 32.0, 56.0, 86.0, 133.0, 258.0, 442.0, 1262.0, 3218.0, 9441.0, 39188.0, 343121.0, 1929458.0, 1595437.0, 224638.0, 31186.0, 10322.0, 4284.0, 1006.0, 327.0, 184.0, 69.0, 37.0, 29.0, 18.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04754638671875, -0.04605674743652344, -0.044567108154296875, -0.04307746887207031, -0.04158782958984375, -0.04009819030761719, -0.038608551025390625, -0.03711891174316406, -0.0356292724609375, -0.03413963317871094, -0.032649993896484375, -0.031160354614257812, -0.02967071533203125, -0.028181076049804688, -0.026691436767578125, -0.025201797485351562, -0.023712158203125, -0.022222518920898438, -0.020732879638671875, -0.019243240356445312, -0.01775360107421875, -0.016263961791992188, -0.014774322509765625, -0.013284683227539062, -0.0117950439453125, -0.010305404663085938, -0.008815765380859375, -0.0073261260986328125, -0.00583648681640625, -0.0043468475341796875, -0.002857208251953125, -0.0013675689697265625, 0.0001220703125, 0.0016117095947265625, 0.003101348876953125, 0.0045909881591796875, 0.00608062744140625, 0.0075702667236328125, 0.009059906005859375, 0.010549545288085938, 0.0120391845703125, 0.013528823852539062, 0.015018463134765625, 0.016508102416992188, 0.01799774169921875, 0.019487380981445312, 0.020977020263671875, 0.022466659545898438, 0.023956298828125, 0.025445938110351562, 0.026935577392578125, 0.028425216674804688, 0.02991485595703125, 0.03140449523925781, 0.032894134521484375, 0.03438377380371094, 0.0358734130859375, 0.03736305236816406, 0.038852691650390625, 0.04034233093261719, 0.04183197021484375, 0.04332160949707031, 0.044811248779296875, 0.04630088806152344, 0.04779052734375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 6.0, 12.0, 22.0, 27.0, 38.0, 44.0, 87.0, 83.0, 74.0, 82.0, 85.0, 91.0, 86.0, 70.0, 52.0, 47.0, 35.0, 15.0, 16.0, 14.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05718994140625, -0.055408477783203125, -0.05362701416015625, -0.051845550537109375, -0.0500640869140625, -0.048282623291015625, -0.04650115966796875, -0.044719696044921875, -0.042938232421875, -0.041156768798828125, -0.03937530517578125, -0.037593841552734375, -0.0358123779296875, -0.034030914306640625, -0.03224945068359375, -0.030467987060546875, -0.0286865234375, -0.026905059814453125, -0.02512359619140625, -0.023342132568359375, -0.0215606689453125, -0.019779205322265625, -0.01799774169921875, -0.016216278076171875, -0.014434814453125, -0.012653350830078125, -0.01087188720703125, -0.009090423583984375, -0.0073089599609375, -0.005527496337890625, -0.00374603271484375, -0.001964569091796875, -0.00018310546875, 0.001598358154296875, 0.00337982177734375, 0.005161285400390625, 0.0069427490234375, 0.008724212646484375, 0.01050567626953125, 0.012287139892578125, 0.014068603515625, 0.015850067138671875, 0.01763153076171875, 0.019412994384765625, 0.0211944580078125, 0.022975921630859375, 0.02475738525390625, 0.026538848876953125, 0.0283203125, 0.030101776123046875, 0.03188323974609375, 0.033664703369140625, 0.0354461669921875, 0.037227630615234375, 0.03900909423828125, 0.040790557861328125, 0.042572021484375, 0.044353485107421875, 0.04613494873046875, 0.047916412353515625, 0.0496978759765625, 0.051479339599609375, 0.05326080322265625, 0.055042266845703125, 0.05682373046875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 10.0, 14.0, 18.0, 26.0, 52.0, 69.0, 125.0, 256.0, 481.0, 1008.0, 2411.0, 7260.0, 28391.0, 138452.0, 1190274.0, 2451731.0, 301940.0, 52412.0, 12510.0, 3851.0, 1467.0, 632.0, 385.0, 212.0, 109.0, 69.0, 38.0, 21.0, 18.0, 9.0, 11.0, 10.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.042083740234375, -0.04069042205810547, -0.03929710388183594, -0.037903785705566406, -0.036510467529296875, -0.035117149353027344, -0.03372383117675781, -0.03233051300048828, -0.03093719482421875, -0.02954387664794922, -0.028150558471679688, -0.026757240295410156, -0.025363922119140625, -0.023970603942871094, -0.022577285766601562, -0.02118396759033203, -0.0197906494140625, -0.01839733123779297, -0.017004013061523438, -0.015610694885253906, -0.014217376708984375, -0.012824058532714844, -0.011430740356445312, -0.010037422180175781, -0.00864410400390625, -0.007250785827636719, -0.0058574676513671875, -0.004464149475097656, -0.003070831298828125, -0.0016775131225585938, -0.0002841949462890625, 0.0011091232299804688, 0.00250244140625, 0.0038957595825195312, 0.0052890777587890625, 0.006682395935058594, 0.008075714111328125, 0.009469032287597656, 0.010862350463867188, 0.012255668640136719, 0.01364898681640625, 0.015042304992675781, 0.016435623168945312, 0.017828941345214844, 0.019222259521484375, 0.020615577697753906, 0.022008895874023438, 0.02340221405029297, 0.0247955322265625, 0.02618885040283203, 0.027582168579101562, 0.028975486755371094, 0.030368804931640625, 0.031762123107910156, 0.03315544128417969, 0.03454875946044922, 0.03594207763671875, 0.03733539581298828, 0.03872871398925781, 0.040122032165527344, 0.041515350341796875, 0.042908668518066406, 0.04430198669433594, 0.04569530487060547, 0.047088623046875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 8.0, 13.0, 15.0, 20.0, 25.0, 39.0, 45.0, 81.0, 129.0, 211.0, 384.0, 567.0, 709.0, 584.0, 463.0, 278.0, 163.0, 85.0, 59.0, 51.0, 33.0, 24.0, 17.0, 17.0, 18.0, 9.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04449462890625, -0.04282951354980469, -0.041164398193359375, -0.03949928283691406, -0.03783416748046875, -0.03616905212402344, -0.034503936767578125, -0.03283882141113281, -0.0311737060546875, -0.029508590698242188, -0.027843475341796875, -0.026178359985351562, -0.02451324462890625, -0.022848129272460938, -0.021183013916015625, -0.019517898559570312, -0.017852783203125, -0.016187667846679688, -0.014522552490234375, -0.012857437133789062, -0.01119232177734375, -0.009527206420898438, -0.007862091064453125, -0.0061969757080078125, -0.0045318603515625, -0.0028667449951171875, -0.001201629638671875, 0.0004634857177734375, 0.00212860107421875, 0.0037937164306640625, 0.005458831787109375, 0.0071239471435546875, 0.0087890625, 0.010454177856445312, 0.012119293212890625, 0.013784408569335938, 0.01544952392578125, 0.017114639282226562, 0.018779754638671875, 0.020444869995117188, 0.0221099853515625, 0.023775100708007812, 0.025440216064453125, 0.027105331420898438, 0.02877044677734375, 0.030435562133789062, 0.032100677490234375, 0.03376579284667969, 0.035430908203125, 0.03709602355957031, 0.038761138916015625, 0.04042625427246094, 0.04209136962890625, 0.04375648498535156, 0.045421600341796875, 0.04708671569824219, 0.0487518310546875, 0.05041694641113281, 0.052082061767578125, 0.05374717712402344, 0.05541229248046875, 0.05707740783691406, 0.058742523193359375, 0.06040763854980469, 0.06207275390625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 10.0, 36.0, 58.0, 112.0, 146.0, 183.0, 166.0, 133.0, 71.0, 41.0, 14.0, 9.0, 12.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37211930751800537, -0.3619363605976105, -0.35175344347953796, -0.34157049655914307, -0.33138757944107056, -0.32120463252067566, -0.31102168560028076, -0.30083876848220825, -0.29065582156181335, -0.28047287464141846, -0.27028995752334595, -0.26010701060295105, -0.24992407858371735, -0.23974114656448364, -0.22955819964408875, -0.21937526762485504, -0.20919233560562134, -0.19900940358638763, -0.18882647156715393, -0.17864352464675903, -0.16846059262752533, -0.15827766060829163, -0.14809471368789673, -0.13791178166866302, -0.12772884964942932, -0.11754591763019562, -0.10736297816038132, -0.09718003869056702, -0.08699710667133331, -0.07681417465209961, -0.06663123518228531, -0.05644829571247101, -0.04626533389091492, -0.036082398146390915, -0.025899462401866913, -0.01571652665734291, -0.005533590912818909, 0.004649344831705093, 0.014832280576229095, 0.025015220046043396, 0.0351981520652771, 0.0453810878098011, 0.055564023554325104, 0.0657469630241394, 0.07592989504337311, 0.08611282706260681, 0.09629576653242111, 0.10647870600223541, 0.11666163802146912, 0.12684457004070282, 0.13702750205993652, 0.14721044898033142, 0.15739338099956512, 0.16757631301879883, 0.17775925993919373, 0.18794219195842743, 0.19812512397766113, 0.20830805599689484, 0.21849098801612854, 0.22867393493652344, 0.23885686695575714, 0.24903979897499084, 0.25922274589538574, 0.26940566301345825, 0.27958860993385315]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 10.0, 9.0, 8.0, 15.0, 17.0, 12.0, 20.0, 24.0, 26.0, 32.0, 35.0, 40.0, 47.0, 31.0, 44.0, 42.0, 57.0, 50.0, 45.0, 49.0, 35.0, 31.0, 42.0, 33.0, 36.0, 35.0, 25.0, 34.0, 21.0, 18.0, 17.0, 13.0, 10.0, 5.0, 6.0, 10.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.14731961488723755, -0.14219419658184052, -0.13706879317760468, -0.13194337487220764, -0.1268179565668106, -0.12169254571199417, -0.11656713485717773, -0.1114417165517807, -0.10631630569696426, -0.10119089484214783, -0.0960654765367508, -0.09094006568193436, -0.08581465482711792, -0.08068923652172089, -0.07556382566690445, -0.07043841481208801, -0.06531299650669098, -0.060187581926584244, -0.05506216734647751, -0.04993675649166107, -0.04481134191155434, -0.0396859273314476, -0.034560516476631165, -0.02943510189652443, -0.024309687316417694, -0.01918427273631096, -0.014058860018849373, -0.008933446370065212, -0.0038080327212810516, 0.0013173818588256836, 0.00644279457628727, 0.011568207293748856, 0.01669362187385559, 0.021819036453962326, 0.026944449171423912, 0.0320698618888855, 0.03719527646899223, 0.04232069104909897, 0.047446101903915405, 0.05257151648402214, 0.057696931064128876, 0.06282234191894531, 0.06794776022434235, 0.07307317107915878, 0.07819858193397522, 0.08332400023937225, 0.08844941109418869, 0.09357482194900513, 0.09870024025440216, 0.1038256511092186, 0.10895106941461563, 0.11407648026943207, 0.1192018985748291, 0.12432730942964554, 0.12945272028446198, 0.134578138589859, 0.13970354199409485, 0.14482896029949188, 0.14995436370372772, 0.15507978200912476, 0.1602052003145218, 0.16533061861991882, 0.17045602202415466, 0.1755814403295517, 0.18070685863494873]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 7.0, 7.0, 15.0, 14.0, 28.0, 30.0, 39.0, 61.0, 81.0, 100.0, 134.0, 204.0, 297.0, 502.0, 803.0, 1329.0, 2332.0, 4659.0, 10067.0, 21844.0, 49613.0, 120968.0, 267915.0, 302706.0, 151103.0, 62205.0, 26770.0, 12158.0, 5713.0, 2750.0, 1521.0, 879.0, 499.0, 346.0, 233.0, 171.0, 124.0, 80.0, 50.0, 48.0, 32.0, 26.0, 19.0, 10.0, 16.0, 10.0, 8.0, 5.0, 1.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.032073974609375, -0.031043529510498047, -0.030013084411621094, -0.02898263931274414, -0.027952194213867188, -0.026921749114990234, -0.02589130401611328, -0.024860858917236328, -0.023830413818359375, -0.022799968719482422, -0.02176952362060547, -0.020739078521728516, -0.019708633422851562, -0.01867818832397461, -0.017647743225097656, -0.016617298126220703, -0.01558685302734375, -0.014556407928466797, -0.013525962829589844, -0.01249551773071289, -0.011465072631835938, -0.010434627532958984, -0.009404182434082031, -0.008373737335205078, -0.007343292236328125, -0.006312847137451172, -0.005282402038574219, -0.004251956939697266, -0.0032215118408203125, -0.0021910667419433594, -0.0011606216430664062, -0.00013017654418945312, 0.0009002685546875, 0.0019307136535644531, 0.0029611587524414062, 0.003991603851318359, 0.0050220489501953125, 0.006052494049072266, 0.007082939147949219, 0.008113384246826172, 0.009143829345703125, 0.010174274444580078, 0.011204719543457031, 0.012235164642333984, 0.013265609741210938, 0.01429605484008789, 0.015326499938964844, 0.016356945037841797, 0.01738739013671875, 0.018417835235595703, 0.019448280334472656, 0.02047872543334961, 0.021509170532226562, 0.022539615631103516, 0.02357006072998047, 0.024600505828857422, 0.025630950927734375, 0.026661396026611328, 0.02769184112548828, 0.028722286224365234, 0.029752731323242188, 0.03078317642211914, 0.031813621520996094, 0.03284406661987305, 0.03387451171875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 6.0, 15.0, 23.0, 24.0, 37.0, 55.0, 53.0, 79.0, 92.0, 81.0, 82.0, 104.0, 67.0, 82.0, 60.0, 46.0, 25.0, 22.0, 14.0, 9.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054443359375, -0.052887916564941406, -0.05133247375488281, -0.04977703094482422, -0.048221588134765625, -0.04666614532470703, -0.04511070251464844, -0.043555259704589844, -0.04199981689453125, -0.040444374084472656, -0.03888893127441406, -0.03733348846435547, -0.035778045654296875, -0.03422260284423828, -0.03266716003417969, -0.031111717224121094, -0.0295562744140625, -0.028000831604003906, -0.026445388793945312, -0.02488994598388672, -0.023334503173828125, -0.02177906036376953, -0.020223617553710938, -0.018668174743652344, -0.01711273193359375, -0.015557289123535156, -0.014001846313476562, -0.012446403503417969, -0.010890960693359375, -0.009335517883300781, -0.0077800750732421875, -0.006224632263183594, -0.004669189453125, -0.0031137466430664062, -0.0015583038330078125, -2.86102294921875e-06, 0.001552581787109375, 0.0031080245971679688, 0.0046634674072265625, 0.006218910217285156, 0.00777435302734375, 0.009329795837402344, 0.010885238647460938, 0.012440681457519531, 0.013996124267578125, 0.015551567077636719, 0.017107009887695312, 0.018662452697753906, 0.0202178955078125, 0.021773338317871094, 0.023328781127929688, 0.02488422393798828, 0.026439666748046875, 0.02799510955810547, 0.029550552368164062, 0.031105995178222656, 0.03266143798828125, 0.034216880798339844, 0.03577232360839844, 0.03732776641845703, 0.038883209228515625, 0.04043865203857422, 0.04199409484863281, 0.043549537658691406, 0.04510498046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 3.0, 6.0, 4.0, 12.0, 9.0, 18.0, 17.0, 33.0, 57.0, 63.0, 86.0, 137.0, 205.0, 279.0, 441.0, 687.0, 1214.0, 2306.0, 4564.0, 10518.0, 25878.0, 69988.0, 204679.0, 387208.0, 217159.0, 74205.0, 27194.0, 10973.0, 4898.0, 2352.0, 1216.0, 730.0, 419.0, 296.0, 193.0, 165.0, 110.0, 62.0, 57.0, 32.0, 18.0, 18.0, 14.0, 8.0, 5.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04132080078125, -0.040050506591796875, -0.03878021240234375, -0.037509918212890625, -0.0362396240234375, -0.034969329833984375, -0.03369903564453125, -0.032428741455078125, -0.031158447265625, -0.029888153076171875, -0.02861785888671875, -0.027347564697265625, -0.0260772705078125, -0.024806976318359375, -0.02353668212890625, -0.022266387939453125, -0.02099609375, -0.019725799560546875, -0.01845550537109375, -0.017185211181640625, -0.0159149169921875, -0.014644622802734375, -0.01337432861328125, -0.012104034423828125, -0.010833740234375, -0.009563446044921875, -0.00829315185546875, -0.007022857666015625, -0.0057525634765625, -0.004482269287109375, -0.00321197509765625, -0.001941680908203125, -0.00067138671875, 0.000598907470703125, 0.00186920166015625, 0.003139495849609375, 0.0044097900390625, 0.005680084228515625, 0.00695037841796875, 0.008220672607421875, 0.009490966796875, 0.010761260986328125, 0.01203155517578125, 0.013301849365234375, 0.0145721435546875, 0.015842437744140625, 0.01711273193359375, 0.018383026123046875, 0.0196533203125, 0.020923614501953125, 0.02219390869140625, 0.023464202880859375, 0.0247344970703125, 0.026004791259765625, 0.02727508544921875, 0.028545379638671875, 0.029815673828125, 0.031085968017578125, 0.03235626220703125, 0.033626556396484375, 0.0348968505859375, 0.036167144775390625, 0.03743743896484375, 0.038707733154296875, 0.03997802734375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 8.0, 7.0, 14.0, 6.0, 11.0, 10.0, 20.0, 22.0, 29.0, 41.0, 29.0, 29.0, 30.0, 44.0, 56.0, 43.0, 56.0, 57.0, 45.0, 45.0, 55.0, 41.0, 31.0, 48.0, 30.0, 37.0, 23.0, 24.0, 15.0, 13.0, 19.0, 9.0, 15.0, 6.0, 8.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.069091796875, -0.06684494018554688, -0.06459808349609375, -0.062351226806640625, -0.0601043701171875, -0.057857513427734375, -0.05561065673828125, -0.053363800048828125, -0.051116943359375, -0.048870086669921875, -0.04662322998046875, -0.044376373291015625, -0.0421295166015625, -0.039882659912109375, -0.03763580322265625, -0.035388946533203125, -0.03314208984375, -0.030895233154296875, -0.02864837646484375, -0.026401519775390625, -0.0241546630859375, -0.021907806396484375, -0.01966094970703125, -0.017414093017578125, -0.015167236328125, -0.012920379638671875, -0.01067352294921875, -0.008426666259765625, -0.0061798095703125, -0.003932952880859375, -0.00168609619140625, 0.000560760498046875, 0.0028076171875, 0.005054473876953125, 0.00730133056640625, 0.009548187255859375, 0.0117950439453125, 0.014041900634765625, 0.01628875732421875, 0.018535614013671875, 0.020782470703125, 0.023029327392578125, 0.02527618408203125, 0.027523040771484375, 0.0297698974609375, 0.032016754150390625, 0.03426361083984375, 0.036510467529296875, 0.03875732421875, 0.041004180908203125, 0.04325103759765625, 0.045497894287109375, 0.0477447509765625, 0.049991607666015625, 0.05223846435546875, 0.054485321044921875, 0.056732177734375, 0.058979034423828125, 0.06122589111328125, 0.06347274780273438, 0.0657196044921875, 0.06796646118164062, 0.07021331787109375, 0.07246017456054688, 0.07470703125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 8.0, 6.0, 16.0, 21.0, 28.0, 48.0, 65.0, 82.0, 139.0, 183.0, 341.0, 545.0, 795.0, 1408.0, 2408.0, 4236.0, 7806.0, 14321.0, 28021.0, 56105.0, 115152.0, 218750.0, 264619.0, 165045.0, 83056.0, 40560.0, 20044.0, 10764.0, 5831.0, 3282.0, 1883.0, 1100.0, 694.0, 403.0, 256.0, 181.0, 116.0, 76.0, 43.0, 36.0, 30.0, 20.0, 7.0, 10.0, 4.0, 5.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.00876617431640625, -0.008510351181030273, -0.008254528045654297, -0.00799870491027832, -0.007742881774902344, -0.007487058639526367, -0.007231235504150391, -0.006975412368774414, -0.0067195892333984375, -0.006463766098022461, -0.006207942962646484, -0.005952119827270508, -0.005696296691894531, -0.005440473556518555, -0.005184650421142578, -0.0049288272857666016, -0.004673004150390625, -0.0044171810150146484, -0.004161357879638672, -0.0039055347442626953, -0.0036497116088867188, -0.003393888473510742, -0.0031380653381347656, -0.002882242202758789, -0.0026264190673828125, -0.002370595932006836, -0.0021147727966308594, -0.0018589496612548828, -0.0016031265258789062, -0.0013473033905029297, -0.0010914802551269531, -0.0008356571197509766, -0.000579833984375, -0.00032401084899902344, -6.818771362304688e-05, 0.0001876354217529297, 0.00044345855712890625, 0.0006992816925048828, 0.0009551048278808594, 0.001210927963256836, 0.0014667510986328125, 0.001722574234008789, 0.0019783973693847656, 0.002234220504760742, 0.0024900436401367188, 0.0027458667755126953, 0.003001689910888672, 0.0032575130462646484, 0.003513336181640625, 0.0037691593170166016, 0.004024982452392578, 0.004280805587768555, 0.004536628723144531, 0.004792451858520508, 0.005048274993896484, 0.005304098129272461, 0.0055599212646484375, 0.005815744400024414, 0.006071567535400391, 0.006327390670776367, 0.006583213806152344, 0.00683903694152832, 0.007094860076904297, 0.0073506832122802734, 0.00760650634765625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 5.0, 15.0, 15.0, 26.0, 29.0, 41.0, 79.0, 82.0, 78.0, 99.0, 112.0, 131.0, 77.0, 60.0, 36.0, 26.0, 43.0, 14.0, 15.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.318092346191406e-06, -6.127171218395233e-06, -5.93625009059906e-06, -5.745328962802887e-06, -5.554407835006714e-06, -5.363486707210541e-06, -5.172565579414368e-06, -4.981644451618195e-06, -4.7907233238220215e-06, -4.599802196025848e-06, -4.408881068229675e-06, -4.217959940433502e-06, -4.027038812637329e-06, -3.836117684841156e-06, -3.645196557044983e-06, -3.45427542924881e-06, -3.2633543014526367e-06, -3.0724331736564636e-06, -2.8815120458602905e-06, -2.6905909180641174e-06, -2.4996697902679443e-06, -2.3087486624717712e-06, -2.117827534675598e-06, -1.926906406879425e-06, -1.735985279083252e-06, -1.5450641512870789e-06, -1.3541430234909058e-06, -1.1632218956947327e-06, -9.723007678985596e-07, -7.813796401023865e-07, -5.904585123062134e-07, -3.995373845100403e-07, -2.086162567138672e-07, -1.7695128917694092e-08, 1.73225998878479e-07, 3.641471266746521e-07, 5.550682544708252e-07, 7.459893822669983e-07, 9.369105100631714e-07, 1.1278316378593445e-06, 1.3187527656555176e-06, 1.5096738934516907e-06, 1.7005950212478638e-06, 1.8915161490440369e-06, 2.08243727684021e-06, 2.273358404636383e-06, 2.464279532432556e-06, 2.6552006602287292e-06, 2.8461217880249023e-06, 3.0370429158210754e-06, 3.2279640436172485e-06, 3.4188851714134216e-06, 3.6098062992095947e-06, 3.800727427005768e-06, 3.991648554801941e-06, 4.182569682598114e-06, 4.373490810394287e-06, 4.56441193819046e-06, 4.755333065986633e-06, 4.946254193782806e-06, 5.1371753215789795e-06, 5.328096449375153e-06, 5.519017577171326e-06, 5.709938704967499e-06, 5.900859832763672e-06]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 0.0, 7.0, 15.0, 13.0, 22.0, 16.0, 33.0, 37.0, 58.0, 78.0, 116.0, 152.0, 261.0, 403.0, 659.0, 1021.0, 1731.0, 2918.0, 5213.0, 9765.0, 18671.0, 38170.0, 80583.0, 165043.0, 262957.0, 225263.0, 120181.0, 56662.0, 27419.0, 13891.0, 7315.0, 3997.0, 2308.0, 1311.0, 778.0, 509.0, 280.0, 199.0, 132.0, 110.0, 80.0, 45.0, 39.0, 23.0, 17.0, 17.0, 12.0, 3.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0], "bins": [-0.00814056396484375, -0.007892131805419922, -0.007643699645996094, -0.007395267486572266, -0.0071468353271484375, -0.006898403167724609, -0.006649971008300781, -0.006401538848876953, -0.006153106689453125, -0.005904674530029297, -0.005656242370605469, -0.005407810211181641, -0.0051593780517578125, -0.004910945892333984, -0.004662513732910156, -0.004414081573486328, -0.0041656494140625, -0.003917217254638672, -0.0036687850952148438, -0.0034203529357910156, -0.0031719207763671875, -0.0029234886169433594, -0.0026750564575195312, -0.002426624298095703, -0.002178192138671875, -0.0019297599792480469, -0.0016813278198242188, -0.0014328956604003906, -0.0011844635009765625, -0.0009360313415527344, -0.0006875991821289062, -0.0004391670227050781, -0.00019073486328125, 5.7697296142578125e-05, 0.00030612945556640625, 0.0005545616149902344, 0.0008029937744140625, 0.0010514259338378906, 0.0012998580932617188, 0.0015482902526855469, 0.001796722412109375, 0.002045154571533203, 0.0022935867309570312, 0.0025420188903808594, 0.0027904510498046875, 0.0030388832092285156, 0.0032873153686523438, 0.003535747528076172, 0.0037841796875, 0.004032611846923828, 0.004281044006347656, 0.004529476165771484, 0.0047779083251953125, 0.005026340484619141, 0.005274772644042969, 0.005523204803466797, 0.005771636962890625, 0.006020069122314453, 0.006268501281738281, 0.006516933441162109, 0.0067653656005859375, 0.007013797760009766, 0.007262229919433594, 0.007510662078857422, 0.00775909423828125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 11.0, 4.0, 10.0, 13.0, 17.0, 16.0, 14.0, 20.0, 31.0, 28.0, 31.0, 44.0, 39.0, 70.0, 71.0, 70.0, 73.0, 86.0, 57.0, 53.0, 32.0, 31.0, 30.0, 28.0, 14.0, 22.0, 18.0, 16.0, 9.0, 6.0, 8.0, 6.0, 3.0, 9.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01153564453125, -0.011204242706298828, -0.010872840881347656, -0.010541439056396484, -0.010210037231445312, -0.00987863540649414, -0.009547233581542969, -0.009215831756591797, -0.008884429931640625, -0.008553028106689453, -0.008221626281738281, -0.00789022445678711, -0.0075588226318359375, -0.007227420806884766, -0.006896018981933594, -0.006564617156982422, -0.00623321533203125, -0.005901813507080078, -0.005570411682128906, -0.005239009857177734, -0.0049076080322265625, -0.004576206207275391, -0.004244804382324219, -0.003913402557373047, -0.003582000732421875, -0.003250598907470703, -0.0029191970825195312, -0.0025877952575683594, -0.0022563934326171875, -0.0019249916076660156, -0.0015935897827148438, -0.0012621879577636719, -0.0009307861328125, -0.0005993843078613281, -0.00026798248291015625, 6.341934204101562e-05, 0.0003948211669921875, 0.0007262229919433594, 0.0010576248168945312, 0.0013890266418457031, 0.001720428466796875, 0.002051830291748047, 0.0023832321166992188, 0.0027146339416503906, 0.0030460357666015625, 0.0033774375915527344, 0.0037088394165039062, 0.004040241241455078, 0.00437164306640625, 0.004703044891357422, 0.005034446716308594, 0.005365848541259766, 0.0056972503662109375, 0.006028652191162109, 0.006360054016113281, 0.006691455841064453, 0.007022857666015625, 0.007354259490966797, 0.007685661315917969, 0.00801706314086914, 0.008348464965820312, 0.008679866790771484, 0.009011268615722656, 0.009342670440673828, 0.009674072265625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 14.0, 16.0, 46.0, 71.0, 139.0, 201.0, 164.0, 155.0, 97.0, 32.0, 27.0, 10.0, 9.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3487190306186676, -0.34026214480400085, -0.3318052589893341, -0.32334840297698975, -0.314891517162323, -0.30643463134765625, -0.2979777455329895, -0.28952085971832275, -0.2810640037059784, -0.27260711789131165, -0.2641502320766449, -0.25569337606430054, -0.2472364902496338, -0.23877960443496704, -0.2303227186203003, -0.22186584770679474, -0.213408961892128, -0.20495207607746124, -0.1964952051639557, -0.18803831934928894, -0.1795814484357834, -0.17112456262111664, -0.16266769170761108, -0.15421080589294434, -0.1457539200782776, -0.13729703426361084, -0.12884016335010529, -0.12038327753543854, -0.11192640662193298, -0.10346952080726624, -0.09501264244318008, -0.08655576407909393, -0.07809890806674957, -0.06964202970266342, -0.06118515133857727, -0.05272826924920082, -0.04427139088511467, -0.03581451252102852, -0.02735763043165207, -0.018900752067565918, -0.010443873703479767, -0.001986994408071041, 0.006469884887337685, 0.014926765114068985, 0.023383643478155136, 0.03184052184224129, 0.04029740393161774, 0.04875428229570389, 0.05721116065979004, 0.06566803902387619, 0.07412491738796234, 0.08258180320262909, 0.09103867411613464, 0.09949555993080139, 0.10795243829488754, 0.1164093166589737, 0.12486619502305984, 0.133323073387146, 0.14177995920181274, 0.1502368301153183, 0.15869371592998505, 0.1671505868434906, 0.17560747265815735, 0.1840643584728241, 0.19252122938632965]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 2.0, 7.0, 9.0, 7.0, 7.0, 15.0, 13.0, 10.0, 17.0, 22.0, 26.0, 23.0, 22.0, 35.0, 35.0, 29.0, 36.0, 40.0, 33.0, 36.0, 27.0, 36.0, 29.0, 31.0, 48.0, 33.0, 31.0, 25.0, 47.0, 22.0, 20.0, 29.0, 19.0, 25.0, 14.0, 17.0, 12.0, 20.0, 15.0, 14.0, 14.0, 6.0, 12.0, 2.0, 6.0, 5.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.14736515283584595, -0.1428213268518448, -0.13827751576900482, -0.13373368978500366, -0.1291898638010025, -0.12464604526758194, -0.12010222673416138, -0.11555840075016022, -0.11101458221673965, -0.10647076368331909, -0.10192693769931793, -0.09738311916589737, -0.0928393006324768, -0.08829547464847565, -0.08375165611505508, -0.07920783758163452, -0.07466401159763336, -0.0701201930642128, -0.06557636708021164, -0.06103254854679108, -0.056488726288080215, -0.051944904029369354, -0.04740108549594879, -0.04285726323723793, -0.03831344097852707, -0.03376961871981621, -0.029225798323750496, -0.024681977927684784, -0.020138155668973923, -0.015594333410263062, -0.01105051301419735, -0.006506692618131638, -0.0019628703594207764, 0.0025809509679675102, 0.007124772295355797, 0.011668593622744083, 0.01621241495013237, 0.02075623720884323, 0.025300057604908943, 0.029843878000974655, 0.034387700259685516, 0.03893152251839638, 0.04347534477710724, 0.0480191633105278, 0.05256298556923866, 0.057106807827949524, 0.06165062636137009, 0.06619444489479065, 0.07073827087879181, 0.07528208941221237, 0.07982591539621353, 0.0843697339296341, 0.08891355991363525, 0.09345737844705582, 0.09800119698047638, 0.10254502296447754, 0.1070888414978981, 0.11163266003131866, 0.11617648601531982, 0.12072030454874039, 0.12526412308216095, 0.1298079490661621, 0.13435177505016327, 0.13889558613300323, 0.1434394121170044]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 10.0, 6.0, 16.0, 15.0, 32.0, 28.0, 56.0, 91.0, 155.0, 204.0, 309.0, 607.0, 1298.0, 3240.0, 8694.0, 21982.0, 93160.0, 602051.0, 1760314.0, 1305342.0, 309217.0, 58382.0, 16538.0, 6886.0, 3466.0, 1301.0, 412.0, 180.0, 102.0, 56.0, 39.0, 23.0, 15.0, 18.0, 11.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03436279296875, -0.03328275680541992, -0.032202720642089844, -0.031122684478759766, -0.030042648315429688, -0.02896261215209961, -0.02788257598876953, -0.026802539825439453, -0.025722503662109375, -0.024642467498779297, -0.02356243133544922, -0.02248239517211914, -0.021402359008789062, -0.020322322845458984, -0.019242286682128906, -0.018162250518798828, -0.01708221435546875, -0.016002178192138672, -0.014922142028808594, -0.013842105865478516, -0.012762069702148438, -0.01168203353881836, -0.010601997375488281, -0.009521961212158203, -0.008441925048828125, -0.007361888885498047, -0.006281852722167969, -0.005201816558837891, -0.0041217803955078125, -0.0030417442321777344, -0.0019617080688476562, -0.0008816719055175781, 0.0001983642578125, 0.0012784004211425781, 0.0023584365844726562, 0.0034384727478027344, 0.0045185089111328125, 0.005598545074462891, 0.006678581237792969, 0.007758617401123047, 0.008838653564453125, 0.009918689727783203, 0.010998725891113281, 0.01207876205444336, 0.013158798217773438, 0.014238834381103516, 0.015318870544433594, 0.016398906707763672, 0.01747894287109375, 0.018558979034423828, 0.019639015197753906, 0.020719051361083984, 0.021799087524414062, 0.02287912368774414, 0.02395915985107422, 0.025039196014404297, 0.026119232177734375, 0.027199268341064453, 0.02827930450439453, 0.02935934066772461, 0.030439376831054688, 0.031519412994384766, 0.032599449157714844, 0.03367948532104492, 0.034759521484375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 10.0, 18.0, 18.0, 28.0, 42.0, 45.0, 59.0, 71.0, 91.0, 80.0, 91.0, 78.0, 75.0, 59.0, 63.0, 56.0, 32.0, 24.0, 24.0, 16.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0531005859375, -0.05163145065307617, -0.050162315368652344, -0.048693180084228516, -0.04722404479980469, -0.04575490951538086, -0.04428577423095703, -0.0428166389465332, -0.041347503662109375, -0.03987836837768555, -0.03840923309326172, -0.03694009780883789, -0.03547096252441406, -0.034001827239990234, -0.032532691955566406, -0.031063556671142578, -0.02959442138671875, -0.028125286102294922, -0.026656150817871094, -0.025187015533447266, -0.023717880249023438, -0.02224874496459961, -0.02077960968017578, -0.019310474395751953, -0.017841339111328125, -0.016372203826904297, -0.014903068542480469, -0.01343393325805664, -0.011964797973632812, -0.010495662689208984, -0.009026527404785156, -0.007557392120361328, -0.0060882568359375, -0.004619121551513672, -0.0031499862670898438, -0.0016808509826660156, -0.0002117156982421875, 0.0012574195861816406, 0.0027265548706054688, 0.004195690155029297, 0.005664825439453125, 0.007133960723876953, 0.008603096008300781, 0.01007223129272461, 0.011541366577148438, 0.013010501861572266, 0.014479637145996094, 0.015948772430419922, 0.01741790771484375, 0.018887042999267578, 0.020356178283691406, 0.021825313568115234, 0.023294448852539062, 0.02476358413696289, 0.02623271942138672, 0.027701854705810547, 0.029170989990234375, 0.030640125274658203, 0.03210926055908203, 0.03357839584350586, 0.03504753112792969, 0.036516666412353516, 0.037985801696777344, 0.03945493698120117, 0.040924072265625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 13.0, 13.0, 17.0, 32.0, 48.0, 118.0, 183.0, 434.0, 1007.0, 3427.0, 17046.0, 141936.0, 2234608.0, 1667895.0, 108501.0, 14095.0, 2946.0, 974.0, 484.0, 204.0, 128.0, 52.0, 34.0, 26.0, 19.0, 11.0, 11.0, 4.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0399169921875, -0.038010597229003906, -0.03610420227050781, -0.03419780731201172, -0.032291412353515625, -0.03038501739501953, -0.028478622436523438, -0.026572227478027344, -0.02466583251953125, -0.022759437561035156, -0.020853042602539062, -0.01894664764404297, -0.017040252685546875, -0.015133857727050781, -0.013227462768554688, -0.011321067810058594, -0.0094146728515625, -0.007508277893066406, -0.0056018829345703125, -0.0036954879760742188, -0.001789093017578125, 0.00011730194091796875, 0.0020236968994140625, 0.003930091857910156, 0.00583648681640625, 0.007742881774902344, 0.009649276733398438, 0.011555671691894531, 0.013462066650390625, 0.015368461608886719, 0.017274856567382812, 0.019181251525878906, 0.021087646484375, 0.022994041442871094, 0.024900436401367188, 0.02680683135986328, 0.028713226318359375, 0.03061962127685547, 0.03252601623535156, 0.034432411193847656, 0.03633880615234375, 0.038245201110839844, 0.04015159606933594, 0.04205799102783203, 0.043964385986328125, 0.04587078094482422, 0.04777717590332031, 0.049683570861816406, 0.0515899658203125, 0.053496360778808594, 0.05540275573730469, 0.05730915069580078, 0.059215545654296875, 0.06112194061279297, 0.06302833557128906, 0.06493473052978516, 0.06684112548828125, 0.06874752044677734, 0.07065391540527344, 0.07256031036376953, 0.07446670532226562, 0.07637310028076172, 0.07827949523925781, 0.0801858901977539, 0.08209228515625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 4.0, 5.0, 20.0, 19.0, 31.0, 53.0, 69.0, 140.0, 221.0, 373.0, 600.0, 708.0, 670.0, 443.0, 269.0, 142.0, 89.0, 71.0, 49.0, 32.0, 23.0, 11.0, 15.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039093017578125, -0.037287235260009766, -0.03548145294189453, -0.0336756706237793, -0.03186988830566406, -0.030064105987548828, -0.028258323669433594, -0.02645254135131836, -0.024646759033203125, -0.02284097671508789, -0.021035194396972656, -0.019229412078857422, -0.017423629760742188, -0.015617847442626953, -0.013812065124511719, -0.012006282806396484, -0.01020050048828125, -0.008394718170166016, -0.006588935852050781, -0.004783153533935547, -0.0029773712158203125, -0.0011715888977050781, 0.0006341934204101562, 0.0024399757385253906, 0.004245758056640625, 0.006051540374755859, 0.007857322692871094, 0.009663105010986328, 0.011468887329101562, 0.013274669647216797, 0.015080451965332031, 0.016886234283447266, 0.0186920166015625, 0.020497798919677734, 0.02230358123779297, 0.024109363555908203, 0.025915145874023438, 0.027720928192138672, 0.029526710510253906, 0.03133249282836914, 0.033138275146484375, 0.03494405746459961, 0.036749839782714844, 0.03855562210083008, 0.04036140441894531, 0.04216718673706055, 0.04397296905517578, 0.045778751373291016, 0.04758453369140625, 0.049390316009521484, 0.05119609832763672, 0.05300188064575195, 0.05480766296386719, 0.05661344528198242, 0.058419227600097656, 0.06022500991821289, 0.062030792236328125, 0.06383657455444336, 0.0656423568725586, 0.06744813919067383, 0.06925392150878906, 0.0710597038269043, 0.07286548614501953, 0.07467126846313477, 0.07647705078125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 24.0, 96.0, 184.0, 270.0, 235.0, 122.0, 45.0, 12.0, 5.0, 5.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7297308444976807, -0.7129429578781128, -0.6961550712585449, -0.679367184638977, -0.6625792980194092, -0.6457914113998413, -0.6290035247802734, -0.6122156381607056, -0.5954277515411377, -0.5786398649215698, -0.561851978302002, -0.5450640916824341, -0.5282762050628662, -0.5114883184432983, -0.4947004020214081, -0.4779125154018402, -0.46112459897994995, -0.4443367123603821, -0.4275488257408142, -0.41076093912124634, -0.39397305250167847, -0.3771851658821106, -0.36039724946022034, -0.34360936284065247, -0.3268214762210846, -0.3100335896015167, -0.29324570298194885, -0.276457816362381, -0.2596698999404907, -0.24288202822208405, -0.22609412670135498, -0.2093062400817871, -0.19251829385757446, -0.1757304072380066, -0.15894252061843872, -0.14215461909770966, -0.12536673247814178, -0.10857884585857391, -0.09179095178842545, -0.07500305771827698, -0.058215171098709106, -0.04142728075385094, -0.024639390408992767, -0.007851500064134598, 0.008936390280723572, 0.025724276900291443, 0.04251217097043991, 0.05930006504058838, 0.07608795166015625, 0.09287583827972412, 0.10966373234987259, 0.12645162642002106, 0.14323951303958893, 0.1600273996591568, 0.17681530117988586, 0.19360318779945374, 0.2103910744190216, 0.22717896103858948, 0.24396684765815735, 0.2607547342777252, 0.2775426506996155, 0.29433053731918335, 0.3111184239387512, 0.3279063105583191, 0.34469419717788696]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 6.0, 4.0, 7.0, 3.0, 3.0, 9.0, 11.0, 21.0, 13.0, 20.0, 21.0, 24.0, 19.0, 29.0, 31.0, 38.0, 38.0, 27.0, 27.0, 32.0, 47.0, 35.0, 39.0, 52.0, 39.0, 35.0, 51.0, 29.0, 23.0, 47.0, 33.0, 20.0, 34.0, 24.0, 20.0, 24.0, 12.0, 8.0, 11.0, 5.0, 9.0, 2.0, 4.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.13383948802947998, -0.12968625128269196, -0.12553302943706512, -0.1213797926902771, -0.11722655594348907, -0.11307332664728165, -0.10892009735107422, -0.1047668606042862, -0.10061363130807877, -0.09646040201187134, -0.09230716526508331, -0.08815393596887589, -0.08400070667266846, -0.07984746992588043, -0.075694240629673, -0.07154101133346558, -0.06738777458667755, -0.06323454529047012, -0.0590813085436821, -0.05492807924747467, -0.050774846225976944, -0.04662161320447922, -0.04246838390827179, -0.03831515088677406, -0.03416191786527634, -0.03000868484377861, -0.025855453684926033, -0.021702222526073456, -0.01754898950457573, -0.013395756483078003, -0.009242525324225426, -0.0050892941653728485, -0.0009360611438751221, 0.0032171709463000298, 0.007370403036475182, 0.011523635126650333, 0.015676867216825485, 0.01983010023832321, 0.02398333139717579, 0.028136562556028366, 0.03228979557752609, 0.03644302859902382, 0.040596261620521545, 0.04474949091672897, 0.0489027239382267, 0.053055956959724426, 0.057209186255931854, 0.06136241927742958, 0.06551565229892731, 0.06966888159513474, 0.07382211834192276, 0.07797534763813019, 0.08212858438491821, 0.08628181368112564, 0.09043504297733307, 0.0945882797241211, 0.09874150902032852, 0.10289473831653595, 0.10704797506332397, 0.1112012043595314, 0.11535443365573883, 0.11950767040252686, 0.12366089969873428, 0.1278141289949417, 0.13196736574172974]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 0.0, 4.0, 1.0, 12.0, 6.0, 16.0, 25.0, 35.0, 34.0, 50.0, 73.0, 91.0, 133.0, 171.0, 294.0, 444.0, 783.0, 1359.0, 2789.0, 6522.0, 16850.0, 48510.0, 138187.0, 291659.0, 303098.0, 151848.0, 53385.0, 18290.0, 7033.0, 3115.0, 1474.0, 800.0, 470.0, 282.0, 215.0, 139.0, 100.0, 70.0, 50.0, 40.0, 29.0, 15.0, 19.0, 7.0, 12.0, 7.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.03143310546875, -0.030452251434326172, -0.029471397399902344, -0.028490543365478516, -0.027509689331054688, -0.02652883529663086, -0.02554798126220703, -0.024567127227783203, -0.023586273193359375, -0.022605419158935547, -0.02162456512451172, -0.02064371109008789, -0.019662857055664062, -0.018682003021240234, -0.017701148986816406, -0.016720294952392578, -0.01573944091796875, -0.014758586883544922, -0.013777732849121094, -0.012796878814697266, -0.011816024780273438, -0.01083517074584961, -0.009854316711425781, -0.008873462677001953, -0.007892608642578125, -0.006911754608154297, -0.005930900573730469, -0.004950046539306641, -0.0039691925048828125, -0.0029883384704589844, -0.0020074844360351562, -0.0010266304016113281, -4.57763671875e-05, 0.0009350776672363281, 0.0019159317016601562, 0.0028967857360839844, 0.0038776397705078125, 0.004858493804931641, 0.005839347839355469, 0.006820201873779297, 0.007801055908203125, 0.008781909942626953, 0.009762763977050781, 0.01074361801147461, 0.011724472045898438, 0.012705326080322266, 0.013686180114746094, 0.014667034149169922, 0.01564788818359375, 0.016628742218017578, 0.017609596252441406, 0.018590450286865234, 0.019571304321289062, 0.02055215835571289, 0.02153301239013672, 0.022513866424560547, 0.023494720458984375, 0.024475574493408203, 0.02545642852783203, 0.02643728256225586, 0.027418136596679688, 0.028398990631103516, 0.029379844665527344, 0.030360698699951172, 0.031341552734375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 9.0, 11.0, 17.0, 29.0, 22.0, 47.0, 48.0, 82.0, 76.0, 85.0, 99.0, 93.0, 95.0, 87.0, 59.0, 40.0, 37.0, 30.0, 12.0, 9.0, 5.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050445556640625, -0.04889678955078125, -0.0473480224609375, -0.04579925537109375, -0.04425048828125, -0.04270172119140625, -0.0411529541015625, -0.03960418701171875, -0.038055419921875, -0.03650665283203125, -0.0349578857421875, -0.03340911865234375, -0.0318603515625, -0.03031158447265625, -0.0287628173828125, -0.02721405029296875, -0.025665283203125, -0.02411651611328125, -0.0225677490234375, -0.02101898193359375, -0.01947021484375, -0.01792144775390625, -0.0163726806640625, -0.01482391357421875, -0.013275146484375, -0.01172637939453125, -0.0101776123046875, -0.00862884521484375, -0.007080078125, -0.00553131103515625, -0.0039825439453125, -0.00243377685546875, -0.000885009765625, 0.00066375732421875, 0.0022125244140625, 0.00376129150390625, 0.00531005859375, 0.00685882568359375, 0.0084075927734375, 0.00995635986328125, 0.011505126953125, 0.01305389404296875, 0.0146026611328125, 0.01615142822265625, 0.0177001953125, 0.01924896240234375, 0.0207977294921875, 0.02234649658203125, 0.023895263671875, 0.02544403076171875, 0.0269927978515625, 0.02854156494140625, 0.03009033203125, 0.03163909912109375, 0.0331878662109375, 0.03473663330078125, 0.036285400390625, 0.03783416748046875, 0.0393829345703125, 0.04093170166015625, 0.04248046875, 0.04402923583984375, 0.0455780029296875, 0.04712677001953125, 0.048675537109375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 9.0, 2.0, 8.0, 11.0, 12.0, 16.0, 27.0, 38.0, 68.0, 82.0, 106.0, 153.0, 265.0, 360.0, 702.0, 1285.0, 2669.0, 5898.0, 14562.0, 40392.0, 121288.0, 292174.0, 327830.0, 156130.0, 52160.0, 18170.0, 7263.0, 3213.0, 1516.0, 852.0, 441.0, 272.0, 172.0, 126.0, 78.0, 47.0, 37.0, 39.0, 22.0, 9.0, 18.0, 8.0, 11.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03741455078125, -0.036249637603759766, -0.03508472442626953, -0.0339198112487793, -0.03275489807128906, -0.03158998489379883, -0.030425071716308594, -0.02926015853881836, -0.028095245361328125, -0.02693033218383789, -0.025765419006347656, -0.024600505828857422, -0.023435592651367188, -0.022270679473876953, -0.02110576629638672, -0.019940853118896484, -0.01877593994140625, -0.017611026763916016, -0.01644611358642578, -0.015281200408935547, -0.014116287231445312, -0.012951374053955078, -0.011786460876464844, -0.01062154769897461, -0.009456634521484375, -0.00829172134399414, -0.007126808166503906, -0.005961894989013672, -0.0047969818115234375, -0.003632068634033203, -0.0024671554565429688, -0.0013022422790527344, -0.0001373291015625, 0.0010275840759277344, 0.0021924972534179688, 0.003357410430908203, 0.0045223236083984375, 0.005687236785888672, 0.006852149963378906, 0.00801706314086914, 0.009181976318359375, 0.01034688949584961, 0.011511802673339844, 0.012676715850830078, 0.013841629028320312, 0.015006542205810547, 0.01617145538330078, 0.017336368560791016, 0.01850128173828125, 0.019666194915771484, 0.02083110809326172, 0.021996021270751953, 0.023160934448242188, 0.024325847625732422, 0.025490760803222656, 0.02665567398071289, 0.027820587158203125, 0.02898550033569336, 0.030150413513183594, 0.03131532669067383, 0.03248023986816406, 0.0336451530456543, 0.03481006622314453, 0.035974979400634766, 0.037139892578125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 10.0, 7.0, 10.0, 14.0, 12.0, 22.0, 22.0, 16.0, 15.0, 24.0, 32.0, 17.0, 33.0, 37.0, 55.0, 40.0, 35.0, 39.0, 33.0, 52.0, 48.0, 53.0, 36.0, 38.0, 40.0, 39.0, 31.0, 35.0, 17.0, 20.0, 30.0, 13.0, 10.0, 20.0, 10.0, 6.0, 6.0, 4.0, 7.0, 1.0, 5.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057220458984375, -0.05520963668823242, -0.053198814392089844, -0.051187992095947266, -0.04917716979980469, -0.04716634750366211, -0.04515552520751953, -0.04314470291137695, -0.041133880615234375, -0.0391230583190918, -0.03711223602294922, -0.03510141372680664, -0.03309059143066406, -0.031079769134521484, -0.029068946838378906, -0.027058124542236328, -0.02504730224609375, -0.023036479949951172, -0.021025657653808594, -0.019014835357666016, -0.017004013061523438, -0.01499319076538086, -0.012982368469238281, -0.010971546173095703, -0.008960723876953125, -0.006949901580810547, -0.004939079284667969, -0.0029282569885253906, -0.0009174346923828125, 0.0010933876037597656, 0.0031042098999023438, 0.005115032196044922, 0.0071258544921875, 0.009136676788330078, 0.011147499084472656, 0.013158321380615234, 0.015169143676757812, 0.01717996597290039, 0.01919078826904297, 0.021201610565185547, 0.023212432861328125, 0.025223255157470703, 0.02723407745361328, 0.02924489974975586, 0.03125572204589844, 0.033266544342041016, 0.035277366638183594, 0.03728818893432617, 0.03929901123046875, 0.04130983352661133, 0.043320655822753906, 0.045331478118896484, 0.04734230041503906, 0.04935312271118164, 0.05136394500732422, 0.0533747673034668, 0.055385589599609375, 0.05739641189575195, 0.05940723419189453, 0.06141805648803711, 0.06342887878417969, 0.06543970108032227, 0.06745052337646484, 0.06946134567260742, 0.07147216796875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 8.0, 3.0, 16.0, 15.0, 24.0, 39.0, 58.0, 97.0, 185.0, 398.0, 775.0, 1659.0, 3996.0, 9620.0, 23691.0, 55978.0, 115744.0, 194598.0, 234907.0, 193927.0, 115929.0, 55886.0, 23889.0, 10020.0, 3835.0, 1670.0, 771.0, 388.0, 192.0, 85.0, 61.0, 38.0, 15.0, 13.0, 11.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0077972412109375, -0.007557332515716553, -0.0073174238204956055, -0.007077515125274658, -0.006837606430053711, -0.006597697734832764, -0.006357789039611816, -0.006117880344390869, -0.005877971649169922, -0.005638062953948975, -0.005398154258728027, -0.00515824556350708, -0.004918336868286133, -0.0046784281730651855, -0.004438519477844238, -0.004198610782623291, -0.003958702087402344, -0.0037187933921813965, -0.0034788846969604492, -0.003238976001739502, -0.0029990673065185547, -0.0027591586112976074, -0.00251924991607666, -0.002279341220855713, -0.0020394325256347656, -0.0017995238304138184, -0.001559615135192871, -0.0013197064399719238, -0.0010797977447509766, -0.0008398890495300293, -0.000599980354309082, -0.00036007165908813477, -0.0001201629638671875, 0.00011974573135375977, 0.00035965442657470703, 0.0005995631217956543, 0.0008394718170166016, 0.0010793805122375488, 0.001319289207458496, 0.0015591979026794434, 0.0017991065979003906, 0.002039015293121338, 0.002278923988342285, 0.0025188326835632324, 0.0027587413787841797, 0.002998650074005127, 0.0032385587692260742, 0.0034784674644470215, 0.0037183761596679688, 0.003958284854888916, 0.004198193550109863, 0.0044381022453308105, 0.004678010940551758, 0.004917919635772705, 0.005157828330993652, 0.0053977370262146, 0.005637645721435547, 0.005877554416656494, 0.006117463111877441, 0.006357371807098389, 0.006597280502319336, 0.006837189197540283, 0.0070770978927612305, 0.007317006587982178, 0.007556915283203125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 2.0, 16.0, 12.0, 4.0, 7.0, 10.0, 17.0, 18.0, 6.0, 24.0, 40.0, 29.0, 30.0, 32.0, 61.0, 25.0, 29.0, 37.0, 88.0, 36.0, 28.0, 37.0, 39.0, 54.0, 32.0, 32.0, 27.0, 50.0, 27.0, 28.0, 20.0, 33.0, 11.0, 8.0, 12.0, 15.0, 4.0, 2.0, 6.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2649765014648438e-06, -2.191402018070221e-06, -2.117827534675598e-06, -2.0442530512809753e-06, -1.9706785678863525e-06, -1.8971040844917297e-06, -1.823529601097107e-06, -1.7499551177024841e-06, -1.6763806343078613e-06, -1.6028061509132385e-06, -1.5292316675186157e-06, -1.455657184123993e-06, -1.3820827007293701e-06, -1.3085082173347473e-06, -1.2349337339401245e-06, -1.1613592505455017e-06, -1.087784767150879e-06, -1.014210283756256e-06, -9.406358003616333e-07, -8.670613169670105e-07, -7.934868335723877e-07, -7.199123501777649e-07, -6.463378667831421e-07, -5.727633833885193e-07, -4.991888999938965e-07, -4.256144165992737e-07, -3.520399332046509e-07, -2.784654498100281e-07, -2.0489096641540527e-07, -1.3131648302078247e-07, -5.774199962615967e-08, 1.5832483768463135e-08, 8.940696716308594e-08, 1.6298145055770874e-07, 2.3655593395233154e-07, 3.1013041734695435e-07, 3.8370490074157715e-07, 4.5727938413619995e-07, 5.308538675308228e-07, 6.044283509254456e-07, 6.780028343200684e-07, 7.515773177146912e-07, 8.25151801109314e-07, 8.987262845039368e-07, 9.723007678985596e-07, 1.0458752512931824e-06, 1.1194497346878052e-06, 1.193024218082428e-06, 1.2665987014770508e-06, 1.3401731848716736e-06, 1.4137476682662964e-06, 1.4873221516609192e-06, 1.560896635055542e-06, 1.6344711184501648e-06, 1.7080456018447876e-06, 1.7816200852394104e-06, 1.8551945686340332e-06, 1.928769052028656e-06, 2.002343535423279e-06, 2.0759180188179016e-06, 2.1494925022125244e-06, 2.2230669856071472e-06, 2.29664146900177e-06, 2.370215952396393e-06, 2.4437904357910156e-06]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 13.0, 16.0, 23.0, 36.0, 54.0, 81.0, 130.0, 193.0, 370.0, 628.0, 1189.0, 2413.0, 5050.0, 10598.0, 22259.0, 44957.0, 83470.0, 134595.0, 180955.0, 190667.0, 154584.0, 101752.0, 57363.0, 29435.0, 14227.0, 6742.0, 3225.0, 1630.0, 807.0, 453.0, 227.0, 133.0, 92.0, 51.0, 43.0, 30.0, 27.0, 11.0, 12.0, 4.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0054779052734375, -0.00527644157409668, -0.005074977874755859, -0.004873514175415039, -0.004672050476074219, -0.0044705867767333984, -0.004269123077392578, -0.004067659378051758, -0.0038661956787109375, -0.003664731979370117, -0.003463268280029297, -0.0032618045806884766, -0.0030603408813476562, -0.002858877182006836, -0.0026574134826660156, -0.0024559497833251953, -0.002254486083984375, -0.0020530223846435547, -0.0018515586853027344, -0.001650094985961914, -0.0014486312866210938, -0.0012471675872802734, -0.0010457038879394531, -0.0008442401885986328, -0.0006427764892578125, -0.0004413127899169922, -0.00023984909057617188, -3.838539123535156e-05, 0.00016307830810546875, 0.00036454200744628906, 0.0005660057067871094, 0.0007674694061279297, 0.00096893310546875, 0.0011703968048095703, 0.0013718605041503906, 0.001573324203491211, 0.0017747879028320312, 0.0019762516021728516, 0.002177715301513672, 0.002379179000854492, 0.0025806427001953125, 0.002782106399536133, 0.002983570098876953, 0.0031850337982177734, 0.0033864974975585938, 0.003587961196899414, 0.0037894248962402344, 0.003990888595581055, 0.004192352294921875, 0.004393815994262695, 0.004595279693603516, 0.004796743392944336, 0.004998207092285156, 0.0051996707916259766, 0.005401134490966797, 0.005602598190307617, 0.0058040618896484375, 0.006005525588989258, 0.006206989288330078, 0.0064084529876708984, 0.006609916687011719, 0.006811380386352539, 0.007012844085693359, 0.00721430778503418, 0.007415771484375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 8.0, 9.0, 9.0, 10.0, 14.0, 24.0, 19.0, 26.0, 22.0, 21.0, 36.0, 29.0, 42.0, 45.0, 45.0, 31.0, 44.0, 43.0, 43.0, 50.0, 50.0, 50.0, 38.0, 57.0, 36.0, 39.0, 25.0, 23.0, 19.0, 18.0, 22.0, 11.0, 11.0, 9.0, 5.0, 8.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00780487060546875, -0.007552981376647949, -0.0073010921478271484, -0.007049202919006348, -0.006797313690185547, -0.006545424461364746, -0.006293535232543945, -0.0060416460037231445, -0.005789756774902344, -0.005537867546081543, -0.005285978317260742, -0.005034089088439941, -0.004782199859619141, -0.00453031063079834, -0.004278421401977539, -0.004026532173156738, -0.0037746429443359375, -0.0035227537155151367, -0.003270864486694336, -0.003018975257873535, -0.0027670860290527344, -0.0025151968002319336, -0.002263307571411133, -0.002011418342590332, -0.0017595291137695312, -0.0015076398849487305, -0.0012557506561279297, -0.001003861427307129, -0.0007519721984863281, -0.0005000829696655273, -0.00024819374084472656, 3.6954879760742188e-06, 0.000255584716796875, 0.0005074739456176758, 0.0007593631744384766, 0.0010112524032592773, 0.0012631416320800781, 0.001515030860900879, 0.0017669200897216797, 0.0020188093185424805, 0.0022706985473632812, 0.002522587776184082, 0.002774477005004883, 0.0030263662338256836, 0.0032782554626464844, 0.003530144691467285, 0.003782033920288086, 0.004033923149108887, 0.0042858123779296875, 0.004537701606750488, 0.004789590835571289, 0.00504148006439209, 0.005293369293212891, 0.005545258522033691, 0.005797147750854492, 0.006049036979675293, 0.006300926208496094, 0.0065528154373168945, 0.006804704666137695, 0.007056593894958496, 0.007308483123779297, 0.007560372352600098, 0.0078122615814208984, 0.0080641508102417, 0.0083160400390625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 1.0, 5.0, 9.0, 15.0, 26.0, 41.0, 84.0, 127.0, 241.0, 222.0, 122.0, 56.0, 26.0, 14.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3470926284790039, -0.33905553817749023, -0.33101844787597656, -0.3229813575744629, -0.31494423747062683, -0.30690714716911316, -0.2988700568675995, -0.2908329665660858, -0.28279587626457214, -0.27475878596305847, -0.2667216956615448, -0.25868457555770874, -0.25064748525619507, -0.2426103949546814, -0.23457330465316772, -0.22653621435165405, -0.2184991091489792, -0.21046201884746552, -0.20242491364479065, -0.19438782334327698, -0.1863507330417633, -0.17831364274024963, -0.17027653753757477, -0.1622394472360611, -0.15420234203338623, -0.14616525173187256, -0.1381281465291977, -0.13009105622768402, -0.12205396592617035, -0.11401686817407608, -0.10597977042198181, -0.09794268012046814, -0.08990557491779327, -0.081868477165699, -0.07383138686418533, -0.06579428911209106, -0.057757195085287094, -0.049720101058483124, -0.041683003306388855, -0.033645909279584885, -0.025608815252780914, -0.017571721225976944, -0.009534625336527824, -0.0014975294470787048, 0.0065395645797252655, 0.014576658606529236, 0.022613756358623505, 0.030650850385427475, 0.038687944412231445, 0.046725038439035416, 0.054762132465839386, 0.06279923021793365, 0.07083632051944733, 0.0788734182715416, 0.08691051602363586, 0.09494760632514954, 0.1029847040772438, 0.11102180182933807, 0.11905889213085175, 0.1270959973335266, 0.13513308763504028, 0.14317017793655396, 0.15120726823806763, 0.1592443734407425, 0.16728146374225616]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 8.0, 12.0, 6.0, 11.0, 11.0, 15.0, 10.0, 22.0, 12.0, 27.0, 27.0, 25.0, 28.0, 24.0, 37.0, 34.0, 34.0, 29.0, 34.0, 58.0, 38.0, 42.0, 46.0, 41.0, 38.0, 45.0, 28.0, 26.0, 36.0, 27.0, 18.0, 20.0, 21.0, 16.0, 16.0, 15.0, 16.0, 5.0, 5.0, 4.0, 6.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1541242003440857, -0.14924372732639313, -0.14436326920986176, -0.1394827961921692, -0.13460233807563782, -0.12972186505794525, -0.12484139204025269, -0.11996092647314072, -0.11508046090602875, -0.11019999533891678, -0.10531952977180481, -0.10043905675411224, -0.09555859118700027, -0.0906781256198883, -0.08579765260219574, -0.08091718703508377, -0.0760367214679718, -0.07115625590085983, -0.06627579033374786, -0.0613953173160553, -0.05651485174894333, -0.05163438618183136, -0.04675391688942909, -0.041873447597026825, -0.036992982029914856, -0.03211251646280289, -0.02723204717040062, -0.0223515797406435, -0.017471112310886383, -0.012590644881129265, -0.007710177451372147, -0.002829708158969879, 0.00205075740814209, 0.006931224837899208, 0.011811692267656326, 0.016692159697413445, 0.021572627127170563, 0.02645309455692768, 0.0313335619866848, 0.03621403127908707, 0.041094496846199036, 0.045974962413311005, 0.05085543170571327, 0.05573590099811554, 0.06061636656522751, 0.06549683213233948, 0.07037730515003204, 0.07525777071714401, 0.08013823628425598, 0.08501870185136795, 0.08989916741847992, 0.09477964043617249, 0.09966010600328445, 0.10454057157039642, 0.10942104458808899, 0.11430151015520096, 0.11918197572231293, 0.1240624412894249, 0.12894290685653687, 0.13382337987422943, 0.138703852891922, 0.14358431100845337, 0.14846478402614594, 0.1533452570438385, 0.15822571516036987]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 3.0, 5.0, 5.0, 7.0, 9.0, 15.0, 21.0, 30.0, 65.0, 101.0, 190.0, 390.0, 1166.0, 4214.0, 20178.0, 251453.0, 2422512.0, 1390062.0, 83927.0, 14112.0, 4310.0, 918.0, 271.0, 129.0, 70.0, 33.0, 35.0, 14.0, 19.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06304931640625, -0.061185359954833984, -0.05932140350341797, -0.05745744705200195, -0.05559349060058594, -0.05372953414916992, -0.051865577697753906, -0.05000162124633789, -0.048137664794921875, -0.04627370834350586, -0.044409751892089844, -0.04254579544067383, -0.04068183898925781, -0.0388178825378418, -0.03695392608642578, -0.035089969635009766, -0.03322601318359375, -0.031362056732177734, -0.02949810028076172, -0.027634143829345703, -0.025770187377929688, -0.023906230926513672, -0.022042274475097656, -0.02017831802368164, -0.018314361572265625, -0.01645040512084961, -0.014586448669433594, -0.012722492218017578, -0.010858535766601562, -0.008994579315185547, -0.007130622863769531, -0.005266666412353516, -0.0034027099609375, -0.0015387535095214844, 0.00032520294189453125, 0.002189159393310547, 0.0040531158447265625, 0.005917072296142578, 0.007781028747558594, 0.00964498519897461, 0.011508941650390625, 0.01337289810180664, 0.015236854553222656, 0.017100811004638672, 0.018964767456054688, 0.020828723907470703, 0.02269268035888672, 0.024556636810302734, 0.02642059326171875, 0.028284549713134766, 0.03014850616455078, 0.0320124626159668, 0.03387641906738281, 0.03574037551879883, 0.037604331970214844, 0.03946828842163086, 0.041332244873046875, 0.04319620132446289, 0.045060157775878906, 0.04692411422729492, 0.04878807067871094, 0.05065202713012695, 0.05251598358154297, 0.054379940032958984, 0.056243896484375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 7.0, 19.0, 18.0, 35.0, 35.0, 68.0, 76.0, 80.0, 93.0, 101.0, 72.0, 80.0, 73.0, 67.0, 46.0, 36.0, 37.0, 16.0, 17.0, 8.0, 9.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058624267578125, -0.056984901428222656, -0.05534553527832031, -0.05370616912841797, -0.052066802978515625, -0.05042743682861328, -0.04878807067871094, -0.047148704528808594, -0.04550933837890625, -0.043869972229003906, -0.04223060607910156, -0.04059123992919922, -0.038951873779296875, -0.03731250762939453, -0.03567314147949219, -0.034033775329589844, -0.0323944091796875, -0.030755043029785156, -0.029115676879882812, -0.02747631072998047, -0.025836944580078125, -0.02419757843017578, -0.022558212280273438, -0.020918846130371094, -0.01927947998046875, -0.017640113830566406, -0.016000747680664062, -0.014361381530761719, -0.012722015380859375, -0.011082649230957031, -0.009443283081054688, -0.007803916931152344, -0.00616455078125, -0.004525184631347656, -0.0028858184814453125, -0.0012464523315429688, 0.000392913818359375, 0.0020322799682617188, 0.0036716461181640625, 0.005311012268066406, 0.00695037841796875, 0.008589744567871094, 0.010229110717773438, 0.011868476867675781, 0.013507843017578125, 0.015147209167480469, 0.016786575317382812, 0.018425941467285156, 0.0200653076171875, 0.021704673767089844, 0.023344039916992188, 0.02498340606689453, 0.026622772216796875, 0.02826213836669922, 0.029901504516601562, 0.031540870666503906, 0.03318023681640625, 0.034819602966308594, 0.03645896911621094, 0.03809833526611328, 0.039737701416015625, 0.04137706756591797, 0.04301643371582031, 0.044655799865722656, 0.046295166015625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 15.0, 15.0, 20.0, 38.0, 51.0, 70.0, 92.0, 153.0, 214.0, 385.0, 702.0, 1526.0, 4089.0, 13171.0, 52726.0, 296343.0, 2332669.0, 1291520.0, 154541.0, 31630.0, 8589.0, 2918.0, 1194.0, 598.0, 335.0, 228.0, 145.0, 82.0, 64.0, 43.0, 32.0, 22.0, 13.0, 18.0, 9.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.040924072265625, -0.0395965576171875, -0.03826904296875, -0.0369415283203125, -0.035614013671875, -0.0342864990234375, -0.032958984375, -0.0316314697265625, -0.030303955078125, -0.0289764404296875, -0.02764892578125, -0.0263214111328125, -0.024993896484375, -0.0236663818359375, -0.0223388671875, -0.0210113525390625, -0.019683837890625, -0.0183563232421875, -0.01702880859375, -0.0157012939453125, -0.014373779296875, -0.0130462646484375, -0.01171875, -0.0103912353515625, -0.009063720703125, -0.0077362060546875, -0.00640869140625, -0.0050811767578125, -0.003753662109375, -0.0024261474609375, -0.0010986328125, 0.0002288818359375, 0.001556396484375, 0.0028839111328125, 0.00421142578125, 0.0055389404296875, 0.006866455078125, 0.0081939697265625, 0.009521484375, 0.0108489990234375, 0.012176513671875, 0.0135040283203125, 0.01483154296875, 0.0161590576171875, 0.017486572265625, 0.0188140869140625, 0.0201416015625, 0.0214691162109375, 0.022796630859375, 0.0241241455078125, 0.02545166015625, 0.0267791748046875, 0.028106689453125, 0.0294342041015625, 0.03076171875, 0.0320892333984375, 0.033416748046875, 0.0347442626953125, 0.03607177734375, 0.0373992919921875, 0.038726806640625, 0.0400543212890625, 0.0413818359375, 0.0427093505859375, 0.044036865234375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 10.0, 8.0, 15.0, 19.0, 13.0, 29.0, 39.0, 67.0, 98.0, 191.0, 281.0, 455.0, 621.0, 621.0, 562.0, 373.0, 253.0, 136.0, 80.0, 56.0, 33.0, 32.0, 24.0, 12.0, 12.0, 12.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033294677734375, -0.031805992126464844, -0.030317306518554688, -0.02882862091064453, -0.027339935302734375, -0.02585124969482422, -0.024362564086914062, -0.022873878479003906, -0.02138519287109375, -0.019896507263183594, -0.018407821655273438, -0.01691913604736328, -0.015430450439453125, -0.013941764831542969, -0.012453079223632812, -0.010964393615722656, -0.0094757080078125, -0.007987022399902344, -0.0064983367919921875, -0.005009651184082031, -0.003520965576171875, -0.0020322799682617188, -0.0005435943603515625, 0.0009450912475585938, 0.00243377685546875, 0.003922462463378906, 0.0054111480712890625, 0.006899833679199219, 0.008388519287109375, 0.009877204895019531, 0.011365890502929688, 0.012854576110839844, 0.01434326171875, 0.015831947326660156, 0.017320632934570312, 0.01880931854248047, 0.020298004150390625, 0.02178668975830078, 0.023275375366210938, 0.024764060974121094, 0.02625274658203125, 0.027741432189941406, 0.029230117797851562, 0.03071880340576172, 0.032207489013671875, 0.03369617462158203, 0.03518486022949219, 0.036673545837402344, 0.0381622314453125, 0.039650917053222656, 0.04113960266113281, 0.04262828826904297, 0.044116973876953125, 0.04560565948486328, 0.04709434509277344, 0.048583030700683594, 0.05007171630859375, 0.051560401916503906, 0.05304908752441406, 0.05453777313232422, 0.056026458740234375, 0.05751514434814453, 0.05900382995605469, 0.060492515563964844, 0.061981201171875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 30.0, 64.0, 158.0, 195.0, 216.0, 169.0, 89.0, 42.0, 17.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40166759490966797, -0.38950851559638977, -0.37734946608543396, -0.36519038677215576, -0.35303130745887756, -0.34087225794792175, -0.32871317863464355, -0.31655412912368774, -0.30439504981040955, -0.29223597049713135, -0.28007692098617554, -0.26791784167289734, -0.25575876235961914, -0.24359971284866333, -0.23144063353538513, -0.21928156912326813, -0.20712248980998993, -0.19496342539787292, -0.18280434608459473, -0.17064528167247772, -0.15848621726036072, -0.14632713794708252, -0.13416807353496552, -0.12200900912284851, -0.10984993726015091, -0.09769086539745331, -0.0855318009853363, -0.0733727291226387, -0.0612136609852314, -0.0490545928478241, -0.036895520985126495, -0.02473645657300949, -0.01257738471031189, -0.0004183156415820122, 0.011740753427147865, 0.023899823427200317, 0.03605889156460762, 0.04821795970201492, 0.060377031564712524, 0.07253609597682953, 0.08469516783952713, 0.09685423970222473, 0.10901330411434174, 0.12117237597703934, 0.13333144783973694, 0.14549051225185394, 0.15764957666397095, 0.16980865597724915, 0.18196772038936615, 0.19412678480148315, 0.20628586411476135, 0.21844492852687836, 0.23060399293899536, 0.24276307225227356, 0.25492215156555176, 0.26708120107650757, 0.27924028038978577, 0.29139935970306396, 0.3035584092140198, 0.315717488527298, 0.32787656784057617, 0.340035617351532, 0.3521946966648102, 0.3643537759780884, 0.3765128254890442]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 8.0, 7.0, 6.0, 13.0, 14.0, 10.0, 25.0, 23.0, 27.0, 31.0, 32.0, 36.0, 51.0, 37.0, 36.0, 42.0, 47.0, 45.0, 36.0, 43.0, 42.0, 41.0, 43.0, 47.0, 37.0, 26.0, 34.0, 31.0, 22.0, 20.0, 26.0, 19.0, 7.0, 6.0, 6.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.14348220825195312, -0.1393526792526245, -0.1352231502532959, -0.13109362125396729, -0.12696409225463867, -0.12283456325531006, -0.11870502680540085, -0.11457549780607224, -0.11044596880674362, -0.10631643980741501, -0.1021869108080864, -0.09805738180875778, -0.09392784535884857, -0.08979831635951996, -0.08566878736019135, -0.08153925836086273, -0.07740972936153412, -0.0732802003622055, -0.06915067136287689, -0.06502114236354828, -0.06089160963892937, -0.056762080639600754, -0.05263254791498184, -0.04850301891565323, -0.044373489916324615, -0.040243960916996, -0.03611443191766739, -0.03198489919304848, -0.027855370193719864, -0.02372584119439125, -0.019596310332417488, -0.015466779470443726, -0.011337250471115112, -0.007207720540463924, -0.0030781906098127365, 0.0010513393208384514, 0.005180869251489639, 0.009310398250818253, 0.013439929112792015, 0.017569459974765778, 0.02169898897409439, 0.025828517973423004, 0.029958048835396767, 0.03408757969737053, 0.03821710869669914, 0.042346637696027756, 0.04647617042064667, 0.05060569941997528, 0.054735228419303894, 0.05886475741863251, 0.06299428641796112, 0.06712381541728973, 0.07125334441661835, 0.07538287341594696, 0.07951240986585617, 0.08364193886518478, 0.0877714678645134, 0.09190099686384201, 0.09603052586317062, 0.10016005486249924, 0.10428959131240845, 0.10841912031173706, 0.11254864931106567, 0.11667817831039429, 0.1208077073097229]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 8.0, 16.0, 13.0, 30.0, 31.0, 30.0, 64.0, 98.0, 157.0, 191.0, 353.0, 520.0, 851.0, 1631.0, 3245.0, 7240.0, 18285.0, 50577.0, 137237.0, 285276.0, 298887.0, 151305.0, 56388.0, 20596.0, 7946.0, 3376.0, 1684.0, 950.0, 551.0, 300.0, 236.0, 153.0, 97.0, 66.0, 42.0, 26.0, 26.0, 19.0, 10.0, 7.0, 8.0, 3.0, 7.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03204345703125, -0.030940532684326172, -0.029837608337402344, -0.028734683990478516, -0.027631759643554688, -0.02652883529663086, -0.02542591094970703, -0.024322986602783203, -0.023220062255859375, -0.022117137908935547, -0.02101421356201172, -0.01991128921508789, -0.018808364868164062, -0.017705440521240234, -0.016602516174316406, -0.015499591827392578, -0.01439666748046875, -0.013293743133544922, -0.012190818786621094, -0.011087894439697266, -0.009984970092773438, -0.00888204574584961, -0.007779121398925781, -0.006676197052001953, -0.005573272705078125, -0.004470348358154297, -0.0033674240112304688, -0.0022644996643066406, -0.0011615753173828125, -5.8650970458984375e-05, 0.0010442733764648438, 0.002147197723388672, 0.0032501220703125, 0.004353046417236328, 0.005455970764160156, 0.006558895111083984, 0.0076618194580078125, 0.00876474380493164, 0.009867668151855469, 0.010970592498779297, 0.012073516845703125, 0.013176441192626953, 0.014279365539550781, 0.01538228988647461, 0.016485214233398438, 0.017588138580322266, 0.018691062927246094, 0.019793987274169922, 0.02089691162109375, 0.021999835968017578, 0.023102760314941406, 0.024205684661865234, 0.025308609008789062, 0.02641153335571289, 0.02751445770263672, 0.028617382049560547, 0.029720306396484375, 0.030823230743408203, 0.03192615509033203, 0.03302907943725586, 0.03413200378417969, 0.035234928131103516, 0.036337852478027344, 0.03744077682495117, 0.038543701171875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 6.0, 14.0, 12.0, 31.0, 23.0, 34.0, 37.0, 60.0, 62.0, 63.0, 92.0, 82.0, 78.0, 62.0, 61.0, 63.0, 54.0, 41.0, 30.0, 27.0, 20.0, 10.0, 8.0, 8.0, 3.0, 8.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.047210693359375, -0.045891761779785156, -0.04457283020019531, -0.04325389862060547, -0.041934967041015625, -0.04061603546142578, -0.03929710388183594, -0.037978172302246094, -0.03665924072265625, -0.035340309143066406, -0.03402137756347656, -0.03270244598388672, -0.031383514404296875, -0.03006458282470703, -0.028745651245117188, -0.027426719665527344, -0.0261077880859375, -0.024788856506347656, -0.023469924926757812, -0.02215099334716797, -0.020832061767578125, -0.01951313018798828, -0.018194198608398438, -0.016875267028808594, -0.01555633544921875, -0.014237403869628906, -0.012918472290039062, -0.011599540710449219, -0.010280609130859375, -0.008961677551269531, -0.0076427459716796875, -0.006323814392089844, -0.0050048828125, -0.0036859512329101562, -0.0023670196533203125, -0.0010480880737304688, 0.000270843505859375, 0.0015897750854492188, 0.0029087066650390625, 0.004227638244628906, 0.00554656982421875, 0.006865501403808594, 0.008184432983398438, 0.009503364562988281, 0.010822296142578125, 0.012141227722167969, 0.013460159301757812, 0.014779090881347656, 0.0160980224609375, 0.017416954040527344, 0.018735885620117188, 0.02005481719970703, 0.021373748779296875, 0.02269268035888672, 0.024011611938476562, 0.025330543518066406, 0.02664947509765625, 0.027968406677246094, 0.029287338256835938, 0.03060626983642578, 0.031925201416015625, 0.03324413299560547, 0.03456306457519531, 0.035881996154785156, 0.037200927734375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 9.0, 7.0, 13.0, 13.0, 25.0, 31.0, 32.0, 31.0, 61.0, 91.0, 136.0, 181.0, 268.0, 409.0, 723.0, 1347.0, 2793.0, 5840.0, 14165.0, 37479.0, 101855.0, 245701.0, 330502.0, 188330.0, 71994.0, 26521.0, 10560.0, 4455.0, 2136.0, 1069.0, 573.0, 364.0, 246.0, 167.0, 112.0, 71.0, 61.0, 54.0, 33.0, 22.0, 20.0, 20.0, 10.0, 7.0, 9.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0360107421875, -0.03482341766357422, -0.03363609313964844, -0.032448768615722656, -0.031261444091796875, -0.030074119567871094, -0.028886795043945312, -0.02769947052001953, -0.02651214599609375, -0.02532482147216797, -0.024137496948242188, -0.022950172424316406, -0.021762847900390625, -0.020575523376464844, -0.019388198852539062, -0.01820087432861328, -0.0170135498046875, -0.01582622528076172, -0.014638900756835938, -0.013451576232910156, -0.012264251708984375, -0.011076927185058594, -0.009889602661132812, -0.008702278137207031, -0.00751495361328125, -0.006327629089355469, -0.0051403045654296875, -0.003952980041503906, -0.002765655517578125, -0.0015783309936523438, -0.0003910064697265625, 0.0007963180541992188, 0.001983642578125, 0.0031709671020507812, 0.0043582916259765625, 0.005545616149902344, 0.006732940673828125, 0.007920265197753906, 0.009107589721679688, 0.010294914245605469, 0.01148223876953125, 0.012669563293457031, 0.013856887817382812, 0.015044212341308594, 0.016231536865234375, 0.017418861389160156, 0.018606185913085938, 0.01979351043701172, 0.0209808349609375, 0.02216815948486328, 0.023355484008789062, 0.024542808532714844, 0.025730133056640625, 0.026917457580566406, 0.028104782104492188, 0.02929210662841797, 0.03047943115234375, 0.03166675567626953, 0.03285408020019531, 0.034041404724121094, 0.035228729248046875, 0.036416053771972656, 0.03760337829589844, 0.03879070281982422, 0.03997802734375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 4.0, 7.0, 6.0, 3.0, 5.0, 7.0, 12.0, 8.0, 18.0, 25.0, 26.0, 31.0, 28.0, 30.0, 34.0, 34.0, 36.0, 41.0, 45.0, 45.0, 37.0, 47.0, 58.0, 33.0, 43.0, 37.0, 40.0, 35.0, 25.0, 29.0, 20.0, 30.0, 26.0, 11.0, 15.0, 14.0, 10.0, 12.0, 12.0, 10.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061492919921875, -0.059255123138427734, -0.05701732635498047, -0.0547795295715332, -0.05254173278808594, -0.05030393600463867, -0.048066139221191406, -0.04582834243774414, -0.043590545654296875, -0.04135274887084961, -0.039114952087402344, -0.03687715530395508, -0.03463935852050781, -0.03240156173706055, -0.03016376495361328, -0.027925968170166016, -0.02568817138671875, -0.023450374603271484, -0.02121257781982422, -0.018974781036376953, -0.016736984252929688, -0.014499187469482422, -0.012261390686035156, -0.01002359390258789, -0.007785797119140625, -0.005548000335693359, -0.0033102035522460938, -0.0010724067687988281, 0.0011653900146484375, 0.003403186798095703, 0.005640983581542969, 0.007878780364990234, 0.0101165771484375, 0.012354373931884766, 0.014592170715332031, 0.016829967498779297, 0.019067764282226562, 0.021305561065673828, 0.023543357849121094, 0.02578115463256836, 0.028018951416015625, 0.03025674819946289, 0.032494544982910156, 0.03473234176635742, 0.03697013854980469, 0.03920793533325195, 0.04144573211669922, 0.043683528900146484, 0.04592132568359375, 0.048159122467041016, 0.05039691925048828, 0.05263471603393555, 0.05487251281738281, 0.05711030960083008, 0.059348106384277344, 0.06158590316772461, 0.06382369995117188, 0.06606149673461914, 0.0682992935180664, 0.07053709030151367, 0.07277488708496094, 0.0750126838684082, 0.07725048065185547, 0.07948827743530273, 0.08172607421875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 7.0, 5.0, 12.0, 14.0, 14.0, 20.0, 32.0, 50.0, 68.0, 134.0, 174.0, 313.0, 510.0, 945.0, 1855.0, 3583.0, 7554.0, 15500.0, 31864.0, 63272.0, 112596.0, 175421.0, 208697.0, 178444.0, 116200.0, 65507.0, 33484.0, 16506.0, 7772.0, 3802.0, 1829.0, 998.0, 569.0, 273.0, 206.0, 108.0, 77.0, 38.0, 41.0, 16.0, 9.0, 14.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.00844573974609375, -0.008208036422729492, -0.007970333099365234, -0.0077326297760009766, -0.007494926452636719, -0.007257223129272461, -0.007019519805908203, -0.006781816482543945, -0.0065441131591796875, -0.00630640983581543, -0.006068706512451172, -0.005831003189086914, -0.005593299865722656, -0.0053555965423583984, -0.005117893218994141, -0.004880189895629883, -0.004642486572265625, -0.004404783248901367, -0.004167079925537109, -0.0039293766021728516, -0.0036916732788085938, -0.003453969955444336, -0.003216266632080078, -0.0029785633087158203, -0.0027408599853515625, -0.0025031566619873047, -0.002265453338623047, -0.002027750015258789, -0.0017900466918945312, -0.0015523433685302734, -0.0013146400451660156, -0.0010769367218017578, -0.0008392333984375, -0.0006015300750732422, -0.0003638267517089844, -0.00012612342834472656, 0.00011157989501953125, 0.00034928321838378906, 0.0005869865417480469, 0.0008246898651123047, 0.0010623931884765625, 0.0013000965118408203, 0.0015377998352050781, 0.001775503158569336, 0.0020132064819335938, 0.0022509098052978516, 0.0024886131286621094, 0.002726316452026367, 0.002964019775390625, 0.003201723098754883, 0.0034394264221191406, 0.0036771297454833984, 0.003914833068847656, 0.004152536392211914, 0.004390239715576172, 0.00462794303894043, 0.0048656463623046875, 0.005103349685668945, 0.005341053009033203, 0.005578756332397461, 0.005816459655761719, 0.0060541629791259766, 0.006291866302490234, 0.006529569625854492, 0.00676727294921875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 5.0, 4.0, 4.0, 8.0, 10.0, 7.0, 5.0, 17.0, 8.0, 33.0, 14.0, 26.0, 15.0, 32.0, 15.0, 52.0, 35.0, 52.0, 39.0, 67.0, 32.0, 36.0, 69.0, 27.0, 58.0, 41.0, 46.0, 21.0, 47.0, 19.0, 38.0, 14.0, 33.0, 11.0, 21.0, 6.0, 10.0, 8.0, 3.0, 3.0, 3.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7418136596679688e-06, -2.6542693376541138e-06, -2.566725015640259e-06, -2.479180693626404e-06, -2.391636371612549e-06, -2.304092049598694e-06, -2.216547727584839e-06, -2.129003405570984e-06, -2.041459083557129e-06, -1.953914761543274e-06, -1.866370439529419e-06, -1.778826117515564e-06, -1.691281795501709e-06, -1.603737473487854e-06, -1.516193151473999e-06, -1.428648829460144e-06, -1.341104507446289e-06, -1.253560185432434e-06, -1.166015863418579e-06, -1.0784715414047241e-06, -9.909272193908691e-07, -9.033828973770142e-07, -8.158385753631592e-07, -7.282942533493042e-07, -6.407499313354492e-07, -5.532056093215942e-07, -4.6566128730773926e-07, -3.781169652938843e-07, -2.905726432800293e-07, -2.0302832126617432e-07, -1.1548399925231934e-07, -2.7939677238464355e-08, 5.960464477539063e-08, 1.471489667892456e-07, 2.3469328880310059e-07, 3.2223761081695557e-07, 4.0978193283081055e-07, 4.973262548446655e-07, 5.848705768585205e-07, 6.724148988723755e-07, 7.599592208862305e-07, 8.475035429000854e-07, 9.350478649139404e-07, 1.0225921869277954e-06, 1.1101365089416504e-06, 1.1976808309555054e-06, 1.2852251529693604e-06, 1.3727694749832153e-06, 1.4603137969970703e-06, 1.5478581190109253e-06, 1.6354024410247803e-06, 1.7229467630386353e-06, 1.8104910850524902e-06, 1.8980354070663452e-06, 1.9855797290802e-06, 2.073124051094055e-06, 2.16066837310791e-06, 2.248212695121765e-06, 2.33575701713562e-06, 2.423301339149475e-06, 2.51084566116333e-06, 2.598389983177185e-06, 2.68593430519104e-06, 2.773478627204895e-06, 2.86102294921875e-06]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 9.0, 1.0, 8.0, 13.0, 21.0, 22.0, 35.0, 66.0, 70.0, 137.0, 233.0, 375.0, 697.0, 1426.0, 2663.0, 6037.0, 13660.0, 29688.0, 61352.0, 115427.0, 183809.0, 217865.0, 182996.0, 115495.0, 61857.0, 29340.0, 13427.0, 6042.0, 2761.0, 1323.0, 722.0, 378.0, 216.0, 121.0, 79.0, 57.0, 44.0, 31.0, 21.0, 17.0, 5.0, 6.0, 6.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.006999969482421875, -0.006745398044586182, -0.006490826606750488, -0.006236255168914795, -0.0059816837310791016, -0.005727112293243408, -0.005472540855407715, -0.0052179694175720215, -0.004963397979736328, -0.004708826541900635, -0.004454255104064941, -0.004199683666229248, -0.003945112228393555, -0.0036905407905578613, -0.003435969352722168, -0.0031813979148864746, -0.0029268264770507812, -0.002672255039215088, -0.0024176836013793945, -0.002163112163543701, -0.0019085407257080078, -0.0016539692878723145, -0.001399397850036621, -0.0011448264122009277, -0.0008902549743652344, -0.000635683536529541, -0.00038111209869384766, -0.0001265406608581543, 0.00012803077697753906, 0.0003826022148132324, 0.0006371736526489258, 0.0008917450904846191, 0.0011463165283203125, 0.0014008879661560059, 0.0016554594039916992, 0.0019100308418273926, 0.002164602279663086, 0.0024191737174987793, 0.0026737451553344727, 0.002928316593170166, 0.0031828880310058594, 0.0034374594688415527, 0.003692030906677246, 0.0039466023445129395, 0.004201173782348633, 0.004455745220184326, 0.0047103166580200195, 0.004964888095855713, 0.005219459533691406, 0.0054740309715271, 0.005728602409362793, 0.005983173847198486, 0.00623774528503418, 0.006492316722869873, 0.006746888160705566, 0.00700145959854126, 0.007256031036376953, 0.0075106024742126465, 0.00776517391204834, 0.008019745349884033, 0.008274316787719727, 0.00852888822555542, 0.008783459663391113, 0.009038031101226807, 0.0092926025390625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 5.0, 13.0, 9.0, 10.0, 7.0, 18.0, 13.0, 26.0, 24.0, 26.0, 31.0, 41.0, 43.0, 39.0, 52.0, 49.0, 41.0, 52.0, 42.0, 53.0, 51.0, 60.0, 33.0, 38.0, 32.0, 28.0, 33.0, 26.0, 15.0, 15.0, 8.0, 11.0, 12.0, 5.0, 4.0, 5.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.009246826171875, -0.008944034576416016, -0.008641242980957031, -0.008338451385498047, -0.008035659790039062, -0.007732868194580078, -0.007430076599121094, -0.007127285003662109, -0.006824493408203125, -0.006521701812744141, -0.006218910217285156, -0.005916118621826172, -0.0056133270263671875, -0.005310535430908203, -0.005007743835449219, -0.004704952239990234, -0.00440216064453125, -0.004099369049072266, -0.0037965774536132812, -0.003493785858154297, -0.0031909942626953125, -0.002888202667236328, -0.0025854110717773438, -0.0022826194763183594, -0.001979827880859375, -0.0016770362854003906, -0.0013742446899414062, -0.0010714530944824219, -0.0007686614990234375, -0.0004658699035644531, -0.00016307830810546875, 0.00013971328735351562, 0.0004425048828125, 0.0007452964782714844, 0.0010480880737304688, 0.0013508796691894531, 0.0016536712646484375, 0.001956462860107422, 0.0022592544555664062, 0.0025620460510253906, 0.002864837646484375, 0.0031676292419433594, 0.0034704208374023438, 0.003773212432861328, 0.0040760040283203125, 0.004378795623779297, 0.004681587219238281, 0.004984378814697266, 0.00528717041015625, 0.005589962005615234, 0.005892753601074219, 0.006195545196533203, 0.0064983367919921875, 0.006801128387451172, 0.007103919982910156, 0.007406711578369141, 0.007709503173828125, 0.00801229476928711, 0.008315086364746094, 0.008617877960205078, 0.008920669555664062, 0.009223461151123047, 0.009526252746582031, 0.009829044342041016, 0.0101318359375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 5.0, 3.0, 17.0, 18.0, 28.0, 70.0, 131.0, 177.0, 198.0, 168.0, 94.0, 42.0, 21.0, 13.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3125235140323639, -0.3045724034309387, -0.29662126302719116, -0.288670152425766, -0.2807190418243408, -0.27276793122291565, -0.2648167908191681, -0.2568656802177429, -0.24891456961631775, -0.24096344411373138, -0.2330123335123062, -0.22506120800971985, -0.21711009740829468, -0.2091589719057083, -0.20120784640312195, -0.19325673580169678, -0.1853056102991104, -0.17735448479652405, -0.16940337419509888, -0.1614522486925125, -0.15350113809108734, -0.14555001258850098, -0.1375989019870758, -0.12964777648448944, -0.12169665843248367, -0.1137455403804779, -0.10579442232847214, -0.09784330427646637, -0.08989217877388, -0.08194106817245483, -0.07398994266986847, -0.0660388246178627, -0.05808769166469574, -0.05013657361268997, -0.042185455560684204, -0.03423433378338814, -0.02628321573138237, -0.018332097679376602, -0.010380975902080536, -0.002429857850074768, 0.005521260201931, 0.013472379185259342, 0.021423498168587685, 0.0293746180832386, 0.03732573613524437, 0.04527685418725014, 0.053227975964546204, 0.06117909401655197, 0.06913021206855774, 0.07708133012056351, 0.08503244817256927, 0.09298357367515564, 0.10093468427658081, 0.10888580977916718, 0.11683692783117294, 0.12478804588317871, 0.13273915648460388, 0.14069028198719025, 0.14864139258861542, 0.15659251809120178, 0.16454362869262695, 0.17249475419521332, 0.18044587969779968, 0.18839699029922485, 0.19634811580181122]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 7.0, 9.0, 5.0, 8.0, 13.0, 16.0, 21.0, 18.0, 20.0, 17.0, 21.0, 29.0, 27.0, 30.0, 38.0, 33.0, 33.0, 39.0, 30.0, 53.0, 36.0, 49.0, 44.0, 31.0, 38.0, 22.0, 40.0, 36.0, 47.0, 36.0, 19.0, 19.0, 13.0, 17.0, 13.0, 19.0, 16.0, 10.0, 4.0, 6.0, 3.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15405374765396118, -0.1490592360496521, -0.14406472444534302, -0.13907021284103394, -0.13407570123672485, -0.12908117473125458, -0.1240866631269455, -0.11909215152263641, -0.11409763991832733, -0.10910312831401825, -0.10410861670970917, -0.09911409765481949, -0.0941195860505104, -0.08912507444620132, -0.08413055539131165, -0.07913604378700256, -0.07414153218269348, -0.0691470205783844, -0.06415250897407532, -0.05915798991918564, -0.054163478314876556, -0.049168966710567474, -0.044174451380968094, -0.03917993605136871, -0.03418542444705963, -0.0291909109801054, -0.02419639751315117, -0.019201884046196938, -0.014207370579242706, -0.009212857112288475, -0.004218343645334244, 0.0007761716842651367, 0.005770683288574219, 0.01076519675552845, 0.01575971022248268, 0.020754223689436913, 0.025748737156391144, 0.030743250623345375, 0.035737764090299606, 0.04073227941989899, 0.04572679102420807, 0.05072130262851715, 0.05571581795811653, 0.06071033328771591, 0.065704844892025, 0.07069935649633408, 0.07569387555122375, 0.08068838715553284, 0.08568289875984192, 0.090677410364151, 0.09567192196846008, 0.10066644102334976, 0.10566095262765884, 0.11065546423196793, 0.1156499832868576, 0.12064449489116669, 0.12563900649547577, 0.13063351809978485, 0.13562802970409393, 0.14062254130840302, 0.1456170678138733, 0.15061157941818237, 0.15560609102249146, 0.16060060262680054, 0.16559511423110962]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 12.0, 14.0, 23.0, 40.0, 73.0, 115.0, 215.0, 526.0, 1288.0, 4384.0, 24700.0, 326703.0, 2277803.0, 1419701.0, 118452.0, 14787.0, 3811.0, 857.0, 365.0, 184.0, 77.0, 60.0, 30.0, 26.0, 13.0, 10.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06549072265625, -0.06371212005615234, -0.06193351745605469, -0.06015491485595703, -0.058376312255859375, -0.05659770965576172, -0.05481910705566406, -0.053040504455566406, -0.05126190185546875, -0.049483299255371094, -0.04770469665527344, -0.04592609405517578, -0.044147491455078125, -0.04236888885498047, -0.04059028625488281, -0.038811683654785156, -0.0370330810546875, -0.035254478454589844, -0.03347587585449219, -0.03169727325439453, -0.029918670654296875, -0.02814006805419922, -0.026361465454101562, -0.024582862854003906, -0.02280426025390625, -0.021025657653808594, -0.019247055053710938, -0.01746845245361328, -0.015689849853515625, -0.013911247253417969, -0.012132644653320312, -0.010354042053222656, -0.008575439453125, -0.006796836853027344, -0.0050182342529296875, -0.0032396316528320312, -0.001461029052734375, 0.00031757354736328125, 0.0020961761474609375, 0.0038747787475585938, 0.00565338134765625, 0.007431983947753906, 0.009210586547851562, 0.010989189147949219, 0.012767791748046875, 0.014546394348144531, 0.016324996948242188, 0.018103599548339844, 0.0198822021484375, 0.021660804748535156, 0.023439407348632812, 0.02521800994873047, 0.026996612548828125, 0.02877521514892578, 0.030553817749023438, 0.032332420349121094, 0.03411102294921875, 0.035889625549316406, 0.03766822814941406, 0.03944683074951172, 0.041225433349609375, 0.04300403594970703, 0.04478263854980469, 0.046561241149902344, 0.04833984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 8.0, 10.0, 15.0, 18.0, 17.0, 23.0, 32.0, 42.0, 51.0, 58.0, 66.0, 57.0, 61.0, 57.0, 59.0, 82.0, 71.0, 56.0, 50.0, 40.0, 35.0, 24.0, 17.0, 10.0, 15.0, 11.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047515869140625, -0.046178340911865234, -0.04484081268310547, -0.0435032844543457, -0.04216575622558594, -0.04082822799682617, -0.039490699768066406, -0.03815317153930664, -0.036815643310546875, -0.03547811508178711, -0.034140586853027344, -0.03280305862426758, -0.03146553039550781, -0.030128002166748047, -0.02879047393798828, -0.027452945709228516, -0.02611541748046875, -0.024777889251708984, -0.02344036102294922, -0.022102832794189453, -0.020765304565429688, -0.019427776336669922, -0.018090248107910156, -0.01675271987915039, -0.015415191650390625, -0.01407766342163086, -0.012740135192871094, -0.011402606964111328, -0.010065078735351562, -0.008727550506591797, -0.007390022277832031, -0.006052494049072266, -0.0047149658203125, -0.0033774375915527344, -0.0020399093627929688, -0.0007023811340332031, 0.0006351470947265625, 0.001972675323486328, 0.0033102035522460938, 0.004647731781005859, 0.005985260009765625, 0.007322788238525391, 0.008660316467285156, 0.009997844696044922, 0.011335372924804688, 0.012672901153564453, 0.014010429382324219, 0.015347957611083984, 0.01668548583984375, 0.018023014068603516, 0.01936054229736328, 0.020698070526123047, 0.022035598754882812, 0.023373126983642578, 0.024710655212402344, 0.02604818344116211, 0.027385711669921875, 0.02872323989868164, 0.030060768127441406, 0.03139829635620117, 0.03273582458496094, 0.0340733528137207, 0.03541088104248047, 0.036748409271240234, 0.0380859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 15.0, 20.0, 18.0, 25.0, 36.0, 35.0, 49.0, 63.0, 111.0, 163.0, 286.0, 533.0, 1237.0, 3879.0, 16640.0, 116164.0, 1642542.0, 2224208.0, 159209.0, 21265.0, 4662.0, 1480.0, 631.0, 330.0, 182.0, 127.0, 108.0, 64.0, 46.0, 37.0, 24.0, 32.0, 13.0, 10.0, 10.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.050018310546875, -0.04823637008666992, -0.046454429626464844, -0.044672489166259766, -0.04289054870605469, -0.04110860824584961, -0.03932666778564453, -0.03754472732543945, -0.035762786865234375, -0.0339808464050293, -0.03219890594482422, -0.03041696548461914, -0.028635025024414062, -0.026853084564208984, -0.025071144104003906, -0.023289203643798828, -0.02150726318359375, -0.019725322723388672, -0.017943382263183594, -0.016161441802978516, -0.014379501342773438, -0.01259756088256836, -0.010815620422363281, -0.009033679962158203, -0.007251739501953125, -0.005469799041748047, -0.0036878585815429688, -0.0019059181213378906, -0.0001239776611328125, 0.0016579627990722656, 0.0034399032592773438, 0.005221843719482422, 0.0070037841796875, 0.008785724639892578, 0.010567665100097656, 0.012349605560302734, 0.014131546020507812, 0.01591348648071289, 0.01769542694091797, 0.019477367401123047, 0.021259307861328125, 0.023041248321533203, 0.02482318878173828, 0.02660512924194336, 0.028387069702148438, 0.030169010162353516, 0.031950950622558594, 0.03373289108276367, 0.03551483154296875, 0.03729677200317383, 0.039078712463378906, 0.040860652923583984, 0.04264259338378906, 0.04442453384399414, 0.04620647430419922, 0.0479884147644043, 0.049770355224609375, 0.05155229568481445, 0.05333423614501953, 0.05511617660522461, 0.05689811706542969, 0.058680057525634766, 0.060461997985839844, 0.06224393844604492, 0.06402587890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 1.0, 10.0, 1.0, 20.0, 9.0, 21.0, 35.0, 44.0, 74.0, 137.0, 218.0, 316.0, 547.0, 681.0, 662.0, 484.0, 274.0, 187.0, 123.0, 77.0, 42.0, 33.0, 30.0, 14.0, 9.0, 12.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.043212890625, -0.04154205322265625, -0.0398712158203125, -0.03820037841796875, -0.036529541015625, -0.03485870361328125, -0.0331878662109375, -0.03151702880859375, -0.02984619140625, -0.02817535400390625, -0.0265045166015625, -0.02483367919921875, -0.023162841796875, -0.02149200439453125, -0.0198211669921875, -0.01815032958984375, -0.0164794921875, -0.01480865478515625, -0.0131378173828125, -0.01146697998046875, -0.009796142578125, -0.00812530517578125, -0.0064544677734375, -0.00478363037109375, -0.00311279296875, -0.00144195556640625, 0.0002288818359375, 0.00189971923828125, 0.003570556640625, 0.00524139404296875, 0.0069122314453125, 0.00858306884765625, 0.01025390625, 0.01192474365234375, 0.0135955810546875, 0.01526641845703125, 0.016937255859375, 0.01860809326171875, 0.0202789306640625, 0.02194976806640625, 0.02362060546875, 0.02529144287109375, 0.0269622802734375, 0.02863311767578125, 0.030303955078125, 0.03197479248046875, 0.0336456298828125, 0.03531646728515625, 0.0369873046875, 0.03865814208984375, 0.0403289794921875, 0.04199981689453125, 0.043670654296875, 0.04534149169921875, 0.0470123291015625, 0.04868316650390625, 0.05035400390625, 0.05202484130859375, 0.0536956787109375, 0.05536651611328125, 0.057037353515625, 0.05870819091796875, 0.0603790283203125, 0.06204986572265625, 0.063720703125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 13.0, 18.0, 36.0, 76.0, 140.0, 188.0, 187.0, 151.0, 102.0, 45.0, 21.0, 5.0, 5.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37784871459007263, -0.36638322472572327, -0.3549177348613739, -0.3434522747993469, -0.33198678493499756, -0.3205212950706482, -0.30905580520629883, -0.29759031534194946, -0.2861248254776001, -0.27465933561325073, -0.26319384574890137, -0.251728355884552, -0.24026289582252502, -0.22879740595817566, -0.2173319160938263, -0.20586642622947693, -0.19440096616744995, -0.18293547630310059, -0.17147000133991241, -0.16000451147556305, -0.14853903651237488, -0.1370735466480255, -0.12560805678367615, -0.11414257436990738, -0.10267709195613861, -0.09121160954236984, -0.07974612712860107, -0.06828063726425171, -0.05681515485048294, -0.04534967243671417, -0.03388418257236481, -0.02241870015859604, -0.010953247547149658, 0.0005122367292642593, 0.011977721005678177, 0.023443207144737244, 0.03490868955850601, 0.04637417197227478, 0.057839661836624146, 0.06930514425039291, 0.08077062666416168, 0.09223610907793045, 0.10370159149169922, 0.11516708135604858, 0.12663257122039795, 0.13809804618358612, 0.14956353604793549, 0.16102901101112366, 0.17249450087547302, 0.1839599907398224, 0.19542546570301056, 0.20689095556735992, 0.2183564305305481, 0.22982192039489746, 0.24128741025924683, 0.2527529001235962, 0.26421838998794556, 0.2756838798522949, 0.2871493697166443, 0.29861485958099365, 0.31008031964302063, 0.32154580950737, 0.33301129937171936, 0.3444767892360687, 0.3559422492980957]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 7.0, 9.0, 7.0, 16.0, 13.0, 25.0, 27.0, 24.0, 42.0, 38.0, 36.0, 44.0, 37.0, 42.0, 47.0, 40.0, 34.0, 47.0, 47.0, 44.0, 41.0, 42.0, 46.0, 37.0, 32.0, 23.0, 28.0, 31.0, 21.0, 21.0, 10.0, 8.0, 10.0, 6.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.17667698860168457, -0.17145827412605286, -0.16623954474925995, -0.16102083027362823, -0.15580210089683533, -0.1505833864212036, -0.1453646719455719, -0.14014595746994019, -0.13492722809314728, -0.12970851361751556, -0.12448978424072266, -0.11927106976509094, -0.11405234783887863, -0.10883362591266632, -0.1036149114370346, -0.0983961895108223, -0.09317746758460999, -0.08795874565839767, -0.08274002373218536, -0.07752130925655365, -0.07230258733034134, -0.06708386540412903, -0.061865147203207016, -0.056646429002285004, -0.05142770707607269, -0.04620898514986038, -0.04099026694893837, -0.03577154874801636, -0.030552826821804047, -0.025334106758236885, -0.020115386694669724, -0.014896668493747711, -0.0096779465675354, -0.004459226503968239, 0.0007594935595989227, 0.005978213623166084, 0.011196933686733246, 0.016415653750300407, 0.02163437381386757, 0.02685309201478958, 0.03207181394100189, 0.0372905358672142, 0.042509254068136215, 0.04772797226905823, 0.05294669419527054, 0.05816541612148285, 0.06338413059711456, 0.06860285252332687, 0.07382157444953918, 0.0790402963757515, 0.0842590183019638, 0.08947773277759552, 0.09469645470380783, 0.09991517663002014, 0.10513389110565186, 0.11035261303186417, 0.11557133495807648, 0.12079005688428879, 0.1260087788105011, 0.1312274932861328, 0.13644620776176453, 0.14166493713855743, 0.14688365161418915, 0.15210238099098206, 0.15732109546661377]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 12.0, 11.0, 14.0, 26.0, 38.0, 37.0, 66.0, 78.0, 109.0, 196.0, 308.0, 538.0, 950.0, 1777.0, 3580.0, 7437.0, 15900.0, 35057.0, 78225.0, 162956.0, 255633.0, 236215.0, 134028.0, 62109.0, 27967.0, 12855.0, 5990.0, 2891.0, 1500.0, 798.0, 459.0, 273.0, 162.0, 110.0, 86.0, 46.0, 34.0, 21.0, 16.0, 8.0, 11.0, 7.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.027801513671875, -0.02680349349975586, -0.02580547332763672, -0.024807453155517578, -0.023809432983398438, -0.022811412811279297, -0.021813392639160156, -0.020815372467041016, -0.019817352294921875, -0.018819332122802734, -0.017821311950683594, -0.016823291778564453, -0.015825271606445312, -0.014827251434326172, -0.013829231262207031, -0.01283121109008789, -0.01183319091796875, -0.01083517074584961, -0.009837150573730469, -0.008839130401611328, -0.007841110229492188, -0.006843090057373047, -0.005845069885253906, -0.004847049713134766, -0.003849029541015625, -0.0028510093688964844, -0.0018529891967773438, -0.0008549690246582031, 0.0001430511474609375, 0.0011410713195800781, 0.0021390914916992188, 0.0031371116638183594, 0.0041351318359375, 0.005133152008056641, 0.006131172180175781, 0.007129192352294922, 0.008127212524414062, 0.009125232696533203, 0.010123252868652344, 0.011121273040771484, 0.012119293212890625, 0.013117313385009766, 0.014115333557128906, 0.015113353729248047, 0.016111373901367188, 0.017109394073486328, 0.01810741424560547, 0.01910543441772461, 0.02010345458984375, 0.02110147476196289, 0.02209949493408203, 0.023097515106201172, 0.024095535278320312, 0.025093555450439453, 0.026091575622558594, 0.027089595794677734, 0.028087615966796875, 0.029085636138916016, 0.030083656311035156, 0.031081676483154297, 0.03207969665527344, 0.03307771682739258, 0.03407573699951172, 0.03507375717163086, 0.03607177734375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 15.0, 13.0, 20.0, 22.0, 32.0, 38.0, 49.0, 48.0, 61.0, 57.0, 59.0, 77.0, 64.0, 61.0, 69.0, 67.0, 55.0, 41.0, 38.0, 32.0, 18.0, 26.0, 13.0, 13.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05535888671875, -0.053945064544677734, -0.05253124237060547, -0.0511174201965332, -0.04970359802246094, -0.04828977584838867, -0.046875953674316406, -0.04546213150024414, -0.044048309326171875, -0.04263448715209961, -0.041220664978027344, -0.03980684280395508, -0.03839302062988281, -0.03697919845581055, -0.03556537628173828, -0.034151554107666016, -0.03273773193359375, -0.031323909759521484, -0.02991008758544922, -0.028496265411376953, -0.027082443237304688, -0.025668621063232422, -0.024254798889160156, -0.02284097671508789, -0.021427154541015625, -0.02001333236694336, -0.018599510192871094, -0.017185688018798828, -0.015771865844726562, -0.014358043670654297, -0.012944221496582031, -0.011530399322509766, -0.0101165771484375, -0.008702754974365234, -0.007288932800292969, -0.005875110626220703, -0.0044612884521484375, -0.003047466278076172, -0.0016336441040039062, -0.00021982192993164062, 0.001194000244140625, 0.0026078224182128906, 0.004021644592285156, 0.005435466766357422, 0.0068492889404296875, 0.008263111114501953, 0.009676933288574219, 0.011090755462646484, 0.01250457763671875, 0.013918399810791016, 0.015332221984863281, 0.016746044158935547, 0.018159866333007812, 0.019573688507080078, 0.020987510681152344, 0.02240133285522461, 0.023815155029296875, 0.02522897720336914, 0.026642799377441406, 0.028056621551513672, 0.029470443725585938, 0.030884265899658203, 0.03229808807373047, 0.033711910247802734, 0.035125732421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 8.0, 8.0, 7.0, 16.0, 15.0, 44.0, 49.0, 79.0, 118.0, 185.0, 262.0, 460.0, 844.0, 1763.0, 3943.0, 9757.0, 25965.0, 73774.0, 205224.0, 358280.0, 232522.0, 85619.0, 29740.0, 11098.0, 4573.0, 1957.0, 914.0, 491.0, 308.0, 170.0, 120.0, 80.0, 50.0, 37.0, 21.0, 14.0, 14.0, 7.0, 4.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.053131103515625, -0.05167818069458008, -0.050225257873535156, -0.048772335052490234, -0.04731941223144531, -0.04586648941040039, -0.04441356658935547, -0.04296064376831055, -0.041507720947265625, -0.0400547981262207, -0.03860187530517578, -0.03714895248413086, -0.03569602966308594, -0.034243106842041016, -0.032790184020996094, -0.03133726119995117, -0.02988433837890625, -0.028431415557861328, -0.026978492736816406, -0.025525569915771484, -0.024072647094726562, -0.02261972427368164, -0.02116680145263672, -0.019713878631591797, -0.018260955810546875, -0.016808032989501953, -0.015355110168457031, -0.01390218734741211, -0.012449264526367188, -0.010996341705322266, -0.009543418884277344, -0.008090496063232422, -0.0066375732421875, -0.005184650421142578, -0.0037317276000976562, -0.0022788047790527344, -0.0008258819580078125, 0.0006270408630371094, 0.0020799636840820312, 0.003532886505126953, 0.004985809326171875, 0.006438732147216797, 0.007891654968261719, 0.00934457778930664, 0.010797500610351562, 0.012250423431396484, 0.013703346252441406, 0.015156269073486328, 0.01660919189453125, 0.018062114715576172, 0.019515037536621094, 0.020967960357666016, 0.022420883178710938, 0.02387380599975586, 0.02532672882080078, 0.026779651641845703, 0.028232574462890625, 0.029685497283935547, 0.03113842010498047, 0.03259134292602539, 0.03404426574707031, 0.035497188568115234, 0.036950111389160156, 0.03840303421020508, 0.03985595703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 7.0, 9.0, 11.0, 10.0, 15.0, 21.0, 14.0, 26.0, 44.0, 29.0, 35.0, 50.0, 34.0, 55.0, 33.0, 43.0, 54.0, 60.0, 51.0, 44.0, 61.0, 45.0, 40.0, 29.0, 31.0, 31.0, 18.0, 21.0, 20.0, 17.0, 10.0, 9.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.09844970703125, -0.0955953598022461, -0.09274101257324219, -0.08988666534423828, -0.08703231811523438, -0.08417797088623047, -0.08132362365722656, -0.07846927642822266, -0.07561492919921875, -0.07276058197021484, -0.06990623474121094, -0.06705188751220703, -0.06419754028320312, -0.06134319305419922, -0.05848884582519531, -0.055634498596191406, -0.0527801513671875, -0.049925804138183594, -0.04707145690917969, -0.04421710968017578, -0.041362762451171875, -0.03850841522216797, -0.03565406799316406, -0.032799720764160156, -0.02994537353515625, -0.027091026306152344, -0.024236679077148438, -0.02138233184814453, -0.018527984619140625, -0.01567363739013672, -0.012819290161132812, -0.009964942932128906, -0.007110595703125, -0.004256248474121094, -0.0014019012451171875, 0.0014524459838867188, 0.004306793212890625, 0.007161140441894531, 0.010015487670898438, 0.012869834899902344, 0.01572418212890625, 0.018578529357910156, 0.021432876586914062, 0.02428722381591797, 0.027141571044921875, 0.02999591827392578, 0.03285026550292969, 0.035704612731933594, 0.0385589599609375, 0.041413307189941406, 0.04426765441894531, 0.04712200164794922, 0.049976348876953125, 0.05283069610595703, 0.05568504333496094, 0.058539390563964844, 0.06139373779296875, 0.06424808502197266, 0.06710243225097656, 0.06995677947998047, 0.07281112670898438, 0.07566547393798828, 0.07851982116699219, 0.0813741683959961, 0.084228515625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 3.0, 8.0, 10.0, 14.0, 36.0, 70.0, 92.0, 180.0, 315.0, 747.0, 1644.0, 3985.0, 10493.0, 28682.0, 84089.0, 235390.0, 368145.0, 204137.0, 70827.0, 24653.0, 8971.0, 3388.0, 1396.0, 591.0, 290.0, 172.0, 87.0, 55.0, 25.0, 21.0, 11.0, 11.0, 4.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0135345458984375, -0.013089656829833984, -0.012644767761230469, -0.012199878692626953, -0.011754989624023438, -0.011310100555419922, -0.010865211486816406, -0.01042032241821289, -0.009975433349609375, -0.00953054428100586, -0.009085655212402344, -0.008640766143798828, -0.008195877075195312, -0.007750988006591797, -0.007306098937988281, -0.006861209869384766, -0.00641632080078125, -0.005971431732177734, -0.005526542663574219, -0.005081653594970703, -0.0046367645263671875, -0.004191875457763672, -0.0037469863891601562, -0.0033020973205566406, -0.002857208251953125, -0.0024123191833496094, -0.0019674301147460938, -0.0015225410461425781, -0.0010776519775390625, -0.0006327629089355469, -0.00018787384033203125, 0.0002570152282714844, 0.000701904296875, 0.0011467933654785156, 0.0015916824340820312, 0.002036571502685547, 0.0024814605712890625, 0.002926349639892578, 0.0033712387084960938, 0.0038161277770996094, 0.004261016845703125, 0.004705905914306641, 0.005150794982910156, 0.005595684051513672, 0.0060405731201171875, 0.006485462188720703, 0.006930351257324219, 0.007375240325927734, 0.00782012939453125, 0.008265018463134766, 0.008709907531738281, 0.009154796600341797, 0.009599685668945312, 0.010044574737548828, 0.010489463806152344, 0.01093435287475586, 0.011379241943359375, 0.01182413101196289, 0.012269020080566406, 0.012713909149169922, 0.013158798217773438, 0.013603687286376953, 0.014048576354980469, 0.014493465423583984, 0.0149383544921875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 4.0, 0.0, 2.0, 5.0, 3.0, 4.0, 15.0, 11.0, 16.0, 39.0, 24.0, 25.0, 56.0, 37.0, 71.0, 54.0, 47.0, 103.0, 57.0, 52.0, 82.0, 45.0, 41.0, 40.0, 30.0, 28.0, 16.0, 23.0, 8.0, 14.0, 10.0, 11.0, 5.0, 6.0, 4.0, 2.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.351139068603516e-06, -4.210509359836578e-06, -4.069879651069641e-06, -3.929249942302704e-06, -3.7886202335357666e-06, -3.6479905247688293e-06, -3.507360816001892e-06, -3.366731107234955e-06, -3.2261013984680176e-06, -3.0854716897010803e-06, -2.944841980934143e-06, -2.804212272167206e-06, -2.6635825634002686e-06, -2.5229528546333313e-06, -2.382323145866394e-06, -2.2416934370994568e-06, -2.1010637283325195e-06, -1.9604340195655823e-06, -1.819804310798645e-06, -1.6791746020317078e-06, -1.5385448932647705e-06, -1.3979151844978333e-06, -1.257285475730896e-06, -1.1166557669639587e-06, -9.760260581970215e-07, -8.353963494300842e-07, -6.94766640663147e-07, -5.541369318962097e-07, -4.1350722312927246e-07, -2.728775143623352e-07, -1.3224780559539795e-07, 8.381903171539307e-09, 1.4901161193847656e-07, 2.896413207054138e-07, 4.302710294723511e-07, 5.709007382392883e-07, 7.115304470062256e-07, 8.521601557731628e-07, 9.927898645401e-07, 1.1334195733070374e-06, 1.2740492820739746e-06, 1.4146789908409119e-06, 1.5553086996078491e-06, 1.6959384083747864e-06, 1.8365681171417236e-06, 1.977197825908661e-06, 2.117827534675598e-06, 2.2584572434425354e-06, 2.3990869522094727e-06, 2.53971666097641e-06, 2.680346369743347e-06, 2.8209760785102844e-06, 2.9616057872772217e-06, 3.102235496044159e-06, 3.242865204811096e-06, 3.3834949135780334e-06, 3.5241246223449707e-06, 3.664754331111908e-06, 3.8053840398788452e-06, 3.9460137486457825e-06, 4.08664345741272e-06, 4.227273166179657e-06, 4.367902874946594e-06, 4.5085325837135315e-06, 4.649162292480469e-06]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 11.0, 10.0, 7.0, 19.0, 19.0, 28.0, 29.0, 66.0, 81.0, 137.0, 238.0, 409.0, 729.0, 1373.0, 2593.0, 5294.0, 10665.0, 22303.0, 47005.0, 99608.0, 191974.0, 261463.0, 201260.0, 106119.0, 50307.0, 23738.0, 11436.0, 5521.0, 2769.0, 1423.0, 789.0, 432.0, 226.0, 159.0, 98.0, 72.0, 54.0, 32.0, 18.0, 13.0, 11.0, 6.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0107269287109375, -0.010416388511657715, -0.01010584831237793, -0.009795308113098145, -0.00948476791381836, -0.009174227714538574, -0.008863687515258789, -0.008553147315979004, -0.008242607116699219, -0.007932066917419434, -0.0076215267181396484, -0.007310986518859863, -0.007000446319580078, -0.006689906120300293, -0.006379365921020508, -0.006068825721740723, -0.0057582855224609375, -0.005447745323181152, -0.005137205123901367, -0.004826664924621582, -0.004516124725341797, -0.004205584526062012, -0.0038950443267822266, -0.0035845041275024414, -0.0032739639282226562, -0.002963423728942871, -0.002652883529663086, -0.0023423433303833008, -0.0020318031311035156, -0.0017212629318237305, -0.0014107227325439453, -0.0011001825332641602, -0.000789642333984375, -0.00047910213470458984, -0.0001685619354248047, 0.00014197826385498047, 0.0004525184631347656, 0.0007630586624145508, 0.001073598861694336, 0.001384139060974121, 0.0016946792602539062, 0.0020052194595336914, 0.0023157596588134766, 0.0026262998580932617, 0.002936840057373047, 0.003247380256652832, 0.003557920455932617, 0.0038684606552124023, 0.0041790008544921875, 0.004489541053771973, 0.004800081253051758, 0.005110621452331543, 0.005421161651611328, 0.005731701850891113, 0.0060422420501708984, 0.006352782249450684, 0.006663322448730469, 0.006973862648010254, 0.007284402847290039, 0.007594943046569824, 0.00790548324584961, 0.008216023445129395, 0.00852656364440918, 0.008837103843688965, 0.00914764404296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 5.0, 4.0, 2.0, 5.0, 5.0, 6.0, 11.0, 7.0, 14.0, 20.0, 19.0, 13.0, 36.0, 25.0, 40.0, 41.0, 50.0, 44.0, 62.0, 67.0, 62.0, 48.0, 49.0, 45.0, 49.0, 33.0, 45.0, 34.0, 25.0, 26.0, 26.0, 16.0, 13.0, 5.0, 6.0, 11.0, 8.0, 6.0, 6.0, 3.0, 5.0, 6.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.01210784912109375, -0.011771440505981445, -0.01143503189086914, -0.011098623275756836, -0.010762214660644531, -0.010425806045532227, -0.010089397430419922, -0.009752988815307617, -0.009416580200195312, -0.009080171585083008, -0.008743762969970703, -0.008407354354858398, -0.008070945739746094, -0.007734537124633789, -0.007398128509521484, -0.00706171989440918, -0.006725311279296875, -0.00638890266418457, -0.006052494049072266, -0.005716085433959961, -0.005379676818847656, -0.0050432682037353516, -0.004706859588623047, -0.004370450973510742, -0.0040340423583984375, -0.003697633743286133, -0.003361225128173828, -0.0030248165130615234, -0.0026884078979492188, -0.002351999282836914, -0.0020155906677246094, -0.0016791820526123047, -0.0013427734375, -0.0010063648223876953, -0.0006699562072753906, -0.00033354759216308594, 2.86102294921875e-06, 0.00033926963806152344, 0.0006756782531738281, 0.0010120868682861328, 0.0013484954833984375, 0.0016849040985107422, 0.002021312713623047, 0.0023577213287353516, 0.0026941299438476562, 0.003030538558959961, 0.0033669471740722656, 0.0037033557891845703, 0.004039764404296875, 0.00437617301940918, 0.004712581634521484, 0.005048990249633789, 0.005385398864746094, 0.0057218074798583984, 0.006058216094970703, 0.006394624710083008, 0.0067310333251953125, 0.007067441940307617, 0.007403850555419922, 0.0077402591705322266, 0.008076667785644531, 0.008413076400756836, 0.00874948501586914, 0.009085893630981445, 0.00942230224609375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 8.0, 7.0, 13.0, 37.0, 56.0, 121.0, 160.0, 174.0, 159.0, 109.0, 78.0, 30.0, 18.0, 11.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30164480209350586, -0.29292383790016174, -0.2842028737068176, -0.2754818797111511, -0.266760915517807, -0.2580399513244629, -0.24931897222995758, -0.24059799313545227, -0.23187702894210815, -0.22315606474876404, -0.21443508565425873, -0.20571410655975342, -0.1969931423664093, -0.18827217817306519, -0.17955119907855988, -0.17083021998405457, -0.16210925579071045, -0.15338829159736633, -0.14466731250286102, -0.1359463334083557, -0.1272253692150116, -0.11850439757108688, -0.10978342592716217, -0.10106245428323746, -0.09234148263931274, -0.08362051099538803, -0.07489953935146332, -0.0661785677075386, -0.05745759606361389, -0.04873662441968918, -0.040015652775764465, -0.03129468113183975, -0.02257367968559265, -0.013852708041667938, -0.005131736397743225, 0.003589235246181488, 0.012310206890106201, 0.021031178534030914, 0.029752150177955627, 0.03847312182188034, 0.047194093465805054, 0.05591506510972977, 0.06463603675365448, 0.0733570083975792, 0.0820779800415039, 0.09079895168542862, 0.09951992332935333, 0.10824089497327805, 0.11696186661720276, 0.12568283081054688, 0.13440380990505219, 0.1431247889995575, 0.1518457531929016, 0.16056671738624573, 0.16928769648075104, 0.17800867557525635, 0.18672963976860046, 0.19545060396194458, 0.2041715830564499, 0.2128925621509552, 0.22161352634429932, 0.23033449053764343, 0.23905546963214874, 0.24777644872665405, 0.25649741291999817]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 0.0, 5.0, 9.0, 11.0, 16.0, 17.0, 13.0, 10.0, 13.0, 20.0, 16.0, 15.0, 21.0, 29.0, 33.0, 26.0, 39.0, 34.0, 45.0, 42.0, 43.0, 45.0, 40.0, 40.0, 45.0, 40.0, 42.0, 34.0, 36.0, 31.0, 21.0, 26.0, 27.0, 14.0, 17.0, 11.0, 20.0, 12.0, 12.0, 9.0, 9.0, 7.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1990005373954773, -0.19328947365283966, -0.18757840991020203, -0.1818673461675644, -0.17615628242492676, -0.17044521868228912, -0.1647341549396515, -0.15902310609817505, -0.15331202745437622, -0.1476009637117386, -0.14188989996910095, -0.13617883622646332, -0.13046777248382568, -0.12475670874118805, -0.11904565244913101, -0.11333458870649338, -0.10762353241443634, -0.1019124686717987, -0.09620140492916107, -0.09049034118652344, -0.0847792774438858, -0.07906821370124817, -0.07335715740919113, -0.0676460936665535, -0.06193502992391586, -0.05622396618127823, -0.050512902438640594, -0.04480184242129326, -0.039090778678655624, -0.03337971493601799, -0.027668654918670654, -0.02195759117603302, -0.016246527433395386, -0.010535464622080326, -0.004824401810765266, 0.0008866600692272186, 0.006597723811864853, 0.012308787554502487, 0.018019847571849823, 0.023730911314487457, 0.02944197505712509, 0.035153038799762726, 0.04086410254240036, 0.046575162559747696, 0.05228622630238533, 0.057997290045022964, 0.0637083500623703, 0.06941941380500793, 0.07513047754764557, 0.0808415412902832, 0.08655260503292084, 0.09226366877555847, 0.0979747325181961, 0.10368579626083374, 0.10939685255289078, 0.11510791629552841, 0.12081898003816605, 0.12653003633022308, 0.13224110007286072, 0.13795216381549835, 0.143663227558136, 0.14937429130077362, 0.15508535504341125, 0.1607964187860489, 0.16650748252868652]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 11.0, 7.0, 11.0, 20.0, 32.0, 34.0, 55.0, 92.0, 131.0, 201.0, 358.0, 608.0, 1184.0, 2270.0, 4973.0, 10634.0, 24572.0, 63001.0, 156527.0, 354227.0, 669041.0, 936702.0, 890229.0, 586593.0, 283801.0, 119231.0, 47072.0, 20402.0, 10547.0, 5935.0, 2984.0, 1344.0, 611.0, 319.0, 196.0, 131.0, 60.0, 37.0, 27.0, 23.0, 14.0, 9.0, 5.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0198822021484375, -0.01923823356628418, -0.01859426498413086, -0.01795029640197754, -0.01730632781982422, -0.0166623592376709, -0.016018390655517578, -0.015374422073364258, -0.014730453491210938, -0.014086484909057617, -0.013442516326904297, -0.012798547744750977, -0.012154579162597656, -0.011510610580444336, -0.010866641998291016, -0.010222673416137695, -0.009578704833984375, -0.008934736251831055, -0.008290767669677734, -0.007646799087524414, -0.007002830505371094, -0.0063588619232177734, -0.005714893341064453, -0.005070924758911133, -0.0044269561767578125, -0.003782987594604492, -0.003139019012451172, -0.0024950504302978516, -0.0018510818481445312, -0.001207113265991211, -0.0005631446838378906, 8.082389831542969e-05, 0.00072479248046875, 0.0013687610626220703, 0.0020127296447753906, 0.002656698226928711, 0.0033006668090820312, 0.0039446353912353516, 0.004588603973388672, 0.005232572555541992, 0.0058765411376953125, 0.006520509719848633, 0.007164478302001953, 0.0078084468841552734, 0.008452415466308594, 0.009096384048461914, 0.009740352630615234, 0.010384321212768555, 0.011028289794921875, 0.011672258377075195, 0.012316226959228516, 0.012960195541381836, 0.013604164123535156, 0.014248132705688477, 0.014892101287841797, 0.015536069869995117, 0.016180038452148438, 0.016824007034301758, 0.017467975616455078, 0.0181119441986084, 0.01875591278076172, 0.01939988136291504, 0.02004384994506836, 0.02068781852722168, 0.021331787109375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 8.0, 9.0, 12.0, 9.0, 17.0, 22.0, 21.0, 45.0, 52.0, 44.0, 55.0, 43.0, 53.0, 71.0, 56.0, 58.0, 63.0, 47.0, 53.0, 47.0, 48.0, 29.0, 34.0, 21.0, 18.0, 13.0, 8.0, 12.0, 6.0, 3.0, 12.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041839599609375, -0.040592193603515625, -0.03934478759765625, -0.038097381591796875, -0.0368499755859375, -0.035602569580078125, -0.03435516357421875, -0.033107757568359375, -0.0318603515625, -0.030612945556640625, -0.02936553955078125, -0.028118133544921875, -0.0268707275390625, -0.025623321533203125, -0.02437591552734375, -0.023128509521484375, -0.021881103515625, -0.020633697509765625, -0.01938629150390625, -0.018138885498046875, -0.0168914794921875, -0.015644073486328125, -0.01439666748046875, -0.013149261474609375, -0.01190185546875, -0.010654449462890625, -0.00940704345703125, -0.008159637451171875, -0.0069122314453125, -0.005664825439453125, -0.00441741943359375, -0.003170013427734375, -0.001922607421875, -0.000675201416015625, 0.00057220458984375, 0.001819610595703125, 0.0030670166015625, 0.004314422607421875, 0.00556182861328125, 0.006809234619140625, 0.008056640625, 0.009304046630859375, 0.01055145263671875, 0.011798858642578125, 0.0130462646484375, 0.014293670654296875, 0.01554107666015625, 0.016788482666015625, 0.018035888671875, 0.019283294677734375, 0.02053070068359375, 0.021778106689453125, 0.0230255126953125, 0.024272918701171875, 0.02552032470703125, 0.026767730712890625, 0.02801513671875, 0.029262542724609375, 0.03050994873046875, 0.031757354736328125, 0.0330047607421875, 0.034252166748046875, 0.03549957275390625, 0.036746978759765625, 0.037994384765625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 7.0, 3.0, 6.0, 10.0, 18.0, 15.0, 18.0, 25.0, 28.0, 37.0, 64.0, 95.0, 110.0, 164.0, 277.0, 640.0, 2568.0, 23623.0, 893769.0, 3189473.0, 75962.0, 5391.0, 939.0, 369.0, 201.0, 128.0, 107.0, 76.0, 47.0, 20.0, 20.0, 14.0, 17.0, 14.0, 7.0, 8.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.09564208984375, -0.0925760269165039, -0.08950996398925781, -0.08644390106201172, -0.08337783813476562, -0.08031177520751953, -0.07724571228027344, -0.07417964935302734, -0.07111358642578125, -0.06804752349853516, -0.06498146057128906, -0.06191539764404297, -0.058849334716796875, -0.05578327178955078, -0.05271720886230469, -0.049651145935058594, -0.0465850830078125, -0.043519020080566406, -0.04045295715332031, -0.03738689422607422, -0.034320831298828125, -0.03125476837158203, -0.028188705444335938, -0.025122642517089844, -0.02205657958984375, -0.018990516662597656, -0.015924453735351562, -0.012858390808105469, -0.009792327880859375, -0.006726264953613281, -0.0036602020263671875, -0.0005941390991210938, 0.002471923828125, 0.005537986755371094, 0.008604049682617188, 0.011670112609863281, 0.014736175537109375, 0.01780223846435547, 0.020868301391601562, 0.023934364318847656, 0.02700042724609375, 0.030066490173339844, 0.03313255310058594, 0.03619861602783203, 0.039264678955078125, 0.04233074188232422, 0.04539680480957031, 0.048462867736816406, 0.0515289306640625, 0.054594993591308594, 0.05766105651855469, 0.06072711944580078, 0.06379318237304688, 0.06685924530029297, 0.06992530822753906, 0.07299137115478516, 0.07605743408203125, 0.07912349700927734, 0.08218955993652344, 0.08525562286376953, 0.08832168579101562, 0.09138774871826172, 0.09445381164550781, 0.0975198745727539, 0.1005859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 18.0, 32.0, 78.0, 158.0, 385.0, 876.0, 1221.0, 796.0, 293.0, 107.0, 54.0, 25.0, 15.0, 9.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11907958984375, -0.11571693420410156, -0.11235427856445312, -0.10899162292480469, -0.10562896728515625, -0.10226631164550781, -0.09890365600585938, -0.09554100036621094, -0.0921783447265625, -0.08881568908691406, -0.08545303344726562, -0.08209037780761719, -0.07872772216796875, -0.07536506652832031, -0.07200241088867188, -0.06863975524902344, -0.065277099609375, -0.06191444396972656, -0.058551788330078125, -0.05518913269042969, -0.05182647705078125, -0.04846382141113281, -0.045101165771484375, -0.04173851013183594, -0.0383758544921875, -0.03501319885253906, -0.031650543212890625, -0.028287887573242188, -0.02492523193359375, -0.021562576293945312, -0.018199920654296875, -0.014837265014648438, -0.011474609375, -0.008111953735351562, -0.004749298095703125, -0.0013866424560546875, 0.00197601318359375, 0.0053386688232421875, 0.008701324462890625, 0.012063980102539062, 0.0154266357421875, 0.018789291381835938, 0.022151947021484375, 0.025514602661132812, 0.02887725830078125, 0.03223991394042969, 0.035602569580078125, 0.03896522521972656, 0.042327880859375, 0.04569053649902344, 0.049053192138671875, 0.05241584777832031, 0.05577850341796875, 0.05914115905761719, 0.06250381469726562, 0.06586647033691406, 0.0692291259765625, 0.07259178161621094, 0.07595443725585938, 0.07931709289550781, 0.08267974853515625, 0.08604240417480469, 0.08940505981445312, 0.09276771545410156, 0.09613037109375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 15.0, 48.0, 157.0, 342.0, 283.0, 107.0, 33.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49309566617012024, -0.4704412817955017, -0.4477868676185608, -0.42513248324394226, -0.40247809886932373, -0.3798237144947052, -0.35716933012008667, -0.33451491594314575, -0.3118605315685272, -0.2892061471939087, -0.2665517330169678, -0.24389734864234924, -0.2212429642677307, -0.19858857989311218, -0.17593418061733246, -0.15327978134155273, -0.1306253969669342, -0.10797100514173508, -0.08531661331653595, -0.06266222149133682, -0.040007829666137695, -0.017353437840938568, 0.005300953984260559, 0.027955353260040283, 0.050609737634658813, 0.07326412945985794, 0.09591852128505707, 0.1185729131102562, 0.14122730493545532, 0.16388168931007385, 0.18653608858585358, 0.2091904878616333, 0.23184490203857422, 0.25449928641319275, 0.2771536707878113, 0.2998080849647522, 0.3224624693393707, 0.34511685371398926, 0.3677712678909302, 0.3904256522655487, 0.41308003664016724, 0.43573442101478577, 0.4583888053894043, 0.4810432195663452, 0.5036976337432861, 0.5263519883155823, 0.5490064024925232, 0.5716607570648193, 0.5943151712417603, 0.6169695854187012, 0.6396239399909973, 0.6622783541679382, 0.6849327087402344, 0.7075871229171753, 0.7302415370941162, 0.7528959512710571, 0.7755503058433533, 0.7982047200202942, 0.8208590745925903, 0.8435134887695312, 0.8661679029464722, 0.8888222575187683, 0.9114766716957092, 0.9341310262680054, 0.9567854404449463]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 10.0, 11.0, 8.0, 18.0, 19.0, 20.0, 18.0, 20.0, 26.0, 29.0, 31.0, 38.0, 43.0, 33.0, 46.0, 45.0, 60.0, 52.0, 51.0, 46.0, 42.0, 41.0, 41.0, 32.0, 31.0, 36.0, 33.0, 16.0, 21.0, 18.0, 21.0, 15.0, 6.0, 6.0, 7.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1588834524154663, -0.15380360186100006, -0.148723766207695, -0.14364391565322876, -0.1385640799999237, -0.13348422944545746, -0.1284043788909912, -0.12332453578710556, -0.11824469268321991, -0.11316484957933426, -0.10808500647544861, -0.10300515592098236, -0.09792531281709671, -0.09284546971321106, -0.08776561915874481, -0.08268577605485916, -0.07760593295097351, -0.07252608984708786, -0.06744624674320221, -0.06236639618873596, -0.05728655308485031, -0.05220670998096466, -0.04712686315178871, -0.04204701632261276, -0.03696717321872711, -0.03188733011484146, -0.026807483285665512, -0.021727638319134712, -0.016647793352603912, -0.011567948386073112, -0.006488103419542313, -0.0014082565903663635, 0.003671586513519287, 0.008751431480050087, 0.013831276446580887, 0.018911121413111687, 0.023990966379642487, 0.029070811346173286, 0.034150656312704086, 0.039230503141880035, 0.044310346245765686, 0.04939018934965134, 0.054470036178827286, 0.059549883008003235, 0.06462972611188889, 0.06970956921577454, 0.07478941977024078, 0.07986926287412643, 0.08494910597801208, 0.09002894908189774, 0.09510879218578339, 0.10018864274024963, 0.10526848584413528, 0.11034832894802094, 0.11542817950248718, 0.12050802260637283, 0.12558786571025848, 0.13066771626472473, 0.13574755191802979, 0.14082740247249603, 0.14590725302696228, 0.15098708868026733, 0.15606693923473358, 0.16114678978919983, 0.16622662544250488]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 10.0, 10.0, 15.0, 25.0, 32.0, 45.0, 76.0, 119.0, 159.0, 262.0, 421.0, 683.0, 1154.0, 2077.0, 3539.0, 6447.0, 11981.0, 24233.0, 50276.0, 108604.0, 204889.0, 258580.0, 188319.0, 95983.0, 44680.0, 21351.0, 10897.0, 5787.0, 3155.0, 1847.0, 1169.0, 598.0, 359.0, 270.0, 165.0, 104.0, 79.0, 50.0, 23.0, 18.0, 15.0, 11.0, 12.0, 1.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0243988037109375, -0.023540258407592773, -0.022681713104248047, -0.02182316780090332, -0.020964622497558594, -0.020106077194213867, -0.01924753189086914, -0.018388986587524414, -0.017530441284179688, -0.01667189598083496, -0.015813350677490234, -0.014954805374145508, -0.014096260070800781, -0.013237714767456055, -0.012379169464111328, -0.011520624160766602, -0.010662078857421875, -0.009803533554077148, -0.008944988250732422, -0.008086442947387695, -0.007227897644042969, -0.006369352340698242, -0.005510807037353516, -0.004652261734008789, -0.0037937164306640625, -0.002935171127319336, -0.0020766258239746094, -0.0012180805206298828, -0.00035953521728515625, 0.0004990100860595703, 0.0013575553894042969, 0.0022161006927490234, 0.00307464599609375, 0.0039331912994384766, 0.004791736602783203, 0.00565028190612793, 0.006508827209472656, 0.007367372512817383, 0.00822591781616211, 0.009084463119506836, 0.009943008422851562, 0.010801553726196289, 0.011660099029541016, 0.012518644332885742, 0.013377189636230469, 0.014235734939575195, 0.015094280242919922, 0.01595282554626465, 0.016811370849609375, 0.0176699161529541, 0.018528461456298828, 0.019387006759643555, 0.02024555206298828, 0.021104097366333008, 0.021962642669677734, 0.02282118797302246, 0.023679733276367188, 0.024538278579711914, 0.02539682388305664, 0.026255369186401367, 0.027113914489746094, 0.02797245979309082, 0.028831005096435547, 0.029689550399780273, 0.030548095703125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 9.0, 15.0, 19.0, 27.0, 16.0, 31.0, 38.0, 37.0, 57.0, 53.0, 73.0, 59.0, 80.0, 66.0, 69.0, 71.0, 51.0, 40.0, 44.0, 36.0, 26.0, 23.0, 15.0, 17.0, 12.0, 3.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051910400390625, -0.05041313171386719, -0.048915863037109375, -0.04741859436035156, -0.04592132568359375, -0.04442405700683594, -0.042926788330078125, -0.04142951965332031, -0.0399322509765625, -0.03843498229980469, -0.036937713623046875, -0.03544044494628906, -0.03394317626953125, -0.03244590759277344, -0.030948638916015625, -0.029451370239257812, -0.0279541015625, -0.026456832885742188, -0.024959564208984375, -0.023462295532226562, -0.02196502685546875, -0.020467758178710938, -0.018970489501953125, -0.017473220825195312, -0.0159759521484375, -0.014478683471679688, -0.012981414794921875, -0.011484146118164062, -0.00998687744140625, -0.008489608764648438, -0.006992340087890625, -0.0054950714111328125, -0.003997802734375, -0.0025005340576171875, -0.001003265380859375, 0.0004940032958984375, 0.00199127197265625, 0.0034885406494140625, 0.004985809326171875, 0.0064830780029296875, 0.0079803466796875, 0.009477615356445312, 0.010974884033203125, 0.012472152709960938, 0.01396942138671875, 0.015466690063476562, 0.016963958740234375, 0.018461227416992188, 0.01995849609375, 0.021455764770507812, 0.022953033447265625, 0.024450302124023438, 0.02594757080078125, 0.027444839477539062, 0.028942108154296875, 0.030439376831054688, 0.0319366455078125, 0.03343391418457031, 0.034931182861328125, 0.03642845153808594, 0.03792572021484375, 0.03942298889160156, 0.040920257568359375, 0.04241752624511719, 0.043914794921875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 1.0, 4.0, 4.0, 5.0, 4.0, 15.0, 9.0, 31.0, 19.0, 42.0, 77.0, 84.0, 133.0, 245.0, 389.0, 740.0, 1368.0, 2632.0, 5299.0, 11100.0, 23954.0, 55791.0, 139394.0, 293539.0, 285232.0, 131694.0, 52428.0, 23214.0, 10612.0, 5080.0, 2499.0, 1300.0, 635.0, 351.0, 229.0, 108.0, 92.0, 59.0, 48.0, 24.0, 28.0, 14.0, 11.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036163330078125, -0.03499555587768555, -0.033827781677246094, -0.03266000747680664, -0.03149223327636719, -0.030324459075927734, -0.02915668487548828, -0.027988910675048828, -0.026821136474609375, -0.025653362274169922, -0.02448558807373047, -0.023317813873291016, -0.022150039672851562, -0.02098226547241211, -0.019814491271972656, -0.018646717071533203, -0.01747894287109375, -0.016311168670654297, -0.015143394470214844, -0.01397562026977539, -0.012807846069335938, -0.011640071868896484, -0.010472297668457031, -0.009304523468017578, -0.008136749267578125, -0.006968975067138672, -0.005801200866699219, -0.004633426666259766, -0.0034656524658203125, -0.0022978782653808594, -0.0011301040649414062, 3.7670135498046875e-05, 0.0012054443359375, 0.002373218536376953, 0.0035409927368164062, 0.004708766937255859, 0.0058765411376953125, 0.007044315338134766, 0.008212089538574219, 0.009379863739013672, 0.010547637939453125, 0.011715412139892578, 0.012883186340332031, 0.014050960540771484, 0.015218734741210938, 0.01638650894165039, 0.017554283142089844, 0.018722057342529297, 0.01988983154296875, 0.021057605743408203, 0.022225379943847656, 0.02339315414428711, 0.024560928344726562, 0.025728702545166016, 0.02689647674560547, 0.028064250946044922, 0.029232025146484375, 0.030399799346923828, 0.03156757354736328, 0.032735347747802734, 0.03390312194824219, 0.03507089614868164, 0.036238670349121094, 0.03740644454956055, 0.03857421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 8.0, 2.0, 9.0, 9.0, 13.0, 11.0, 18.0, 20.0, 20.0, 22.0, 24.0, 23.0, 31.0, 30.0, 46.0, 23.0, 47.0, 49.0, 54.0, 57.0, 58.0, 40.0, 40.0, 35.0, 41.0, 27.0, 30.0, 37.0, 25.0, 19.0, 21.0, 25.0, 20.0, 13.0, 10.0, 7.0, 9.0, 9.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.09698486328125, -0.09441280364990234, -0.09184074401855469, -0.08926868438720703, -0.08669662475585938, -0.08412456512451172, -0.08155250549316406, -0.0789804458618164, -0.07640838623046875, -0.0738363265991211, -0.07126426696777344, -0.06869220733642578, -0.06612014770507812, -0.06354808807373047, -0.06097602844238281, -0.058403968811035156, -0.0558319091796875, -0.053259849548339844, -0.05068778991699219, -0.04811573028564453, -0.045543670654296875, -0.04297161102294922, -0.04039955139160156, -0.037827491760253906, -0.03525543212890625, -0.032683372497558594, -0.030111312866210938, -0.02753925323486328, -0.024967193603515625, -0.02239513397216797, -0.019823074340820312, -0.017251014709472656, -0.014678955078125, -0.012106895446777344, -0.009534835815429688, -0.006962776184082031, -0.004390716552734375, -0.0018186569213867188, 0.0007534027099609375, 0.0033254623413085938, 0.00589752197265625, 0.008469581604003906, 0.011041641235351562, 0.013613700866699219, 0.016185760498046875, 0.01875782012939453, 0.021329879760742188, 0.023901939392089844, 0.0264739990234375, 0.029046058654785156, 0.03161811828613281, 0.03419017791748047, 0.036762237548828125, 0.03933429718017578, 0.04190635681152344, 0.044478416442871094, 0.04705047607421875, 0.049622535705566406, 0.05219459533691406, 0.05476665496826172, 0.057338714599609375, 0.05991077423095703, 0.06248283386230469, 0.06505489349365234, 0.067626953125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 5.0, 3.0, 5.0, 14.0, 16.0, 25.0, 35.0, 65.0, 110.0, 170.0, 272.0, 419.0, 665.0, 1107.0, 1866.0, 3259.0, 5735.0, 10375.0, 19528.0, 39788.0, 84220.0, 163843.0, 238366.0, 217681.0, 131374.0, 64268.0, 30419.0, 15593.0, 8177.0, 4553.0, 2743.0, 1483.0, 888.0, 558.0, 326.0, 203.0, 146.0, 84.0, 47.0, 37.0, 23.0, 18.0, 16.0, 7.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00679779052734375, -0.006577193737030029, -0.006356596946716309, -0.006136000156402588, -0.005915403366088867, -0.0056948065757751465, -0.005474209785461426, -0.005253612995147705, -0.005033016204833984, -0.004812419414520264, -0.004591822624206543, -0.004371225833892822, -0.0041506290435791016, -0.003930032253265381, -0.00370943546295166, -0.0034888386726379395, -0.0032682418823242188, -0.003047645092010498, -0.0028270483016967773, -0.0026064515113830566, -0.002385854721069336, -0.0021652579307556152, -0.0019446611404418945, -0.0017240643501281738, -0.0015034675598144531, -0.0012828707695007324, -0.0010622739791870117, -0.000841677188873291, -0.0006210803985595703, -0.0004004836082458496, -0.0001798868179321289, 4.07099723815918e-05, 0.0002613067626953125, 0.0004819035530090332, 0.0007025003433227539, 0.0009230971336364746, 0.0011436939239501953, 0.001364290714263916, 0.0015848875045776367, 0.0018054842948913574, 0.002026081085205078, 0.002246677875518799, 0.0024672746658325195, 0.0026878714561462402, 0.002908468246459961, 0.0031290650367736816, 0.0033496618270874023, 0.003570258617401123, 0.0037908554077148438, 0.0040114521980285645, 0.004232048988342285, 0.004452645778656006, 0.0046732425689697266, 0.004893839359283447, 0.005114436149597168, 0.005335032939910889, 0.005555629730224609, 0.00577622652053833, 0.005996823310852051, 0.0062174201011657715, 0.006438016891479492, 0.006658613681793213, 0.006879210472106934, 0.007099807262420654, 0.007320404052734375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 2.0, 6.0, 9.0, 5.0, 9.0, 25.0, 19.0, 45.0, 30.0, 62.0, 72.0, 47.0, 107.0, 114.0, 58.0, 124.0, 46.0, 71.0, 50.0, 25.0, 30.0, 14.0, 2.0, 12.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.470348358154297e-06, -4.3138861656188965e-06, -4.157423973083496e-06, -4.000961780548096e-06, -3.844499588012695e-06, -3.688037395477295e-06, -3.5315752029418945e-06, -3.375113010406494e-06, -3.2186508178710938e-06, -3.0621886253356934e-06, -2.905726432800293e-06, -2.7492642402648926e-06, -2.592802047729492e-06, -2.436339855194092e-06, -2.2798776626586914e-06, -2.123415470123291e-06, -1.9669532775878906e-06, -1.8104910850524902e-06, -1.6540288925170898e-06, -1.4975666999816895e-06, -1.341104507446289e-06, -1.1846423149108887e-06, -1.0281801223754883e-06, -8.717179298400879e-07, -7.152557373046875e-07, -5.587935447692871e-07, -4.023313522338867e-07, -2.4586915969848633e-07, -8.940696716308594e-08, 6.705522537231445e-08, 2.2351741790771484e-07, 3.7997961044311523e-07, 5.364418029785156e-07, 6.92903995513916e-07, 8.493661880493164e-07, 1.0058283805847168e-06, 1.1622905731201172e-06, 1.3187527656555176e-06, 1.475214958190918e-06, 1.6316771507263184e-06, 1.7881393432617188e-06, 1.944601535797119e-06, 2.1010637283325195e-06, 2.25752592086792e-06, 2.4139881134033203e-06, 2.5704503059387207e-06, 2.726912498474121e-06, 2.8833746910095215e-06, 3.039836883544922e-06, 3.1962990760803223e-06, 3.3527612686157227e-06, 3.509223461151123e-06, 3.6656856536865234e-06, 3.822147846221924e-06, 3.978610038757324e-06, 4.135072231292725e-06, 4.291534423828125e-06, 4.447996616363525e-06, 4.604458808898926e-06, 4.760921001434326e-06, 4.9173831939697266e-06, 5.073845386505127e-06, 5.230307579040527e-06, 5.386769771575928e-06, 5.543231964111328e-06]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 1.0, 3.0, 7.0, 11.0, 16.0, 19.0, 24.0, 50.0, 99.0, 172.0, 338.0, 692.0, 1363.0, 2828.0, 5868.0, 12710.0, 29661.0, 76336.0, 184615.0, 297693.0, 242837.0, 114561.0, 44813.0, 18184.0, 8038.0, 3754.0, 1913.0, 899.0, 482.0, 261.0, 111.0, 78.0, 41.0, 29.0, 16.0, 12.0, 11.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00930023193359375, -0.009024381637573242, -0.008748531341552734, -0.008472681045532227, -0.008196830749511719, -0.007920980453491211, -0.007645130157470703, -0.007369279861450195, -0.0070934295654296875, -0.00681757926940918, -0.006541728973388672, -0.006265878677368164, -0.005990028381347656, -0.0057141780853271484, -0.005438327789306641, -0.005162477493286133, -0.004886627197265625, -0.004610776901245117, -0.004334926605224609, -0.0040590763092041016, -0.0037832260131835938, -0.003507375717163086, -0.003231525421142578, -0.0029556751251220703, -0.0026798248291015625, -0.0024039745330810547, -0.002128124237060547, -0.001852273941040039, -0.0015764236450195312, -0.0013005733489990234, -0.0010247230529785156, -0.0007488727569580078, -0.0004730224609375, -0.0001971721649169922, 7.867813110351562e-05, 0.00035452842712402344, 0.0006303787231445312, 0.0009062290191650391, 0.0011820793151855469, 0.0014579296112060547, 0.0017337799072265625, 0.0020096302032470703, 0.002285480499267578, 0.002561330795288086, 0.0028371810913085938, 0.0031130313873291016, 0.0033888816833496094, 0.003664731979370117, 0.003940582275390625, 0.004216432571411133, 0.004492282867431641, 0.0047681331634521484, 0.005043983459472656, 0.005319833755493164, 0.005595684051513672, 0.00587153434753418, 0.0061473846435546875, 0.006423234939575195, 0.006699085235595703, 0.006974935531616211, 0.007250785827636719, 0.0075266361236572266, 0.007802486419677734, 0.008078336715698242, 0.00835418701171875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 1.0, 5.0, 4.0, 2.0, 10.0, 10.0, 10.0, 12.0, 12.0, 18.0, 21.0, 23.0, 33.0, 35.0, 47.0, 57.0, 59.0, 63.0, 39.0, 57.0, 61.0, 59.0, 52.0, 54.0, 38.0, 31.0, 46.0, 28.0, 19.0, 16.0, 15.0, 9.0, 7.0, 10.0, 6.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.00948333740234375, -0.00916910171508789, -0.008854866027832031, -0.008540630340576172, -0.008226394653320312, -0.007912158966064453, -0.007597923278808594, -0.007283687591552734, -0.006969451904296875, -0.006655216217041016, -0.006340980529785156, -0.006026744842529297, -0.0057125091552734375, -0.005398273468017578, -0.005084037780761719, -0.004769802093505859, -0.00445556640625, -0.004141330718994141, -0.0038270950317382812, -0.003512859344482422, -0.0031986236572265625, -0.002884387969970703, -0.0025701522827148438, -0.0022559165954589844, -0.001941680908203125, -0.0016274452209472656, -0.0013132095336914062, -0.0009989738464355469, -0.0006847381591796875, -0.0003705024719238281, -5.626678466796875e-05, 0.0002579689025878906, 0.00057220458984375, 0.0008864402770996094, 0.0012006759643554688, 0.0015149116516113281, 0.0018291473388671875, 0.002143383026123047, 0.0024576187133789062, 0.0027718544006347656, 0.003086090087890625, 0.0034003257751464844, 0.0037145614624023438, 0.004028797149658203, 0.0043430328369140625, 0.004657268524169922, 0.004971504211425781, 0.005285739898681641, 0.0055999755859375, 0.005914211273193359, 0.006228446960449219, 0.006542682647705078, 0.0068569183349609375, 0.007171154022216797, 0.007485389709472656, 0.007799625396728516, 0.008113861083984375, 0.008428096771240234, 0.008742332458496094, 0.009056568145751953, 0.009370803833007812, 0.009685039520263672, 0.009999275207519531, 0.01031351089477539, 0.01062774658203125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 12.0, 27.0, 62.0, 197.0, 262.0, 235.0, 117.0, 41.0, 24.0, 8.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4855685532093048, -0.4726996123790741, -0.45983070135116577, -0.44696176052093506, -0.43409284949302673, -0.421223908662796, -0.4083549976348877, -0.395486056804657, -0.38261711597442627, -0.36974817514419556, -0.35687926411628723, -0.3440103232860565, -0.3311414122581482, -0.3182724714279175, -0.30540353059768677, -0.29253461956977844, -0.2796657085418701, -0.2667967677116394, -0.2539278566837311, -0.24105891585350037, -0.22819000482559204, -0.21532106399536133, -0.2024521380662918, -0.1895832121372223, -0.17671428620815277, -0.16384536027908325, -0.15097643435001373, -0.1381075084209442, -0.1252385675907135, -0.11236964911222458, -0.09950071573257446, -0.08663178980350494, -0.07376283407211304, -0.06089390814304352, -0.0480249784886837, -0.03515604883432388, -0.022287122905254364, -0.009418196976184845, 0.003450736403465271, 0.01631966233253479, 0.02918858826160431, 0.04205751419067383, 0.054926443845033646, 0.06779537349939346, 0.08066429942846298, 0.0935332253575325, 0.10640215873718262, 0.11927108466625214, 0.13214001059532166, 0.14500893652439117, 0.1578778624534607, 0.1707468032836914, 0.18361571431159973, 0.19648465514183044, 0.20935358107089996, 0.22222250699996948, 0.235091432929039, 0.24796035885810852, 0.26082929968833923, 0.27369821071624756, 0.28656715154647827, 0.2994360625743866, 0.3123050034046173, 0.32517391443252563, 0.33804285526275635]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 9.0, 14.0, 5.0, 12.0, 11.0, 28.0, 23.0, 28.0, 25.0, 37.0, 41.0, 38.0, 40.0, 53.0, 49.0, 37.0, 56.0, 54.0, 50.0, 41.0, 42.0, 45.0, 39.0, 32.0, 24.0, 28.0, 15.0, 26.0, 16.0, 15.0, 9.0, 14.0, 10.0, 10.0, 5.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.19511419534683228, -0.1886952668428421, -0.18227632343769073, -0.17585739493370056, -0.1694384664297104, -0.16301953792572021, -0.15660059452056885, -0.15018166601657867, -0.1437627375125885, -0.13734380900859833, -0.13092486560344696, -0.12450593709945679, -0.11808700859546661, -0.11166807264089584, -0.10524913668632507, -0.0988302081823349, -0.09241126477718353, -0.08599232882261276, -0.07957340031862259, -0.07315446436405182, -0.06673553586006165, -0.060316599905490875, -0.053897663950920105, -0.04747873172163963, -0.04105979949235916, -0.03464086726307869, -0.02822193317115307, -0.021802999079227448, -0.015384066849946976, -0.008965134620666504, -0.0025461986660957336, 0.003872733563184738, 0.01029166579246521, 0.016710598021745682, 0.023129532113671303, 0.029548466205596924, 0.035967398434877396, 0.04238633066415787, 0.04880526661872864, 0.05522419884800911, 0.06164313107728958, 0.06806206703186035, 0.07448099553585052, 0.0808999314904213, 0.08731886744499207, 0.09373779594898224, 0.10015673190355301, 0.10657566785812378, 0.11299459636211395, 0.11941353231668472, 0.1258324682712555, 0.13225139677524567, 0.13867032527923584, 0.1450892686843872, 0.15150819718837738, 0.15792712569236755, 0.16434606909751892, 0.1707649976015091, 0.17718394100666046, 0.18360286951065063, 0.1900217980146408, 0.19644072651863098, 0.20285966992378235, 0.20927859842777252, 0.2156975269317627]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 14.0, 12.0, 21.0, 40.0, 57.0, 83.0, 150.0, 322.0, 619.0, 1620.0, 4598.0, 15244.0, 62018.0, 354202.0, 1275486.0, 1613468.0, 682943.0, 139496.0, 29150.0, 9042.0, 3365.0, 1384.0, 443.0, 193.0, 101.0, 78.0, 43.0, 32.0, 21.0, 7.0, 9.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0347900390625, -0.03355741500854492, -0.032324790954589844, -0.031092166900634766, -0.029859542846679688, -0.02862691879272461, -0.02739429473876953, -0.026161670684814453, -0.024929046630859375, -0.023696422576904297, -0.02246379852294922, -0.02123117446899414, -0.019998550415039062, -0.018765926361083984, -0.017533302307128906, -0.016300678253173828, -0.01506805419921875, -0.013835430145263672, -0.012602806091308594, -0.011370182037353516, -0.010137557983398438, -0.00890493392944336, -0.007672309875488281, -0.006439685821533203, -0.005207061767578125, -0.003974437713623047, -0.0027418136596679688, -0.0015091896057128906, -0.0002765655517578125, 0.0009560585021972656, 0.0021886825561523438, 0.003421306610107422, 0.0046539306640625, 0.005886554718017578, 0.007119178771972656, 0.008351802825927734, 0.009584426879882812, 0.01081705093383789, 0.012049674987792969, 0.013282299041748047, 0.014514923095703125, 0.015747547149658203, 0.01698017120361328, 0.01821279525756836, 0.019445419311523438, 0.020678043365478516, 0.021910667419433594, 0.023143291473388672, 0.02437591552734375, 0.025608539581298828, 0.026841163635253906, 0.028073787689208984, 0.029306411743164062, 0.03053903579711914, 0.03177165985107422, 0.0330042839050293, 0.034236907958984375, 0.03546953201293945, 0.03670215606689453, 0.03793478012084961, 0.03916740417480469, 0.040400028228759766, 0.041632652282714844, 0.04286527633666992, 0.044097900390625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 10.0, 9.0, 15.0, 29.0, 31.0, 46.0, 48.0, 51.0, 62.0, 73.0, 78.0, 66.0, 75.0, 84.0, 56.0, 56.0, 49.0, 50.0, 38.0, 24.0, 22.0, 8.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.055938720703125, -0.05440378189086914, -0.05286884307861328, -0.05133390426635742, -0.04979896545410156, -0.0482640266418457, -0.046729087829589844, -0.045194149017333984, -0.043659210205078125, -0.042124271392822266, -0.040589332580566406, -0.03905439376831055, -0.03751945495605469, -0.03598451614379883, -0.03444957733154297, -0.03291463851928711, -0.03137969970703125, -0.02984476089477539, -0.02830982208251953, -0.026774883270263672, -0.025239944458007812, -0.023705005645751953, -0.022170066833496094, -0.020635128021240234, -0.019100189208984375, -0.017565250396728516, -0.016030311584472656, -0.014495372772216797, -0.012960433959960938, -0.011425495147705078, -0.009890556335449219, -0.00835561752319336, -0.0068206787109375, -0.005285739898681641, -0.0037508010864257812, -0.002215862274169922, -0.0006809234619140625, 0.0008540153503417969, 0.0023889541625976562, 0.003923892974853516, 0.005458831787109375, 0.006993770599365234, 0.008528709411621094, 0.010063648223876953, 0.011598587036132812, 0.013133525848388672, 0.014668464660644531, 0.01620340347290039, 0.01773834228515625, 0.01927328109741211, 0.02080821990966797, 0.022343158721923828, 0.023878097534179688, 0.025413036346435547, 0.026947975158691406, 0.028482913970947266, 0.030017852783203125, 0.031552791595458984, 0.033087730407714844, 0.0346226692199707, 0.03615760803222656, 0.03769254684448242, 0.03922748565673828, 0.04076242446899414, 0.04229736328125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 8.0, 8.0, 9.0, 13.0, 11.0, 18.0, 17.0, 47.0, 49.0, 57.0, 86.0, 146.0, 299.0, 688.0, 1983.0, 6801.0, 32755.0, 299833.0, 3156285.0, 629968.0, 50969.0, 9700.0, 2630.0, 943.0, 402.0, 183.0, 119.0, 73.0, 48.0, 42.0, 26.0, 21.0, 13.0, 8.0, 8.0, 8.0, 4.0, 5.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.07574462890625, -0.0737314224243164, -0.07171821594238281, -0.06970500946044922, -0.06769180297851562, -0.06567859649658203, -0.06366539001464844, -0.061652183532714844, -0.05963897705078125, -0.057625770568847656, -0.05561256408691406, -0.05359935760498047, -0.051586151123046875, -0.04957294464111328, -0.04755973815917969, -0.045546531677246094, -0.0435333251953125, -0.041520118713378906, -0.03950691223144531, -0.03749370574951172, -0.035480499267578125, -0.03346729278564453, -0.03145408630371094, -0.029440879821777344, -0.02742767333984375, -0.025414466857910156, -0.023401260375976562, -0.02138805389404297, -0.019374847412109375, -0.01736164093017578, -0.015348434448242188, -0.013335227966308594, -0.011322021484375, -0.009308815002441406, -0.0072956085205078125, -0.005282402038574219, -0.003269195556640625, -0.0012559890747070312, 0.0007572174072265625, 0.0027704238891601562, 0.00478363037109375, 0.006796836853027344, 0.008810043334960938, 0.010823249816894531, 0.012836456298828125, 0.014849662780761719, 0.016862869262695312, 0.018876075744628906, 0.0208892822265625, 0.022902488708496094, 0.024915695190429688, 0.02692890167236328, 0.028942108154296875, 0.03095531463623047, 0.03296852111816406, 0.034981727600097656, 0.03699493408203125, 0.039008140563964844, 0.04102134704589844, 0.04303455352783203, 0.045047760009765625, 0.04706096649169922, 0.04907417297363281, 0.051087379455566406, 0.0531005859375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 7.0, 7.0, 10.0, 17.0, 32.0, 56.0, 65.0, 156.0, 229.0, 364.0, 530.0, 640.0, 634.0, 469.0, 322.0, 182.0, 113.0, 72.0, 53.0, 27.0, 23.0, 21.0, 17.0, 8.0, 9.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06719970703125, -0.06532764434814453, -0.06345558166503906, -0.061583518981933594, -0.059711456298828125, -0.057839393615722656, -0.05596733093261719, -0.05409526824951172, -0.05222320556640625, -0.05035114288330078, -0.04847908020019531, -0.046607017517089844, -0.044734954833984375, -0.042862892150878906, -0.04099082946777344, -0.03911876678466797, -0.0372467041015625, -0.03537464141845703, -0.03350257873535156, -0.031630516052246094, -0.029758453369140625, -0.027886390686035156, -0.026014328002929688, -0.02414226531982422, -0.02227020263671875, -0.02039813995361328, -0.018526077270507812, -0.016654014587402344, -0.014781951904296875, -0.012909889221191406, -0.011037826538085938, -0.009165763854980469, -0.007293701171875, -0.005421638488769531, -0.0035495758056640625, -0.0016775131225585938, 0.000194549560546875, 0.0020666122436523438, 0.0039386749267578125, 0.005810737609863281, 0.00768280029296875, 0.009554862976074219, 0.011426925659179688, 0.013298988342285156, 0.015171051025390625, 0.017043113708496094, 0.018915176391601562, 0.02078723907470703, 0.0226593017578125, 0.02453136444091797, 0.026403427124023438, 0.028275489807128906, 0.030147552490234375, 0.032019615173339844, 0.03389167785644531, 0.03576374053955078, 0.03763580322265625, 0.03950786590576172, 0.04137992858886719, 0.043251991271972656, 0.045124053955078125, 0.046996116638183594, 0.04886817932128906, 0.05074024200439453, 0.0526123046875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 11.0, 36.0, 169.0, 400.0, 304.0, 64.0, 15.0, 5.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2977575957775116, -0.2670035660266876, -0.23624950647354126, -0.20549547672271729, -0.17474143207073212, -0.14398738741874695, -0.11323335766792297, -0.0824793130159378, -0.05172526836395264, -0.020971227437257767, 0.009782813489437103, 0.040536850690841675, 0.07129089534282684, 0.10204493999481201, 0.132798969745636, 0.16355301439762115, 0.19430705904960632, 0.2250611037015915, 0.25581514835357666, 0.28656917810440063, 0.3173232078552246, 0.34807726740837097, 0.37883129715919495, 0.4095853567123413, 0.4403393864631653, 0.47109341621398926, 0.5018474459648132, 0.5326014757156372, 0.563355565071106, 0.5941095948219299, 0.6248636245727539, 0.6556176543235779, 0.6863716840744019, 0.7171257138252258, 0.7478797435760498, 0.7786338329315186, 0.8093878626823425, 0.8401418924331665, 0.8708959221839905, 0.9016499519348145, 0.9324040412902832, 0.9631580710411072, 0.9939121007919312, 1.0246661901474, 1.055420160293579, 1.0861742496490479, 1.1169283390045166, 1.1476823091506958, 1.178436279296875, 1.2091903686523438, 1.239944338798523, 1.2706984281539917, 1.301452398300171, 1.3322064876556396, 1.3629605770111084, 1.3937145471572876, 1.4244686365127563, 1.455222725868225, 1.4859766960144043, 1.516730785369873, 1.5474847555160522, 1.578238844871521, 1.6089928150177002, 1.639746904373169, 1.6705009937286377]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 10.0, 4.0, 9.0, 14.0, 15.0, 13.0, 24.0, 26.0, 33.0, 25.0, 22.0, 52.0, 38.0, 34.0, 50.0, 54.0, 56.0, 47.0, 49.0, 40.0, 40.0, 39.0, 38.0, 25.0, 32.0, 38.0, 23.0, 21.0, 27.0, 25.0, 14.0, 10.0, 11.0, 9.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.16542911529541016, -0.1604420393705368, -0.15545494854450226, -0.1504678726196289, -0.14548078179359436, -0.140493705868721, -0.13550661504268646, -0.1305195391178131, -0.12553244829177856, -0.12054536491632462, -0.11555828154087067, -0.11057119816541672, -0.10558411478996277, -0.10059703886508942, -0.09560995548963547, -0.09062287211418152, -0.08563579618930817, -0.08064871281385422, -0.07566162943840027, -0.07067454606294632, -0.06568746268749237, -0.06070038303732872, -0.05571330338716507, -0.05072622001171112, -0.04573913663625717, -0.04075205326080322, -0.035764969885349274, -0.030777890235185623, -0.025790806859731674, -0.020803723484277725, -0.015816641971468925, -0.010829560458660126, -0.005842477083206177, -0.0008553946390748024, 0.004131687805056572, 0.009118770249187946, 0.01410585269331932, 0.01909293606877327, 0.02408001758158207, 0.02906709909439087, 0.03405418246984482, 0.03904126584529877, 0.044028349220752716, 0.04901542887091637, 0.054002512246370316, 0.058989595621824265, 0.06397667527198792, 0.06896375864744186, 0.07395084202289581, 0.07893792539834976, 0.08392500877380371, 0.08891209214925766, 0.09389917552471161, 0.09888625144958496, 0.10387333482503891, 0.10886041820049286, 0.11384750157594681, 0.11883458495140076, 0.1238216683268547, 0.12880875170230865, 0.133795827627182, 0.13878291845321655, 0.1437699943780899, 0.14875707030296326, 0.1537441611289978]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 2.0, 4.0, 10.0, 12.0, 20.0, 25.0, 38.0, 43.0, 92.0, 128.0, 154.0, 300.0, 522.0, 877.0, 1726.0, 3427.0, 7399.0, 15689.0, 34885.0, 76503.0, 153203.0, 237386.0, 233753.0, 147569.0, 72678.0, 33051.0, 14977.0, 7057.0, 3287.0, 1657.0, 832.0, 452.0, 264.0, 179.0, 125.0, 77.0, 47.0, 30.0, 26.0, 17.0, 10.0, 4.0, 7.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0288543701171875, -0.027979135513305664, -0.027103900909423828, -0.026228666305541992, -0.025353431701660156, -0.02447819709777832, -0.023602962493896484, -0.02272772789001465, -0.021852493286132812, -0.020977258682250977, -0.02010202407836914, -0.019226789474487305, -0.01835155487060547, -0.017476320266723633, -0.016601085662841797, -0.01572585105895996, -0.014850616455078125, -0.013975381851196289, -0.013100147247314453, -0.012224912643432617, -0.011349678039550781, -0.010474443435668945, -0.00959920883178711, -0.008723974227905273, -0.007848739624023438, -0.0069735050201416016, -0.006098270416259766, -0.00522303581237793, -0.004347801208496094, -0.003472566604614258, -0.002597332000732422, -0.001722097396850586, -0.00084686279296875, 2.8371810913085938e-05, 0.0009036064147949219, 0.0017788410186767578, 0.0026540756225585938, 0.0035293102264404297, 0.004404544830322266, 0.0052797794342041016, 0.0061550140380859375, 0.0070302486419677734, 0.00790548324584961, 0.008780717849731445, 0.009655952453613281, 0.010531187057495117, 0.011406421661376953, 0.012281656265258789, 0.013156890869140625, 0.014032125473022461, 0.014907360076904297, 0.015782594680786133, 0.01665782928466797, 0.017533063888549805, 0.01840829849243164, 0.019283533096313477, 0.020158767700195312, 0.02103400230407715, 0.021909236907958984, 0.02278447151184082, 0.023659706115722656, 0.024534940719604492, 0.025410175323486328, 0.026285409927368164, 0.02716064453125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 9.0, 3.0, 15.0, 17.0, 13.0, 29.0, 28.0, 42.0, 36.0, 49.0, 48.0, 64.0, 77.0, 63.0, 68.0, 71.0, 59.0, 55.0, 63.0, 49.0, 39.0, 23.0, 26.0, 18.0, 13.0, 13.0, 12.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05670166015625, -0.05512380599975586, -0.05354595184326172, -0.05196809768676758, -0.05039024353027344, -0.0488123893737793, -0.047234535217285156, -0.045656681060791016, -0.044078826904296875, -0.042500972747802734, -0.040923118591308594, -0.03934526443481445, -0.03776741027832031, -0.03618955612182617, -0.03461170196533203, -0.03303384780883789, -0.03145599365234375, -0.02987813949584961, -0.02830028533935547, -0.026722431182861328, -0.025144577026367188, -0.023566722869873047, -0.021988868713378906, -0.020411014556884766, -0.018833160400390625, -0.017255306243896484, -0.015677452087402344, -0.014099597930908203, -0.012521743774414062, -0.010943889617919922, -0.009366035461425781, -0.007788181304931641, -0.0062103271484375, -0.004632472991943359, -0.0030546188354492188, -0.0014767646789550781, 0.0001010894775390625, 0.0016789436340332031, 0.0032567977905273438, 0.004834651947021484, 0.006412506103515625, 0.007990360260009766, 0.009568214416503906, 0.011146068572998047, 0.012723922729492188, 0.014301776885986328, 0.01587963104248047, 0.01745748519897461, 0.01903533935546875, 0.02061319351196289, 0.02219104766845703, 0.023768901824951172, 0.025346755981445312, 0.026924610137939453, 0.028502464294433594, 0.030080318450927734, 0.031658172607421875, 0.033236026763916016, 0.034813880920410156, 0.0363917350769043, 0.03796958923339844, 0.03954744338989258, 0.04112529754638672, 0.04270315170288086, 0.044281005859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 4.0, 6.0, 10.0, 11.0, 7.0, 24.0, 47.0, 48.0, 90.0, 140.0, 209.0, 368.0, 642.0, 1132.0, 1989.0, 3730.0, 7090.0, 14121.0, 29226.0, 59869.0, 120963.0, 209866.0, 265709.0, 163258.0, 86125.0, 41836.0, 20552.0, 10099.0, 5115.0, 2703.0, 1508.0, 820.0, 449.0, 263.0, 173.0, 137.0, 62.0, 45.0, 34.0, 24.0, 10.0, 11.0, 5.0, 10.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0241851806640625, -0.02335834503173828, -0.022531509399414062, -0.021704673767089844, -0.020877838134765625, -0.020051002502441406, -0.019224166870117188, -0.01839733123779297, -0.01757049560546875, -0.01674365997314453, -0.015916824340820312, -0.015089988708496094, -0.014263153076171875, -0.013436317443847656, -0.012609481811523438, -0.011782646179199219, -0.010955810546875, -0.010128974914550781, -0.009302139282226562, -0.008475303649902344, -0.007648468017578125, -0.006821632385253906, -0.0059947967529296875, -0.005167961120605469, -0.00434112548828125, -0.0035142898559570312, -0.0026874542236328125, -0.0018606185913085938, -0.001033782958984375, -0.00020694732666015625, 0.0006198883056640625, 0.0014467239379882812, 0.0022735595703125, 0.0031003952026367188, 0.0039272308349609375, 0.004754066467285156, 0.005580902099609375, 0.006407737731933594, 0.0072345733642578125, 0.008061408996582031, 0.00888824462890625, 0.009715080261230469, 0.010541915893554688, 0.011368751525878906, 0.012195587158203125, 0.013022422790527344, 0.013849258422851562, 0.014676094055175781, 0.0155029296875, 0.01632976531982422, 0.017156600952148438, 0.017983436584472656, 0.018810272216796875, 0.019637107849121094, 0.020463943481445312, 0.02129077911376953, 0.02211761474609375, 0.02294445037841797, 0.023771286010742188, 0.024598121643066406, 0.025424957275390625, 0.026251792907714844, 0.027078628540039062, 0.02790546417236328, 0.0287322998046875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 5.0, 6.0, 8.0, 7.0, 7.0, 11.0, 11.0, 15.0, 23.0, 20.0, 20.0, 30.0, 22.0, 27.0, 37.0, 34.0, 28.0, 52.0, 48.0, 47.0, 32.0, 36.0, 43.0, 35.0, 47.0, 34.0, 43.0, 42.0, 33.0, 25.0, 28.0, 20.0, 13.0, 24.0, 12.0, 10.0, 12.0, 9.0, 9.0, 8.0, 7.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.068603515625, -0.066314697265625, -0.06402587890625, -0.061737060546875, -0.0594482421875, -0.057159423828125, -0.05487060546875, -0.052581787109375, -0.05029296875, -0.048004150390625, -0.04571533203125, -0.043426513671875, -0.0411376953125, -0.038848876953125, -0.03656005859375, -0.034271240234375, -0.031982421875, -0.029693603515625, -0.02740478515625, -0.025115966796875, -0.0228271484375, -0.020538330078125, -0.01824951171875, -0.015960693359375, -0.013671875, -0.011383056640625, -0.00909423828125, -0.006805419921875, -0.0045166015625, -0.002227783203125, 6.103515625e-05, 0.002349853515625, 0.004638671875, 0.006927490234375, 0.00921630859375, 0.011505126953125, 0.0137939453125, 0.016082763671875, 0.01837158203125, 0.020660400390625, 0.02294921875, 0.025238037109375, 0.02752685546875, 0.029815673828125, 0.0321044921875, 0.034393310546875, 0.03668212890625, 0.038970947265625, 0.041259765625, 0.043548583984375, 0.04583740234375, 0.048126220703125, 0.0504150390625, 0.052703857421875, 0.05499267578125, 0.057281494140625, 0.0595703125, 0.061859130859375, 0.06414794921875, 0.066436767578125, 0.0687255859375, 0.071014404296875, 0.07330322265625, 0.075592041015625, 0.077880859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 4.0, 2.0, 2.0, 5.0, 5.0, 7.0, 7.0, 14.0, 13.0, 19.0, 33.0, 40.0, 64.0, 122.0, 185.0, 304.0, 451.0, 838.0, 1383.0, 2366.0, 4259.0, 7791.0, 13989.0, 25539.0, 46449.0, 82307.0, 135826.0, 202490.0, 202343.0, 135214.0, 82302.0, 46751.0, 25894.0, 13863.0, 7600.0, 4209.0, 2393.0, 1376.0, 837.0, 466.0, 268.0, 194.0, 119.0, 61.0, 40.0, 38.0, 21.0, 19.0, 14.0, 9.0, 4.0, 7.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0041961669921875, -0.004060804843902588, -0.003925442695617676, -0.0037900805473327637, -0.0036547183990478516, -0.0035193562507629395, -0.0033839941024780273, -0.0032486319541931152, -0.003113269805908203, -0.002977907657623291, -0.002842545509338379, -0.002707183361053467, -0.0025718212127685547, -0.0024364590644836426, -0.0023010969161987305, -0.0021657347679138184, -0.0020303726196289062, -0.0018950104713439941, -0.001759648323059082, -0.00162428617477417, -0.0014889240264892578, -0.0013535618782043457, -0.0012181997299194336, -0.0010828375816345215, -0.0009474754333496094, -0.0008121132850646973, -0.0006767511367797852, -0.000541388988494873, -0.00040602684020996094, -0.00027066469192504883, -0.00013530254364013672, 5.960464477539063e-08, 0.0001354217529296875, 0.0002707839012145996, 0.0004061460494995117, 0.0005415081977844238, 0.0006768703460693359, 0.000812232494354248, 0.0009475946426391602, 0.0010829567909240723, 0.0012183189392089844, 0.0013536810874938965, 0.0014890432357788086, 0.0016244053840637207, 0.0017597675323486328, 0.001895129680633545, 0.002030491828918457, 0.002165853977203369, 0.0023012161254882812, 0.0024365782737731934, 0.0025719404220581055, 0.0027073025703430176, 0.0028426647186279297, 0.002978026866912842, 0.003113389015197754, 0.003248751163482666, 0.003384113311767578, 0.0035194754600524902, 0.0036548376083374023, 0.0037901997566223145, 0.0039255619049072266, 0.004060924053192139, 0.004196286201477051, 0.004331648349761963, 0.004467010498046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 3.0, 6.0, 7.0, 13.0, 19.0, 19.0, 7.0, 27.0, 35.0, 41.0, 17.0, 49.0, 59.0, 70.0, 38.0, 66.0, 72.0, 74.0, 24.0, 62.0, 50.0, 59.0, 14.0, 38.0, 30.0, 26.0, 9.0, 18.0, 17.0, 9.0, 2.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.039836883544922e-06, -2.9355287551879883e-06, -2.8312206268310547e-06, -2.726912498474121e-06, -2.6226043701171875e-06, -2.518296241760254e-06, -2.4139881134033203e-06, -2.3096799850463867e-06, -2.205371856689453e-06, -2.1010637283325195e-06, -1.996755599975586e-06, -1.8924474716186523e-06, -1.7881393432617188e-06, -1.6838312149047852e-06, -1.5795230865478516e-06, -1.475214958190918e-06, -1.3709068298339844e-06, -1.2665987014770508e-06, -1.1622905731201172e-06, -1.0579824447631836e-06, -9.5367431640625e-07, -8.493661880493164e-07, -7.450580596923828e-07, -6.407499313354492e-07, -5.364418029785156e-07, -4.3213367462158203e-07, -3.2782554626464844e-07, -2.2351741790771484e-07, -1.1920928955078125e-07, -1.4901161193847656e-08, 8.940696716308594e-08, 1.9371509552001953e-07, 2.980232238769531e-07, 4.023313522338867e-07, 5.066394805908203e-07, 6.109476089477539e-07, 7.152557373046875e-07, 8.195638656616211e-07, 9.238719940185547e-07, 1.0281801223754883e-06, 1.1324882507324219e-06, 1.2367963790893555e-06, 1.341104507446289e-06, 1.4454126358032227e-06, 1.5497207641601562e-06, 1.6540288925170898e-06, 1.7583370208740234e-06, 1.862645149230957e-06, 1.9669532775878906e-06, 2.0712614059448242e-06, 2.175569534301758e-06, 2.2798776626586914e-06, 2.384185791015625e-06, 2.4884939193725586e-06, 2.592802047729492e-06, 2.6971101760864258e-06, 2.8014183044433594e-06, 2.905726432800293e-06, 3.0100345611572266e-06, 3.11434268951416e-06, 3.2186508178710938e-06, 3.3229589462280273e-06, 3.427267074584961e-06, 3.5315752029418945e-06, 3.635883331298828e-06]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 8.0, 13.0, 17.0, 40.0, 37.0, 50.0, 79.0, 117.0, 217.0, 387.0, 632.0, 1159.0, 1912.0, 3691.0, 6783.0, 13384.0, 26164.0, 51361.0, 97756.0, 167129.0, 247112.0, 187511.0, 115575.0, 61866.0, 31438.0, 16123.0, 8159.0, 4271.0, 2351.0, 1266.0, 722.0, 474.0, 278.0, 164.0, 115.0, 67.0, 38.0, 31.0, 23.0, 11.0, 10.0, 8.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0054931640625, -0.00533902645111084, -0.00518488883972168, -0.0050307512283325195, -0.004876613616943359, -0.004722476005554199, -0.004568338394165039, -0.004414200782775879, -0.004260063171386719, -0.004105925559997559, -0.0039517879486083984, -0.0037976503372192383, -0.003643512725830078, -0.003489375114440918, -0.003335237503051758, -0.0031810998916625977, -0.0030269622802734375, -0.0028728246688842773, -0.002718687057495117, -0.002564549446105957, -0.002410411834716797, -0.0022562742233276367, -0.0021021366119384766, -0.0019479990005493164, -0.0017938613891601562, -0.001639723777770996, -0.001485586166381836, -0.0013314485549926758, -0.0011773109436035156, -0.0010231733322143555, -0.0008690357208251953, -0.0007148981094360352, -0.000560760498046875, -0.00040662288665771484, -0.0002524852752685547, -9.834766387939453e-05, 5.5789947509765625e-05, 0.00020992755889892578, 0.00036406517028808594, 0.0005182027816772461, 0.0006723403930664062, 0.0008264780044555664, 0.0009806156158447266, 0.0011347532272338867, 0.0012888908386230469, 0.001443028450012207, 0.0015971660614013672, 0.0017513036727905273, 0.0019054412841796875, 0.0020595788955688477, 0.002213716506958008, 0.002367854118347168, 0.002521991729736328, 0.0026761293411254883, 0.0028302669525146484, 0.0029844045639038086, 0.0031385421752929688, 0.003292679786682129, 0.003446817398071289, 0.0036009550094604492, 0.0037550926208496094, 0.0039092302322387695, 0.00406336784362793, 0.00421750545501709, 0.00437164306640625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 8.0, 1.0, 5.0, 9.0, 16.0, 13.0, 14.0, 21.0, 16.0, 28.0, 30.0, 31.0, 33.0, 35.0, 45.0, 36.0, 45.0, 49.0, 46.0, 49.0, 51.0, 55.0, 49.0, 43.0, 35.0, 32.0, 31.0, 32.0, 29.0, 23.0, 19.0, 15.0, 17.0, 12.0, 9.0, 5.0, 8.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.007457733154296875, -0.007250726222991943, -0.007043719291687012, -0.00683671236038208, -0.0066297054290771484, -0.006422698497772217, -0.006215691566467285, -0.0060086846351623535, -0.005801677703857422, -0.00559467077255249, -0.005387663841247559, -0.005180656909942627, -0.004973649978637695, -0.004766643047332764, -0.004559636116027832, -0.0043526291847229, -0.004145622253417969, -0.003938615322113037, -0.0037316083908081055, -0.003524601459503174, -0.003317594528198242, -0.0031105875968933105, -0.002903580665588379, -0.0026965737342834473, -0.0024895668029785156, -0.002282559871673584, -0.0020755529403686523, -0.0018685460090637207, -0.001661539077758789, -0.0014545321464538574, -0.0012475252151489258, -0.0010405182838439941, -0.0008335113525390625, -0.0006265044212341309, -0.0004194974899291992, -0.00021249055862426758, -5.4836273193359375e-06, 0.0002015233039855957, 0.00040853023529052734, 0.000615537166595459, 0.0008225440979003906, 0.0010295510292053223, 0.001236557960510254, 0.0014435648918151855, 0.0016505718231201172, 0.0018575787544250488, 0.0020645856857299805, 0.002271592617034912, 0.0024785995483398438, 0.0026856064796447754, 0.002892613410949707, 0.0030996203422546387, 0.0033066272735595703, 0.003513634204864502, 0.0037206411361694336, 0.003927648067474365, 0.004134654998779297, 0.0043416619300842285, 0.00454866886138916, 0.004755675792694092, 0.0049626827239990234, 0.005169689655303955, 0.005376696586608887, 0.005583703517913818, 0.00579071044921875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 4.0, 7.0, 5.0, 18.0, 62.0, 115.0, 158.0, 274.0, 160.0, 103.0, 58.0, 15.0, 9.0, 6.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.46561822295188904, -0.4558370113372803, -0.4460558295249939, -0.43627461791038513, -0.42649340629577637, -0.41671222448349, -0.4069310128688812, -0.39714980125427246, -0.3873686194419861, -0.3775874078273773, -0.36780622601509094, -0.3580250144004822, -0.3482438027858734, -0.33846259117126465, -0.32868140935897827, -0.3189001977443695, -0.30911898612976074, -0.299337774515152, -0.2895565927028656, -0.27977538108825684, -0.26999416947364807, -0.2602129578590393, -0.25043177604675293, -0.24065056443214417, -0.2308693677186966, -0.22108817100524902, -0.21130695939064026, -0.2015257626771927, -0.19174456596374512, -0.18196335434913635, -0.17218215763568878, -0.1624009609222412, -0.15261973440647125, -0.14283853769302368, -0.13305732607841492, -0.12327612936496735, -0.11349492520093918, -0.10371372103691101, -0.09393252432346344, -0.08415132015943527, -0.0743701159954071, -0.06458891183137894, -0.05480771139264107, -0.0450265109539032, -0.03524530678987503, -0.025464102625846863, -0.015682902187108994, -0.005901701748371124, 0.0038795024156570435, 0.013660704717040062, 0.02344190701842308, 0.03322310745716095, 0.04300431162118912, 0.052785515785217285, 0.06256671249866486, 0.07234791666269302, 0.08212912082672119, 0.09191032499074936, 0.10169152915477753, 0.1114727258682251, 0.12125393003225327, 0.13103513419628143, 0.140816330909729, 0.15059754252433777, 0.16037873923778534]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 3.0, 5.0, 15.0, 10.0, 9.0, 7.0, 10.0, 15.0, 19.0, 17.0, 18.0, 15.0, 19.0, 29.0, 33.0, 37.0, 37.0, 39.0, 39.0, 42.0, 55.0, 65.0, 42.0, 33.0, 38.0, 38.0, 34.0, 28.0, 38.0, 27.0, 20.0, 19.0, 29.0, 28.0, 16.0, 15.0, 13.0, 8.0, 3.0, 7.0, 6.0, 6.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.1821625828742981, -0.17678111791610718, -0.17139965295791626, -0.16601818799972534, -0.16063672304153442, -0.1552552729845047, -0.14987380802631378, -0.14449234306812286, -0.13911087810993195, -0.13372941315174103, -0.1283479481935501, -0.12296649068593979, -0.11758502572774887, -0.11220356076955795, -0.10682210326194763, -0.10144063830375671, -0.0960591733455658, -0.09067770838737488, -0.08529624342918396, -0.07991478592157364, -0.07453332096338272, -0.0691518560051918, -0.06377039849758148, -0.058388933539390564, -0.053007468581199646, -0.04762600362300873, -0.04224454239010811, -0.03686308115720749, -0.03148161619901657, -0.026100153103470802, -0.020718690007925034, -0.015337228775024414, -0.009955763816833496, -0.004574300721287727, 0.0008071623742580414, 0.00618862546980381, 0.011570088565349579, 0.016951551660895348, 0.022333014756441116, 0.027714475989341736, 0.033095940947532654, 0.03847740590572357, 0.04385886713862419, 0.04924032837152481, 0.05462179332971573, 0.06000325828790665, 0.06538471579551697, 0.07076618075370789, 0.0761476457118988, 0.08152911067008972, 0.08691057562828064, 0.09229203313589096, 0.09767349809408188, 0.1030549630522728, 0.10843642055988312, 0.11381788551807404, 0.11919935047626495, 0.12458081543445587, 0.1299622803926468, 0.1353437453508377, 0.14072519540786743, 0.14610666036605835, 0.15148812532424927, 0.15686959028244019, 0.1622510552406311]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 5.0, 11.0, 11.0, 20.0, 42.0, 36.0, 73.0, 102.0, 158.0, 256.0, 420.0, 1069.0, 17906.0, 2931269.0, 1233244.0, 7839.0, 801.0, 370.0, 211.0, 126.0, 112.0, 67.0, 43.0, 32.0, 25.0, 14.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1348876953125, -0.1298675537109375, -0.124847412109375, -0.1198272705078125, -0.11480712890625, -0.1097869873046875, -0.104766845703125, -0.0997467041015625, -0.0947265625, -0.0897064208984375, -0.084686279296875, -0.0796661376953125, -0.07464599609375, -0.0696258544921875, -0.064605712890625, -0.0595855712890625, -0.0545654296875, -0.0495452880859375, -0.044525146484375, -0.0395050048828125, -0.03448486328125, -0.0294647216796875, -0.024444580078125, -0.0194244384765625, -0.014404296875, -0.0093841552734375, -0.004364013671875, 0.0006561279296875, 0.00567626953125, 0.0106964111328125, 0.015716552734375, 0.0207366943359375, 0.0257568359375, 0.0307769775390625, 0.035797119140625, 0.0408172607421875, 0.04583740234375, 0.0508575439453125, 0.055877685546875, 0.0608978271484375, 0.06591796875, 0.0709381103515625, 0.075958251953125, 0.0809783935546875, 0.08599853515625, 0.0910186767578125, 0.096038818359375, 0.1010589599609375, 0.1060791015625, 0.1110992431640625, 0.116119384765625, 0.1211395263671875, 0.12615966796875, 0.1311798095703125, 0.136199951171875, 0.1412200927734375, 0.146240234375, 0.1512603759765625, 0.156280517578125, 0.1613006591796875, 0.16632080078125, 0.1713409423828125, 0.176361083984375, 0.1813812255859375, 0.1864013671875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 23.0, 22.0, 34.0, 42.0, 49.0, 65.0, 81.0, 78.0, 90.0, 81.0, 81.0, 83.0, 59.0, 58.0, 35.0, 29.0, 25.0, 22.0, 11.0, 8.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05609130859375, -0.05438995361328125, -0.0526885986328125, -0.05098724365234375, -0.049285888671875, -0.04758453369140625, -0.0458831787109375, -0.04418182373046875, -0.04248046875, -0.04077911376953125, -0.0390777587890625, -0.03737640380859375, -0.035675048828125, -0.03397369384765625, -0.0322723388671875, -0.03057098388671875, -0.02886962890625, -0.02716827392578125, -0.0254669189453125, -0.02376556396484375, -0.022064208984375, -0.02036285400390625, -0.0186614990234375, -0.01696014404296875, -0.0152587890625, -0.01355743408203125, -0.0118560791015625, -0.01015472412109375, -0.008453369140625, -0.00675201416015625, -0.0050506591796875, -0.00334930419921875, -0.00164794921875, 5.340576171875e-05, 0.0017547607421875, 0.00345611572265625, 0.005157470703125, 0.00685882568359375, 0.0085601806640625, 0.01026153564453125, 0.011962890625, 0.01366424560546875, 0.0153656005859375, 0.01706695556640625, 0.018768310546875, 0.02046966552734375, 0.0221710205078125, 0.02387237548828125, 0.02557373046875, 0.02727508544921875, 0.0289764404296875, 0.03067779541015625, 0.032379150390625, 0.03408050537109375, 0.0357818603515625, 0.03748321533203125, 0.0391845703125, 0.04088592529296875, 0.0425872802734375, 0.04428863525390625, 0.045989990234375, 0.04769134521484375, 0.0493927001953125, 0.05109405517578125, 0.05279541015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 6.0, 8.0, 9.0, 19.0, 19.0, 38.0, 55.0, 110.0, 214.0, 462.0, 1134.0, 3270.0, 13472.0, 141710.0, 3441207.0, 556436.0, 28082.0, 5156.0, 1596.0, 632.0, 276.0, 170.0, 75.0, 52.0, 19.0, 19.0, 16.0, 8.0, 3.0, 7.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.09521484375, -0.09247016906738281, -0.08972549438476562, -0.08698081970214844, -0.08423614501953125, -0.08149147033691406, -0.07874679565429688, -0.07600212097167969, -0.0732574462890625, -0.07051277160644531, -0.06776809692382812, -0.06502342224121094, -0.06227874755859375, -0.05953407287597656, -0.056789398193359375, -0.05404472351074219, -0.051300048828125, -0.04855537414550781, -0.045810699462890625, -0.04306602478027344, -0.04032135009765625, -0.03757667541503906, -0.034832000732421875, -0.03208732604980469, -0.0293426513671875, -0.026597976684570312, -0.023853302001953125, -0.021108627319335938, -0.01836395263671875, -0.015619277954101562, -0.012874603271484375, -0.010129928588867188, -0.00738525390625, -0.0046405792236328125, -0.001895904541015625, 0.0008487701416015625, 0.00359344482421875, 0.0063381195068359375, 0.009082794189453125, 0.011827468872070312, 0.0145721435546875, 0.017316818237304688, 0.020061492919921875, 0.022806167602539062, 0.02555084228515625, 0.028295516967773438, 0.031040191650390625, 0.03378486633300781, 0.036529541015625, 0.03927421569824219, 0.042018890380859375, 0.04476356506347656, 0.04750823974609375, 0.05025291442871094, 0.052997589111328125, 0.05574226379394531, 0.0584869384765625, 0.06123161315917969, 0.06397628784179688, 0.06672096252441406, 0.06946563720703125, 0.07221031188964844, 0.07495498657226562, 0.07769966125488281, 0.0804443359375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 8.0, 9.0, 7.0, 8.0, 18.0, 30.0, 54.0, 76.0, 128.0, 161.0, 272.0, 410.0, 525.0, 596.0, 550.0, 410.0, 293.0, 200.0, 117.0, 75.0, 48.0, 23.0, 21.0, 17.0, 5.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07135009765625, -0.06883907318115234, -0.06632804870605469, -0.06381702423095703, -0.061305999755859375, -0.05879497528076172, -0.05628395080566406, -0.053772926330566406, -0.05126190185546875, -0.048750877380371094, -0.04623985290527344, -0.04372882843017578, -0.041217803955078125, -0.03870677947998047, -0.03619575500488281, -0.033684730529785156, -0.0311737060546875, -0.028662681579589844, -0.026151657104492188, -0.02364063262939453, -0.021129608154296875, -0.01861858367919922, -0.016107559204101562, -0.013596534729003906, -0.01108551025390625, -0.008574485778808594, -0.0060634613037109375, -0.0035524368286132812, -0.001041412353515625, 0.0014696121215820312, 0.0039806365966796875, 0.006491661071777344, 0.009002685546875, 0.011513710021972656, 0.014024734497070312, 0.01653575897216797, 0.019046783447265625, 0.02155780792236328, 0.024068832397460938, 0.026579856872558594, 0.02909088134765625, 0.031601905822753906, 0.03411293029785156, 0.03662395477294922, 0.039134979248046875, 0.04164600372314453, 0.04415702819824219, 0.046668052673339844, 0.0491790771484375, 0.051690101623535156, 0.05420112609863281, 0.05671215057373047, 0.059223175048828125, 0.06173419952392578, 0.06424522399902344, 0.0667562484741211, 0.06926727294921875, 0.0717782974243164, 0.07428932189941406, 0.07680034637451172, 0.07931137084960938, 0.08182239532470703, 0.08433341979980469, 0.08684444427490234, 0.08935546875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 10.0, 14.0, 20.0, 35.0, 56.0, 94.0, 124.0, 134.0, 135.0, 110.0, 93.0, 54.0, 34.0, 20.0, 17.0, 16.0, 6.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.48169568181037903, -0.4636991322040558, -0.44570258259773254, -0.4277060329914093, -0.40970945358276367, -0.39171290397644043, -0.3737163543701172, -0.35571980476379395, -0.3377232551574707, -0.31972670555114746, -0.3017301559448242, -0.283733606338501, -0.26573705673217773, -0.2477404922246933, -0.22974392771720886, -0.21174737811088562, -0.19375082850456238, -0.17575427889823914, -0.1577577292919159, -0.13976116478443146, -0.12176461517810822, -0.10376806557178497, -0.08577150851488113, -0.0677749514579773, -0.04977840185165405, -0.03178184852004051, -0.013785295188426971, 0.004211258143186569, 0.02220781147480011, 0.04020436108112335, 0.05820091813802719, 0.07619747519493103, 0.09419405460357666, 0.1121906042098999, 0.13018715381622314, 0.14818371832370758, 0.16618026793003082, 0.18417681753635406, 0.2021733820438385, 0.22016993165016174, 0.23816648125648499, 0.2561630308628082, 0.27415958046913147, 0.2921561300754547, 0.31015270948410034, 0.3281492590904236, 0.3461458086967468, 0.36414235830307007, 0.3821389079093933, 0.40013545751571655, 0.4181320071220398, 0.43612855672836304, 0.4541251063346863, 0.4721216559410095, 0.49011823534965515, 0.5081148147583008, 0.526111364364624, 0.5441079139709473, 0.5621044635772705, 0.5801010131835938, 0.598097562789917, 0.6160941123962402, 0.6340906620025635, 0.6520872116088867, 0.67008376121521]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 5.0, 3.0, 7.0, 5.0, 7.0, 10.0, 13.0, 19.0, 11.0, 38.0, 27.0, 38.0, 39.0, 45.0, 52.0, 50.0, 55.0, 52.0, 57.0, 61.0, 51.0, 48.0, 38.0, 37.0, 43.0, 30.0, 30.0, 28.0, 11.0, 21.0, 16.0, 12.0, 9.0, 5.0, 5.0, 9.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.32050347328186035, -0.3106463551521301, -0.3007892072200775, -0.2909320890903473, -0.28107497096061707, -0.27121785283088684, -0.26136070489883423, -0.251503586769104, -0.24164646863937378, -0.23178933560848236, -0.22193221747875214, -0.21207508444786072, -0.2022179663181305, -0.19236083328723907, -0.18250370025634766, -0.17264658212661743, -0.162789449095726, -0.1529323160648346, -0.14307519793510437, -0.13321806490421295, -0.12336094677448273, -0.11350381374359131, -0.10364668816328049, -0.09378956258296967, -0.08393243700265884, -0.07407531142234802, -0.0642181858420372, -0.05436105653643608, -0.04450393095612526, -0.03464680537581444, -0.024789676070213318, -0.014932550489902496, -0.005075424909591675, 0.004781701602041721, 0.014638828113675117, 0.024495955556631088, 0.03435308113694191, 0.04421020671725273, 0.05406733602285385, 0.06392446160316467, 0.0737815871834755, 0.08363871276378632, 0.09349583834409714, 0.10335296392440796, 0.11321009695529938, 0.1230672150850296, 0.13292434811592102, 0.14278146624565125, 0.15263859927654266, 0.16249573230743408, 0.1723528504371643, 0.18220998346805573, 0.19206710159778595, 0.20192423462867737, 0.2117813527584076, 0.221638485789299, 0.23149561882019043, 0.24135275185108185, 0.25120988488197327, 0.2610670030117035, 0.2709241211414337, 0.28078123927116394, 0.29063838720321655, 0.3004955053329468, 0.310352623462677]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 8.0, 6.0, 12.0, 7.0, 16.0, 5.0, 20.0, 24.0, 36.0, 39.0, 60.0, 73.0, 115.0, 139.0, 178.0, 315.0, 483.0, 758.0, 1354.0, 3217.0, 10080.0, 55431.0, 578907.0, 350326.0, 33864.0, 7210.0, 2591.0, 1225.0, 663.0, 390.0, 262.0, 205.0, 160.0, 79.0, 74.0, 49.0, 33.0, 33.0, 22.0, 17.0, 15.0, 8.0, 3.0, 9.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.0892333984375, -0.08659934997558594, -0.08396530151367188, -0.08133125305175781, -0.07869720458984375, -0.07606315612792969, -0.07342910766601562, -0.07079505920410156, -0.0681610107421875, -0.06552696228027344, -0.06289291381835938, -0.06025886535644531, -0.05762481689453125, -0.05499076843261719, -0.052356719970703125, -0.04972267150878906, -0.047088623046875, -0.04445457458496094, -0.041820526123046875, -0.03918647766113281, -0.03655242919921875, -0.03391838073730469, -0.031284332275390625, -0.028650283813476562, -0.0260162353515625, -0.023382186889648438, -0.020748138427734375, -0.018114089965820312, -0.01548004150390625, -0.012845993041992188, -0.010211944580078125, -0.0075778961181640625, -0.00494384765625, -0.0023097991943359375, 0.000324249267578125, 0.0029582977294921875, 0.00559234619140625, 0.008226394653320312, 0.010860443115234375, 0.013494491577148438, 0.0161285400390625, 0.018762588500976562, 0.021396636962890625, 0.024030685424804688, 0.02666473388671875, 0.029298782348632812, 0.031932830810546875, 0.03456687927246094, 0.037200927734375, 0.03983497619628906, 0.042469024658203125, 0.04510307312011719, 0.04773712158203125, 0.05037117004394531, 0.053005218505859375, 0.05563926696777344, 0.0582733154296875, 0.06090736389160156, 0.06354141235351562, 0.06617546081542969, 0.06880950927734375, 0.07144355773925781, 0.07407760620117188, 0.07671165466308594, 0.079345703125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 0.0, 2.0, 3.0, 3.0, 9.0, 7.0, 8.0, 11.0, 14.0, 18.0, 25.0, 22.0, 28.0, 34.0, 40.0, 54.0, 62.0, 52.0, 63.0, 55.0, 74.0, 39.0, 46.0, 54.0, 37.0, 44.0, 35.0, 32.0, 33.0, 23.0, 15.0, 19.0, 8.0, 6.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.053009033203125, -0.05148124694824219, -0.049953460693359375, -0.04842567443847656, -0.04689788818359375, -0.04537010192871094, -0.043842315673828125, -0.04231452941894531, -0.0407867431640625, -0.03925895690917969, -0.037731170654296875, -0.03620338439941406, -0.03467559814453125, -0.03314781188964844, -0.031620025634765625, -0.030092239379882812, -0.028564453125, -0.027036666870117188, -0.025508880615234375, -0.023981094360351562, -0.02245330810546875, -0.020925521850585938, -0.019397735595703125, -0.017869949340820312, -0.0163421630859375, -0.014814376831054688, -0.013286590576171875, -0.011758804321289062, -0.01023101806640625, -0.008703231811523438, -0.007175445556640625, -0.0056476593017578125, -0.004119873046875, -0.0025920867919921875, -0.001064300537109375, 0.0004634857177734375, 0.00199127197265625, 0.0035190582275390625, 0.005046844482421875, 0.0065746307373046875, 0.0081024169921875, 0.009630203247070312, 0.011157989501953125, 0.012685775756835938, 0.01421356201171875, 0.015741348266601562, 0.017269134521484375, 0.018796920776367188, 0.02032470703125, 0.021852493286132812, 0.023380279541015625, 0.024908065795898438, 0.02643585205078125, 0.027963638305664062, 0.029491424560546875, 0.031019210815429688, 0.0325469970703125, 0.03407478332519531, 0.035602569580078125, 0.03713035583496094, 0.03865814208984375, 0.04018592834472656, 0.041713714599609375, 0.04324150085449219, 0.044769287109375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 10.0, 20.0, 25.0, 20.0, 34.0, 59.0, 103.0, 191.0, 392.0, 1867.0, 79685.0, 956389.0, 8258.0, 817.0, 278.0, 154.0, 102.0, 43.0, 35.0, 15.0, 9.0, 12.0, 2.0, 6.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169189453125, -0.16439056396484375, -0.1595916748046875, -0.15479278564453125, -0.149993896484375, -0.14519500732421875, -0.1403961181640625, -0.13559722900390625, -0.13079833984375, -0.12599945068359375, -0.1212005615234375, -0.11640167236328125, -0.111602783203125, -0.10680389404296875, -0.1020050048828125, -0.09720611572265625, -0.0924072265625, -0.08760833740234375, -0.0828094482421875, -0.07801055908203125, -0.073211669921875, -0.06841278076171875, -0.0636138916015625, -0.05881500244140625, -0.05401611328125, -0.04921722412109375, -0.0444183349609375, -0.03961944580078125, -0.034820556640625, -0.03002166748046875, -0.0252227783203125, -0.02042388916015625, -0.015625, -0.01082611083984375, -0.0060272216796875, -0.00122833251953125, 0.003570556640625, 0.00836944580078125, 0.0131683349609375, 0.01796722412109375, 0.02276611328125, 0.02756500244140625, 0.0323638916015625, 0.03716278076171875, 0.041961669921875, 0.04676055908203125, 0.0515594482421875, 0.05635833740234375, 0.0611572265625, 0.06595611572265625, 0.0707550048828125, 0.07555389404296875, 0.080352783203125, 0.08515167236328125, 0.0899505615234375, 0.09474945068359375, 0.09954833984375, 0.10434722900390625, 0.1091461181640625, 0.11394500732421875, 0.118743896484375, 0.12354278564453125, 0.1283416748046875, 0.13314056396484375, 0.137939453125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 9.0, 17.0, 23.0, 22.0, 32.0, 40.0, 61.0, 69.0, 74.0, 90.0, 90.0, 100.0, 75.0, 67.0, 56.0, 37.0, 33.0, 27.0, 20.0, 16.0, 6.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.1575298309326172, -0.15307235717773438, -0.14861488342285156, -0.14415740966796875, -0.13969993591308594, -0.13524246215820312, -0.1307849884033203, -0.1263275146484375, -0.12187004089355469, -0.11741256713867188, -0.11295509338378906, -0.10849761962890625, -0.10404014587402344, -0.09958267211914062, -0.09512519836425781, -0.090667724609375, -0.08621025085449219, -0.08175277709960938, -0.07729530334472656, -0.07283782958984375, -0.06838035583496094, -0.06392288208007812, -0.05946540832519531, -0.0550079345703125, -0.05055046081542969, -0.046092987060546875, -0.04163551330566406, -0.03717803955078125, -0.03272056579589844, -0.028263092041015625, -0.023805618286132812, -0.01934814453125, -0.014890670776367188, -0.010433197021484375, -0.0059757232666015625, -0.00151824951171875, 0.0029392242431640625, 0.007396697998046875, 0.011854171752929688, 0.0163116455078125, 0.020769119262695312, 0.025226593017578125, 0.029684066772460938, 0.03414154052734375, 0.03859901428222656, 0.043056488037109375, 0.04751396179199219, 0.051971435546875, 0.05642890930175781, 0.060886383056640625, 0.06534385681152344, 0.06980133056640625, 0.07425880432128906, 0.07871627807617188, 0.08317375183105469, 0.0876312255859375, 0.09208869934082031, 0.09654617309570312, 0.10100364685058594, 0.10546112060546875, 0.10991859436035156, 0.11437606811523438, 0.11883354187011719, 0.123291015625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 10.0, 14.0, 19.0, 20.0, 56.0, 108.0, 254.0, 802.0, 6450.0, 878576.0, 158540.0, 2725.0, 554.0, 198.0, 82.0, 48.0, 22.0, 20.0, 17.0, 6.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.043121337890625, -0.041808128356933594, -0.04049491882324219, -0.03918170928955078, -0.037868499755859375, -0.03655529022216797, -0.03524208068847656, -0.033928871154785156, -0.03261566162109375, -0.031302452087402344, -0.029989242553710938, -0.02867603302001953, -0.027362823486328125, -0.02604961395263672, -0.024736404418945312, -0.023423194885253906, -0.0221099853515625, -0.020796775817871094, -0.019483566284179688, -0.01817035675048828, -0.016857147216796875, -0.015543937683105469, -0.014230728149414062, -0.012917518615722656, -0.01160430908203125, -0.010291099548339844, -0.008977890014648438, -0.007664680480957031, -0.006351470947265625, -0.005038261413574219, -0.0037250518798828125, -0.0024118423461914062, -0.0010986328125, 0.00021457672119140625, 0.0015277862548828125, 0.0028409957885742188, 0.004154205322265625, 0.005467414855957031, 0.0067806243896484375, 0.008093833923339844, 0.00940704345703125, 0.010720252990722656, 0.012033462524414062, 0.013346672058105469, 0.014659881591796875, 0.01597309112548828, 0.017286300659179688, 0.018599510192871094, 0.0199127197265625, 0.021225929260253906, 0.022539138793945312, 0.02385234832763672, 0.025165557861328125, 0.02647876739501953, 0.027791976928710938, 0.029105186462402344, 0.03041839599609375, 0.031731605529785156, 0.03304481506347656, 0.03435802459716797, 0.035671234130859375, 0.03698444366455078, 0.03829765319824219, 0.039610862731933594, 0.040924072265625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 9.0, 13.0, 17.0, 8.0, 15.0, 32.0, 18.0, 45.0, 51.0, 25.0, 54.0, 68.0, 36.0, 65.0, 85.0, 37.0, 71.0, 66.0, 51.0, 26.0, 40.0, 29.0, 14.0, 30.0, 16.0, 7.0, 20.0, 16.0, 2.0, 3.0, 8.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.039836883544922e-06, -2.93925404548645e-06, -2.8386712074279785e-06, -2.738088369369507e-06, -2.637505531311035e-06, -2.5369226932525635e-06, -2.436339855194092e-06, -2.33575701713562e-06, -2.2351741790771484e-06, -2.1345913410186768e-06, -2.034008502960205e-06, -1.9334256649017334e-06, -1.8328428268432617e-06, -1.73225998878479e-06, -1.6316771507263184e-06, -1.5310943126678467e-06, -1.430511474609375e-06, -1.3299286365509033e-06, -1.2293457984924316e-06, -1.12876296043396e-06, -1.0281801223754883e-06, -9.275972843170166e-07, -8.270144462585449e-07, -7.264316082000732e-07, -6.258487701416016e-07, -5.252659320831299e-07, -4.246830940246582e-07, -3.241002559661865e-07, -2.2351741790771484e-07, -1.2293457984924316e-07, -2.2351741790771484e-08, 7.82310962677002e-08, 1.7881393432617188e-07, 2.7939677238464355e-07, 3.7997961044311523e-07, 4.805624485015869e-07, 5.811452865600586e-07, 6.817281246185303e-07, 7.82310962677002e-07, 8.828938007354736e-07, 9.834766387939453e-07, 1.084059476852417e-06, 1.1846423149108887e-06, 1.2852251529693604e-06, 1.385807991027832e-06, 1.4863908290863037e-06, 1.5869736671447754e-06, 1.687556505203247e-06, 1.7881393432617188e-06, 1.8887221813201904e-06, 1.989305019378662e-06, 2.089887857437134e-06, 2.1904706954956055e-06, 2.291053533554077e-06, 2.391636371612549e-06, 2.4922192096710205e-06, 2.592802047729492e-06, 2.693384885787964e-06, 2.7939677238464355e-06, 2.8945505619049072e-06, 2.995133399963379e-06, 3.0957162380218506e-06, 3.1962990760803223e-06, 3.296881914138794e-06, 3.3974647521972656e-06]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 9.0, 12.0, 18.0, 40.0, 79.0, 160.0, 535.0, 4021.0, 897382.0, 143893.0, 1845.0, 346.0, 130.0, 46.0, 16.0, 10.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07232666015625, -0.07063913345336914, -0.06895160675048828, -0.06726408004760742, -0.06557655334472656, -0.0638890266418457, -0.062201499938964844, -0.060513973236083984, -0.058826446533203125, -0.057138919830322266, -0.055451393127441406, -0.05376386642456055, -0.05207633972167969, -0.05038881301879883, -0.04870128631591797, -0.04701375961303711, -0.04532623291015625, -0.04363870620727539, -0.04195117950439453, -0.04026365280151367, -0.03857612609863281, -0.03688859939575195, -0.035201072692871094, -0.033513545989990234, -0.031826019287109375, -0.030138492584228516, -0.028450965881347656, -0.026763439178466797, -0.025075912475585938, -0.023388385772705078, -0.02170085906982422, -0.02001333236694336, -0.0183258056640625, -0.01663827896118164, -0.014950752258300781, -0.013263225555419922, -0.011575698852539062, -0.009888172149658203, -0.008200645446777344, -0.006513118743896484, -0.004825592041015625, -0.0031380653381347656, -0.0014505386352539062, 0.00023698806762695312, 0.0019245147705078125, 0.003612041473388672, 0.005299568176269531, 0.006987094879150391, 0.00867462158203125, 0.01036214828491211, 0.012049674987792969, 0.013737201690673828, 0.015424728393554688, 0.017112255096435547, 0.018799781799316406, 0.020487308502197266, 0.022174835205078125, 0.023862361907958984, 0.025549888610839844, 0.027237415313720703, 0.028924942016601562, 0.030612468719482422, 0.03229999542236328, 0.03398752212524414, 0.035675048828125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 2.0, 10.0, 18.0, 33.0, 41.0, 71.0, 130.0, 187.0, 182.0, 139.0, 89.0, 45.0, 26.0, 7.0, 11.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03326416015625, -0.032291412353515625, -0.03131866455078125, -0.030345916748046875, -0.0293731689453125, -0.028400421142578125, -0.02742767333984375, -0.026454925537109375, -0.025482177734375, -0.024509429931640625, -0.02353668212890625, -0.022563934326171875, -0.0215911865234375, -0.020618438720703125, -0.01964569091796875, -0.018672943115234375, -0.0177001953125, -0.016727447509765625, -0.01575469970703125, -0.014781951904296875, -0.0138092041015625, -0.012836456298828125, -0.01186370849609375, -0.010890960693359375, -0.009918212890625, -0.008945465087890625, -0.00797271728515625, -0.006999969482421875, -0.0060272216796875, -0.005054473876953125, -0.00408172607421875, -0.003108978271484375, -0.00213623046875, -0.001163482666015625, -0.00019073486328125, 0.000782012939453125, 0.0017547607421875, 0.002727508544921875, 0.00370025634765625, 0.004673004150390625, 0.005645751953125, 0.006618499755859375, 0.00759124755859375, 0.008563995361328125, 0.0095367431640625, 0.010509490966796875, 0.01148223876953125, 0.012454986572265625, 0.013427734375, 0.014400482177734375, 0.01537322998046875, 0.016345977783203125, 0.0173187255859375, 0.018291473388671875, 0.01926422119140625, 0.020236968994140625, 0.021209716796875, 0.022182464599609375, 0.02315521240234375, 0.024127960205078125, 0.0251007080078125, 0.026073455810546875, 0.02704620361328125, 0.028018951416015625, 0.02899169921875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 22.0, 62.0, 265.0, 505.0, 103.0, 28.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5306867361068726, -1.497685432434082, -1.464684247970581, -1.4316829442977905, -1.3986817598342896, -1.365680456161499, -1.332679271697998, -1.2996779680252075, -1.266676664352417, -1.2336753606796265, -1.2006741762161255, -1.167672872543335, -1.134671688079834, -1.1016703844070435, -1.0686691999435425, -1.035667896270752, -1.002666711807251, -0.9696654677391052, -0.9366642236709595, -0.9036629796028137, -0.870661735534668, -0.8376604318618774, -0.8046591877937317, -0.7716579437255859, -0.7386566996574402, -0.7056554555892944, -0.6726542115211487, -0.6396529674530029, -0.6066516637802124, -0.5736504793167114, -0.5406491756439209, -0.5076479315757751, -0.4746466279029846, -0.44164538383483887, -0.4086441397666931, -0.375642865896225, -0.3426416218280792, -0.30964037775993347, -0.27663910388946533, -0.24363785982131958, -0.21063661575317383, -0.17763537168502808, -0.14463411271572113, -0.11163286119699478, -0.07863160967826843, -0.04563036561012268, -0.012629106640815735, 0.02037215232849121, 0.05337339639663696, 0.08637464791536331, 0.11937589943408966, 0.1523771584033966, 0.18537840247154236, 0.2183796465396881, 0.25138092041015625, 0.284382164478302, 0.31738340854644775, 0.3503846526145935, 0.38338589668273926, 0.4163871705532074, 0.44938841462135315, 0.4823896586894989, 0.515390932559967, 0.5483921766281128, 0.5813934206962585]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 11.0, 22.0, 37.0, 47.0, 79.0, 68.0, 112.0, 189.0, 125.0, 97.0, 63.0, 55.0, 39.0, 22.0, 12.0, 5.0, 3.0, 7.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8924422264099121, -0.8734107613563538, -0.8543792963027954, -0.8353478312492371, -0.8163163661956787, -0.7972848415374756, -0.778253436088562, -0.7592219114303589, -0.7401904463768005, -0.7211589813232422, -0.7021275162696838, -0.6830960512161255, -0.6640645861625671, -0.6450331211090088, -0.6260015964508057, -0.6069701313972473, -0.587938666343689, -0.5689072012901306, -0.5498757362365723, -0.5308442711830139, -0.5118128061294556, -0.49278131127357483, -0.4737498462200165, -0.45471835136413574, -0.43568694591522217, -0.4166554808616638, -0.39762401580810547, -0.3785925507545471, -0.3595610558986664, -0.34052959084510803, -0.3214981257915497, -0.30246663093566895, -0.2834351658821106, -0.26440370082855225, -0.2453722208738327, -0.22634075582027435, -0.2073092758655548, -0.18827781081199646, -0.1692463457584381, -0.15021486580371857, -0.13118340075016022, -0.11215192824602127, -0.09312045574188232, -0.07408899068832397, -0.05505751818418503, -0.03602604568004608, -0.016994580626487732, 0.0020368993282318115, 0.02106836438179016, 0.04009983688592911, 0.059131305664777756, 0.0781627744436264, 0.09719424694776535, 0.1162257194519043, 0.13525718450546265, 0.1542886644601822, 0.17332012951374054, 0.1923515945672989, 0.21138307452201843, 0.23041453957557678, 0.24944600462913513, 0.26847749948501587, 0.2875089645385742, 0.30654042959213257, 0.3255718946456909]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 11.0, 15.0, 40.0, 84.0, 540.0, 153.0, 80.0, 33.0, 27.0, 16.0, 4.0, 6.0, 2.0, 2.0], "bins": [-0.338623046875, -0.33243513107299805, -0.3262472152709961, -0.32005929946899414, -0.3138713836669922, -0.30768346786499023, -0.3014955520629883, -0.29530763626098633, -0.2891197204589844, -0.2829318046569824, -0.27674388885498047, -0.2705559730529785, -0.26436805725097656, -0.2581801414489746, -0.25199222564697266, -0.2458043098449707, -0.23961639404296875, -0.2334284782409668, -0.22724056243896484, -0.2210526466369629, -0.21486473083496094, -0.20867681503295898, -0.20248889923095703, -0.19630098342895508, -0.19011306762695312, -0.18392515182495117, -0.17773723602294922, -0.17154932022094727, -0.1653614044189453, -0.15917348861694336, -0.1529855728149414, -0.14679765701293945, -0.1406097412109375, -0.13442182540893555, -0.1282339096069336, -0.12204599380493164, -0.11585807800292969, -0.10967016220092773, -0.10348224639892578, -0.09729433059692383, -0.09110641479492188, -0.08491849899291992, -0.07873058319091797, -0.07254266738891602, -0.06635475158691406, -0.06016683578491211, -0.053978919982910156, -0.0477910041809082, -0.04160308837890625, -0.0354151725769043, -0.029227256774902344, -0.02303934097290039, -0.016851425170898438, -0.010663509368896484, -0.004475593566894531, 0.0017123222351074219, 0.007900238037109375, 0.014088153839111328, 0.02027606964111328, 0.026463985443115234, 0.03265190124511719, 0.03883981704711914, 0.045027732849121094, 0.05121564865112305, 0.057403564453125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 6.0, 1.0, 7.0, 13.0, 6.0, 13.0, 10.0, 12.0, 14.0, 21.0, 18.0, 35.0, 35.0, 45.0, 68.0, 121.0, 213.0, 460.0, 1090.0, 3841.0, 30481.0, 8330386.0, 17616.0, 2645.0, 750.0, 272.0, 146.0, 90.0, 55.0, 29.0, 25.0, 16.0, 10.0, 6.0, 4.0, 3.0, 7.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2039896547794342, -0.19806107878684998, -0.19213250279426575, -0.18620392680168152, -0.1802753508090973, -0.17434677481651306, -0.16841819882392883, -0.1624896228313446, -0.15656104683876038, -0.15063247084617615, -0.14470389485359192, -0.1387753188610077, -0.13284674286842346, -0.12691816687583923, -0.120989590883255, -0.11506101489067078, -0.10913243889808655, -0.10320386290550232, -0.09727528691291809, -0.09134671092033386, -0.08541813492774963, -0.0794895589351654, -0.07356098294258118, -0.06763240694999695, -0.06170383095741272, -0.05577525496482849, -0.04984667897224426, -0.043918102979660034, -0.037989526987075806, -0.03206095099449158, -0.02613237500190735, -0.02020379900932312, -0.014275208115577698, -0.00834663212299347, -0.0024180561304092407, 0.003510519862174988, 0.009439095854759216, 0.015367671847343445, 0.021296247839927673, 0.027224823832511902, 0.03315339982509613, 0.03908197581768036, 0.04501055181026459, 0.050939127802848816, 0.056867703795433044, 0.06279627978801727, 0.0687248557806015, 0.07465343177318573, 0.08058200776576996, 0.08651058375835419, 0.09243915975093842, 0.09836773574352264, 0.10429631173610687, 0.1102248877286911, 0.11615346372127533, 0.12208203971385956, 0.1280106157064438, 0.13393919169902802, 0.13986776769161224, 0.14579634368419647, 0.1517249196767807, 0.15765349566936493, 0.16358207166194916, 0.1695106476545334, 0.17543922364711761]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 27.0, 4.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.017036374658346176, -0.012969929724931717, -0.008903484791517258, -0.0048370398581027985, -0.0007705949246883392, 0.00329585000872612, 0.007362294942140579, 0.011428739875555038, 0.015495184808969498, 0.019561629742383957, 0.023628074675798416, 0.027694519609212875, 0.031760964542627335, 0.035827409476041794, 0.03989385440945625, 0.04396029934287071, 0.04802674427628517, 0.05209318920969963, 0.05615963414311409, 0.06022607907652855, 0.06429252028465271, 0.06835897266864777, 0.07242541015148163, 0.07649186253547668, 0.08055830001831055, 0.084624744951725, 0.08869118988513947, 0.09275763481855392, 0.09682407975196838, 0.10089052468538284, 0.1049569696187973, 0.10902341455221176, 0.11308987438678741, 0.11715631932020187, 0.12122276425361633, 0.1252892017364502, 0.12935565412044525, 0.1334221065044403, 0.13748854398727417, 0.14155498147010803, 0.1456214338541031, 0.14968788623809814, 0.153754323720932, 0.15782076120376587, 0.16188721358776093, 0.16595366597175598, 0.17002010345458984, 0.1740865409374237, 0.17815299332141876, 0.18221944570541382, 0.18628588318824768, 0.19035232067108154, 0.1944187730550766, 0.19848522543907166, 0.20255166292190552, 0.20661810040473938, 0.21068455278873444, 0.2147510051727295, 0.21881744265556335, 0.22288388013839722, 0.22695033252239227, 0.23101678490638733, 0.2350832223892212, 0.23914965987205505, 0.2432161122560501]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 8.0, 4.0, 12.0, 20.0, 20.0, 32.0, 34.0, 54.0, 54.0, 76.0, 69.0, 88.0, 93.0, 88.0, 50.0, 61.0, 43.0, 44.0, 38.0, 29.0, 13.0, 12.0, 7.0, 6.0, 8.0, 4.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.044647216796875, -0.042859554290771484, -0.04107189178466797, -0.03928422927856445, -0.03749656677246094, -0.03570890426635742, -0.033921241760253906, -0.03213357925415039, -0.030345916748046875, -0.02855825424194336, -0.026770591735839844, -0.024982929229736328, -0.023195266723632812, -0.021407604217529297, -0.01961994171142578, -0.017832279205322266, -0.01604461669921875, -0.014256954193115234, -0.012469291687011719, -0.010681629180908203, -0.008893966674804688, -0.007106304168701172, -0.005318641662597656, -0.0035309791564941406, -0.001743316650390625, 4.4345855712890625e-05, 0.0018320083618164062, 0.003619670867919922, 0.0054073333740234375, 0.007194995880126953, 0.008982658386230469, 0.010770320892333984, 0.0125579833984375, 0.014345645904541016, 0.01613330841064453, 0.017920970916748047, 0.019708633422851562, 0.021496295928955078, 0.023283958435058594, 0.02507162094116211, 0.026859283447265625, 0.02864694595336914, 0.030434608459472656, 0.03222227096557617, 0.03400993347167969, 0.0357975959777832, 0.03758525848388672, 0.039372920989990234, 0.04116058349609375, 0.042948246002197266, 0.04473590850830078, 0.0465235710144043, 0.04831123352050781, 0.05009889602661133, 0.051886558532714844, 0.05367422103881836, 0.055461883544921875, 0.05724954605102539, 0.059037208557128906, 0.06082487106323242, 0.06261253356933594, 0.06440019607543945, 0.06618785858154297, 0.06797552108764648, 0.06976318359375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 6.0, 5.0, 8.0, 8.0, 17.0, 39.0, 42.0, 72.0, 128.0, 210.0, 411.0, 742.0, 1649.0, 3852.0, 10857.0, 34822.0, 169818.0, 231738.0, 47000.0, 13886.0, 4895.0, 1972.0, 950.0, 474.0, 283.0, 138.0, 82.0, 59.0, 42.0, 20.0, 11.0, 11.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.41162109375, -0.3983917236328125, -0.385162353515625, -0.3719329833984375, -0.35870361328125, -0.3454742431640625, -0.332244873046875, -0.3190155029296875, -0.3057861328125, -0.2925567626953125, -0.279327392578125, -0.2660980224609375, -0.25286865234375, -0.2396392822265625, -0.226409912109375, -0.2131805419921875, -0.199951171875, -0.1867218017578125, -0.173492431640625, -0.1602630615234375, -0.14703369140625, -0.1338043212890625, -0.120574951171875, -0.1073455810546875, -0.0941162109375, -0.0808868408203125, -0.067657470703125, -0.0544281005859375, -0.04119873046875, -0.0279693603515625, -0.014739990234375, -0.0015106201171875, 0.01171875, 0.0249481201171875, 0.038177490234375, 0.0514068603515625, 0.06463623046875, 0.0778656005859375, 0.091094970703125, 0.1043243408203125, 0.1175537109375, 0.1307830810546875, 0.144012451171875, 0.1572418212890625, 0.17047119140625, 0.1837005615234375, 0.196929931640625, 0.2101593017578125, 0.223388671875, 0.2366180419921875, 0.249847412109375, 0.2630767822265625, 0.27630615234375, 0.2895355224609375, 0.302764892578125, 0.3159942626953125, 0.3292236328125, 0.3424530029296875, 0.355682373046875, 0.3689117431640625, 0.38214111328125, 0.3953704833984375, 0.408599853515625, 0.4218292236328125, 0.43505859375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 2.0, 5.0, 8.0, 20.0, 16.0, 22.0, 19.0, 32.0, 39.0, 46.0, 57.0, 51.0, 83.0, 79.0, 57.0, 78.0, 64.0, 69.0, 50.0, 52.0, 42.0, 32.0, 29.0, 16.0, 12.0, 9.0, 2.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0440673828125, -0.04251813888549805, -0.040968894958496094, -0.03941965103149414, -0.03787040710449219, -0.036321163177490234, -0.03477191925048828, -0.03322267532348633, -0.031673431396484375, -0.030124187469482422, -0.02857494354248047, -0.027025699615478516, -0.025476455688476562, -0.02392721176147461, -0.022377967834472656, -0.020828723907470703, -0.01927947998046875, -0.017730236053466797, -0.016180992126464844, -0.01463174819946289, -0.013082504272460938, -0.011533260345458984, -0.009984016418457031, -0.008434772491455078, -0.006885528564453125, -0.005336284637451172, -0.0037870407104492188, -0.0022377967834472656, -0.0006885528564453125, 0.0008606910705566406, 0.0024099349975585938, 0.003959178924560547, 0.0055084228515625, 0.007057666778564453, 0.008606910705566406, 0.01015615463256836, 0.011705398559570312, 0.013254642486572266, 0.014803886413574219, 0.016353130340576172, 0.017902374267578125, 0.019451618194580078, 0.02100086212158203, 0.022550106048583984, 0.024099349975585938, 0.02564859390258789, 0.027197837829589844, 0.028747081756591797, 0.03029632568359375, 0.0318455696105957, 0.033394813537597656, 0.03494405746459961, 0.03649330139160156, 0.038042545318603516, 0.03959178924560547, 0.04114103317260742, 0.042690277099609375, 0.04423952102661133, 0.04578876495361328, 0.047338008880615234, 0.04888725280761719, 0.05043649673461914, 0.051985740661621094, 0.05353498458862305, 0.055084228515625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 8.0, 6.0, 2.0, 4.0, 20.0, 46.0, 65.0, 73.0, 72.0, 45.0, 40.0, 26.0, 26.0, 18.0, 16.0, 9.0, 5.0, 7.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14482873678207397, -0.14072056114673615, -0.13661237061023712, -0.1325041949748993, -0.12839600443840027, -0.12428782880306244, -0.12017965316772461, -0.11607147008180618, -0.11196328699588776, -0.10785510390996933, -0.1037469208240509, -0.09963874518871307, -0.09553056210279465, -0.09142237901687622, -0.08731420338153839, -0.08320602029561996, -0.07909783720970154, -0.07498965412378311, -0.07088147103786469, -0.06677329540252686, -0.06266511231660843, -0.05855692923069, -0.054448749870061874, -0.050340570509433746, -0.04623238742351532, -0.04212420433759689, -0.038016024976968765, -0.03390784561634064, -0.02979966253042221, -0.025691481307148933, -0.021583300083875656, -0.01747511886060238, -0.013366937637329102, -0.009258756414055824, -0.005150575190782547, -0.0010423939675092697, 0.0030657872557640076, 0.007173968479037285, 0.011282149702310562, 0.01539033092558384, 0.019498512148857117, 0.023606693372130394, 0.02771487459540367, 0.0318230539560318, 0.035931237041950226, 0.04003942012786865, 0.04414759948849678, 0.04825577884912491, 0.052363961935043335, 0.05647214502096176, 0.06058032438158989, 0.06468850374221802, 0.06879668682813644, 0.07290486991405487, 0.0770130455493927, 0.08112122863531113, 0.08522941172122955, 0.08933759480714798, 0.0934457778930664, 0.09755395352840424, 0.10166213661432266, 0.10577031970024109, 0.10987849533557892, 0.11398667842149734, 0.11809486150741577]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 6.0, 5.0, 4.0, 11.0, 15.0, 19.0, 24.0, 133.0, 137.0, 30.0, 18.0, 16.0, 11.0, 12.0, 10.0, 10.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21974027156829834, -0.21256747841835022, -0.2053946852684021, -0.19822190701961517, -0.19104911386966705, -0.18387632071971893, -0.176703542470932, -0.1695307493209839, -0.16235795617103577, -0.15518516302108765, -0.14801236987113953, -0.1408395916223526, -0.13366679847240448, -0.12649400532245636, -0.11932121962308884, -0.11214843392372131, -0.1049756407737732, -0.09780284762382507, -0.09063006192445755, -0.08345727622509003, -0.0762844830751419, -0.06911168992519379, -0.06193890422582626, -0.05476611480116844, -0.04759332537651062, -0.0404205359518528, -0.03324774652719498, -0.026074957102537155, -0.018902167677879333, -0.011729378253221512, -0.00455658882856369, 0.0026162005960941315, 0.009788990020751953, 0.016961779445409775, 0.024134568870067596, 0.03130735829472542, 0.03848014771938324, 0.04565293714404106, 0.05282572656869888, 0.059998515993356705, 0.06717130541801453, 0.07434409856796265, 0.08151688426733017, 0.08868966996669769, 0.09586246311664581, 0.10303525626659393, 0.11020804196596146, 0.11738082766532898, 0.1245536208152771, 0.13172641396522522, 0.13889920711517334, 0.14607198536396027, 0.1532447785139084, 0.1604175716638565, 0.16759034991264343, 0.17476314306259155, 0.18193593621253967, 0.1891087293624878, 0.1962815225124359, 0.20345430076122284, 0.21062709391117096, 0.21779988706111908, 0.224972665309906, 0.23214545845985413, 0.23931825160980225]}, "eval/loss": 4.375434398651123, "eval/bleu": 0.0, "eval/runtime": 2564.062, "eval/samples_per_second": 5.756, "eval/steps_per_second": 0.72} \ No newline at end of file