diff --git "a/wandb/run-20220503_171959-a6039xud/files/wandb-summary.json" "b/wandb/run-20220503_171959-a6039xud/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220503_171959-a6039xud/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 5.0306, "train/learning_rate": 0.00047705196375492806, "train/epoch": 0.08, "train/global_step": 500, "_runtime": 5323, "_timestamp": 1651603723, "_step": 500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 10.0, 57.0, 318.0, 524.0, 86.0, 17.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.751711368560791, -2.6421878337860107, -2.5326640605926514, -2.423140525817871, -2.313616991043091, -2.2040932178497314, -2.094569683074951, -1.9850460290908813, -1.8755223751068115, -1.7659987211227417, -1.6564751863479614, -1.5469515323638916, -1.4374278783798218, -1.327904224395752, -1.2183806896209717, -1.1088570356369019, -0.9993335008621216, -0.8898099064826965, -0.7802862524986267, -0.6707626581192017, -0.5612390041351318, -0.4517154097557068, -0.34219181537628174, -0.23266816139221191, -0.12314456701278687, -0.013620950281620026, 0.09590266644954681, 0.20542627573013306, 0.3149498999118805, 0.42447352409362793, 0.533997118473053, 0.6435207724571228, 0.7530443668365479, 0.8625679612159729, 0.9720916152000427, 1.0816152095794678, 1.1911388635635376, 1.3006625175476074, 1.4101860523223877, 1.5197097063064575, 1.6292333602905273, 1.7387570142745972, 1.8482805490493774, 1.9578042030334473, 2.0673277378082275, 2.176851511001587, 2.286375045776367, 2.3958988189697266, 2.5054221153259277, 2.614945650100708, 2.7244694232940674, 2.8339929580688477, 2.943516492843628, 3.0530402660369873, 3.1625638008117676, 3.272087574005127, 3.3816111087799072, 3.4911346435546875, 3.600658416748047, 3.710181951522827, 3.8197054862976074, 3.929229259490967, 4.038752555847168, 4.148276329040527, 4.257800102233887]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 10.0, 3.0, 11.0, 12.0, 15.0, 12.0, 19.0, 26.0, 32.0, 45.0, 30.0, 38.0, 26.0, 39.0, 38.0, 39.0, 41.0, 57.0, 37.0, 45.0, 31.0, 55.0, 35.0, 55.0, 39.0, 30.0, 24.0, 36.0, 13.0, 19.0, 23.0, 14.0, 19.0, 9.0, 6.0, 7.0, 6.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3896210193634033, -1.3365920782089233, -1.283563256263733, -1.230534315109253, -1.1775054931640625, -1.1244765520095825, -1.0714476108551025, -1.018418788909912, -0.9653898477554321, -0.9123609662055969, -0.8593320846557617, -0.8063031435012817, -0.7532742619514465, -0.7002453804016113, -0.6472164392471313, -0.5941875576972961, -0.5411586761474609, -0.48812979459762573, -0.43510088324546814, -0.38207197189331055, -0.32904309034347534, -0.27601420879364014, -0.22298529744148254, -0.16995638608932495, -0.11692750453948975, -0.06389860808849335, -0.010869711637496948, 0.04215918481349945, 0.09518808126449585, 0.14821696281433105, 0.20124587416648865, 0.25427478551864624, 0.30730366706848145, 0.36033254861831665, 0.41336145997047424, 0.46639037132263184, 0.519419252872467, 0.5724481344223022, 0.6254770755767822, 0.6785059571266174, 0.7315348386764526, 0.7845637202262878, 0.837592601776123, 0.890621542930603, 0.9436504244804382, 0.9966793060302734, 1.0497082471847534, 1.1027371883392334, 1.1557660102844238, 1.2087949514389038, 1.2618237733840942, 1.3148527145385742, 1.3678815364837646, 1.4209104776382446, 1.4739394187927246, 1.526968240737915, 1.579997181892395, 1.633026123046875, 1.6860549449920654, 1.7390838861465454, 1.7921128273010254, 1.8451416492462158, 1.8981705904006958, 1.9511995315551758, 2.004228353500366]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 7.0, 8.0, 20.0, 25.0, 24.0, 28.0, 43.0, 78.0, 133.0, 422.0, 2598.0, 123452.0, 4051252.0, 14772.0, 859.0, 215.0, 106.0, 57.0, 51.0, 29.0, 28.0, 25.0, 21.0, 8.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.58984375, -3.42138671875, -3.2529296875, -3.08447265625, -2.916015625, -2.74755859375, -2.5791015625, -2.41064453125, -2.2421875, -2.07373046875, -1.9052734375, -1.73681640625, -1.568359375, -1.39990234375, -1.2314453125, -1.06298828125, -0.89453125, -0.72607421875, -0.5576171875, -0.38916015625, -0.220703125, -0.05224609375, 0.1162109375, 0.28466796875, 0.453125, 0.62158203125, 0.7900390625, 0.95849609375, 1.126953125, 1.29541015625, 1.4638671875, 1.63232421875, 1.80078125, 1.96923828125, 2.1376953125, 2.30615234375, 2.474609375, 2.64306640625, 2.8115234375, 2.97998046875, 3.1484375, 3.31689453125, 3.4853515625, 3.65380859375, 3.822265625, 3.99072265625, 4.1591796875, 4.32763671875, 4.49609375, 4.66455078125, 4.8330078125, 5.00146484375, 5.169921875, 5.33837890625, 5.5068359375, 5.67529296875, 5.84375, 6.01220703125, 6.1806640625, 6.34912109375, 6.517578125, 6.68603515625, 6.8544921875, 7.02294921875, 7.19140625]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 6.0, 7.0, 9.0, 14.0, 18.0, 20.0, 29.0, 29.0, 29.0, 27.0, 43.0, 39.0, 44.0, 38.0, 59.0, 56.0, 43.0, 54.0, 35.0, 56.0, 38.0, 48.0, 41.0, 29.0, 40.0, 25.0, 22.0, 21.0, 17.0, 19.0, 15.0, 4.0, 8.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0439453125, -1.0031890869140625, -0.962432861328125, -0.9216766357421875, -0.88092041015625, -0.8401641845703125, -0.799407958984375, -0.7586517333984375, -0.7178955078125, -0.6771392822265625, -0.636383056640625, -0.5956268310546875, -0.55487060546875, -0.5141143798828125, -0.473358154296875, -0.4326019287109375, -0.391845703125, -0.3510894775390625, -0.310333251953125, -0.2695770263671875, -0.22882080078125, -0.1880645751953125, -0.147308349609375, -0.1065521240234375, -0.0657958984375, -0.0250396728515625, 0.015716552734375, 0.0564727783203125, 0.09722900390625, 0.1379852294921875, 0.178741455078125, 0.2194976806640625, 0.26025390625, 0.3010101318359375, 0.341766357421875, 0.3825225830078125, 0.42327880859375, 0.4640350341796875, 0.504791259765625, 0.5455474853515625, 0.5863037109375, 0.6270599365234375, 0.667816162109375, 0.7085723876953125, 0.74932861328125, 0.7900848388671875, 0.830841064453125, 0.8715972900390625, 0.912353515625, 0.9531097412109375, 0.993865966796875, 1.0346221923828125, 1.07537841796875, 1.1161346435546875, 1.156890869140625, 1.1976470947265625, 1.2384033203125, 1.2791595458984375, 1.319915771484375, 1.3606719970703125, 1.40142822265625, 1.4421844482421875, 1.482940673828125, 1.5236968994140625, 1.564453125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 13.0, 17.0, 62.0, 4193207.0, 936.0, 37.0, 14.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-213.125, -207.177734375, -201.23046875, -195.283203125, -189.3359375, -183.388671875, -177.44140625, -171.494140625, -165.546875, -159.599609375, -153.65234375, -147.705078125, -141.7578125, -135.810546875, -129.86328125, -123.916015625, -117.96875, -112.021484375, -106.07421875, -100.126953125, -94.1796875, -88.232421875, -82.28515625, -76.337890625, -70.390625, -64.443359375, -58.49609375, -52.548828125, -46.6015625, -40.654296875, -34.70703125, -28.759765625, -22.8125, -16.865234375, -10.91796875, -4.970703125, 0.9765625, 6.923828125, 12.87109375, 18.818359375, 24.765625, 30.712890625, 36.66015625, 42.607421875, 48.5546875, 54.501953125, 60.44921875, 66.396484375, 72.34375, 78.291015625, 84.23828125, 90.185546875, 96.1328125, 102.080078125, 108.02734375, 113.974609375, 119.921875, 125.869140625, 131.81640625, 137.763671875, 143.7109375, 149.658203125, 155.60546875, 161.552734375, 167.5]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 15.0, 53.0, 3246.0, 718.0, 35.0, 12.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.662109375, -3.55084228515625, -3.4395751953125, -3.32830810546875, -3.217041015625, -3.10577392578125, -2.9945068359375, -2.88323974609375, -2.77197265625, -2.66070556640625, -2.5494384765625, -2.43817138671875, -2.326904296875, -2.21563720703125, -2.1043701171875, -1.99310302734375, -1.8818359375, -1.77056884765625, -1.6593017578125, -1.54803466796875, -1.436767578125, -1.32550048828125, -1.2142333984375, -1.10296630859375, -0.99169921875, -0.88043212890625, -0.7691650390625, -0.65789794921875, -0.546630859375, -0.43536376953125, -0.3240966796875, -0.21282958984375, -0.1015625, 0.00970458984375, 0.1209716796875, 0.23223876953125, 0.343505859375, 0.45477294921875, 0.5660400390625, 0.67730712890625, 0.78857421875, 0.89984130859375, 1.0111083984375, 1.12237548828125, 1.233642578125, 1.34490966796875, 1.4561767578125, 1.56744384765625, 1.6787109375, 1.78997802734375, 1.9012451171875, 2.01251220703125, 2.123779296875, 2.23504638671875, 2.3463134765625, 2.45758056640625, 2.56884765625, 2.68011474609375, 2.7913818359375, 2.90264892578125, 3.013916015625, 3.12518310546875, 3.2364501953125, 3.34771728515625, 3.458984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 7.0, 7.0, 11.0, 33.0, 46.0, 65.0, 114.0, 175.0, 209.0, 125.0, 71.0, 47.0, 33.0, 26.0, 12.0, 10.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3749637603759766, -1.2905852794647217, -1.2062067985534668, -1.121828317642212, -1.0374499559402466, -0.9530714750289917, -0.8686929941177368, -0.7843145728111267, -0.6999360918998718, -0.6155576109886169, -0.5311791896820068, -0.44680070877075195, -0.36242225766181946, -0.27804380655288696, -0.19366532564163208, -0.10928690433502197, -0.02490842342376709, 0.059470035135746, 0.1438484936952591, 0.22822695970535278, 0.3126054108142853, 0.3969838619232178, 0.48136234283447266, 0.5657407641410828, 0.6501192450523376, 0.7344977259635925, 0.8188761472702026, 0.9032546281814575, 0.9876331090927124, 1.0720114707946777, 1.1563899517059326, 1.2407684326171875, 1.3251469135284424, 1.4095253944396973, 1.4939038753509521, 1.578282356262207, 1.6626607179641724, 1.7470391988754272, 1.8314176797866821, 1.9157960414886475, 2.0001745223999023, 2.0845530033111572, 2.168931484222412, 2.253309965133667, 2.337688446044922, 2.4220666885375977, 2.5064454078674316, 2.5908236503601074, 2.6752023696899414, 2.7595808506011963, 2.843959331512451, 2.928337812423706, 3.012716293334961, 3.0970945358276367, 3.1814732551574707, 3.2658514976501465, 3.3502299785614014, 3.4346084594726562, 3.518986940383911, 3.603365421295166, 3.687743902206421, 3.772122383117676, 3.8565006256103516, 3.9408791065216064, 4.025257587432861]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 5.0, 8.0, 11.0, 13.0, 19.0, 16.0, 26.0, 34.0, 48.0, 37.0, 46.0, 45.0, 46.0, 49.0, 72.0, 60.0, 60.0, 52.0, 56.0, 48.0, 44.0, 43.0, 30.0, 29.0, 25.0, 20.0, 16.0, 15.0, 8.0, 7.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.079002857208252, -2.997662305831909, -2.9163217544555664, -2.8349812030792236, -2.753640651702881, -2.672300100326538, -2.5909595489501953, -2.5096192359924316, -2.4282784461975098, -2.346937894821167, -2.265597343444824, -2.1842567920684814, -2.1029162406921387, -2.021575689315796, -1.9402352571487427, -1.8588947057724, -1.7775542736053467, -1.696213722229004, -1.6148731708526611, -1.5335326194763184, -1.4521920680999756, -1.3708515167236328, -1.2895110845565796, -1.2081705331802368, -1.126829981803894, -1.0454894304275513, -0.9641488790512085, -0.8828083872795105, -0.8014678359031677, -0.720127284526825, -0.638786792755127, -0.5574462413787842, -0.4761059284210205, -0.39476537704467773, -0.31342485547065735, -0.23208431899547577, -0.1507437825202942, -0.06940323114395142, 0.01193729043006897, 0.09327781200408936, 0.17461836338043213, 0.2559589147567749, 0.3372994363307953, 0.4186399579048157, 0.49998050928115845, 0.5813210606575012, 0.6626615524291992, 0.744002103805542, 0.8253426551818848, 0.9066832065582275, 0.9880237579345703, 1.069364309310913, 1.1507048606872559, 1.2320454120635986, 1.3133858442306519, 1.3947263956069946, 1.4760669469833374, 1.5574074983596802, 1.638748049736023, 1.7200886011123657, 1.801429033279419, 1.8827695846557617, 1.9641101360321045, 2.0454506874084473, 2.12679123878479]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 9.0, 12.0, 18.0, 24.0, 36.0, 48.0, 88.0, 118.0, 177.0, 312.0, 487.0, 851.0, 1485.0, 3025.0, 6415.0, 15064.0, 39468.0, 126314.0, 543220.0, 214958.0, 58268.0, 21139.0, 8561.0, 3899.0, 2020.0, 997.0, 591.0, 314.0, 208.0, 133.0, 108.0, 53.0, 45.0, 24.0, 13.0, 14.0, 10.0, 6.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.453125, -0.43785858154296875, -0.4225921630859375, -0.40732574462890625, -0.392059326171875, -0.37679290771484375, -0.3615264892578125, -0.34626007080078125, -0.33099365234375, -0.31572723388671875, -0.3004608154296875, -0.28519439697265625, -0.269927978515625, -0.25466156005859375, -0.2393951416015625, -0.22412872314453125, -0.2088623046875, -0.19359588623046875, -0.1783294677734375, -0.16306304931640625, -0.147796630859375, -0.13253021240234375, -0.1172637939453125, -0.10199737548828125, -0.08673095703125, -0.07146453857421875, -0.0561981201171875, -0.04093170166015625, -0.025665283203125, -0.01039886474609375, 0.0048675537109375, 0.02013397216796875, 0.035400390625, 0.05066680908203125, 0.0659332275390625, 0.08119964599609375, 0.096466064453125, 0.11173248291015625, 0.1269989013671875, 0.14226531982421875, 0.15753173828125, 0.17279815673828125, 0.1880645751953125, 0.20333099365234375, 0.218597412109375, 0.23386383056640625, 0.2491302490234375, 0.26439666748046875, 0.2796630859375, 0.29492950439453125, 0.3101959228515625, 0.32546234130859375, 0.340728759765625, 0.35599517822265625, 0.3712615966796875, 0.38652801513671875, 0.40179443359375, 0.41706085205078125, 0.4323272705078125, 0.44759368896484375, 0.462860107421875, 0.47812652587890625, 0.4933929443359375, 0.5086593627929688, 0.52392578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 6.0, 10.0, 8.0, 12.0, 9.0, 15.0, 17.0, 24.0, 40.0, 43.0, 39.0, 41.0, 45.0, 55.0, 52.0, 50.0, 61.0, 52.0, 54.0, 60.0, 45.0, 40.0, 43.0, 27.0, 36.0, 25.0, 17.0, 17.0, 16.0, 11.0, 7.0, 7.0, 5.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.748046875, -1.6971282958984375, -1.646209716796875, -1.5952911376953125, -1.54437255859375, -1.4934539794921875, -1.442535400390625, -1.3916168212890625, -1.3406982421875, -1.2897796630859375, -1.238861083984375, -1.1879425048828125, -1.13702392578125, -1.0861053466796875, -1.035186767578125, -0.9842681884765625, -0.933349609375, -0.8824310302734375, -0.831512451171875, -0.7805938720703125, -0.72967529296875, -0.6787567138671875, -0.627838134765625, -0.5769195556640625, -0.5260009765625, -0.4750823974609375, -0.424163818359375, -0.3732452392578125, -0.32232666015625, -0.2714080810546875, -0.220489501953125, -0.1695709228515625, -0.11865234375, -0.0677337646484375, -0.016815185546875, 0.0341033935546875, 0.08502197265625, 0.1359405517578125, 0.186859130859375, 0.2377777099609375, 0.2886962890625, 0.3396148681640625, 0.390533447265625, 0.4414520263671875, 0.49237060546875, 0.5432891845703125, 0.594207763671875, 0.6451263427734375, 0.696044921875, 0.7469635009765625, 0.797882080078125, 0.8488006591796875, 0.89971923828125, 0.9506378173828125, 1.001556396484375, 1.0524749755859375, 1.1033935546875, 1.1543121337890625, 1.205230712890625, 1.2561492919921875, 1.30706787109375, 1.3579864501953125, 1.408905029296875, 1.4598236083984375, 1.5107421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 6.0, 9.0, 15.0, 21.0, 29.0, 44.0, 68.0, 69.0, 124.0, 195.0, 299.0, 419.0, 651.0, 1008.0, 1642.0, 2734.0, 4441.0, 7450.0, 12968.0, 22901.0, 42106.0, 78167.0, 170093.0, 345016.0, 178181.0, 80794.0, 42470.0, 23759.0, 13401.0, 7779.0, 4500.0, 2760.0, 1657.0, 1053.0, 598.0, 391.0, 247.0, 151.0, 108.0, 73.0, 45.0, 33.0, 26.0, 17.0, 14.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.12890625, -0.12517261505126953, -0.12143898010253906, -0.1177053451538086, -0.11397171020507812, -0.11023807525634766, -0.10650444030761719, -0.10277080535888672, -0.09903717041015625, -0.09530353546142578, -0.09156990051269531, -0.08783626556396484, -0.08410263061523438, -0.0803689956665039, -0.07663536071777344, -0.07290172576904297, -0.0691680908203125, -0.06543445587158203, -0.06170082092285156, -0.057967185974121094, -0.054233551025390625, -0.050499916076660156, -0.04676628112792969, -0.04303264617919922, -0.03929901123046875, -0.03556537628173828, -0.03183174133300781, -0.028098106384277344, -0.024364471435546875, -0.020630836486816406, -0.016897201538085938, -0.013163566589355469, -0.009429931640625, -0.005696296691894531, -0.0019626617431640625, 0.0017709732055664062, 0.005504608154296875, 0.009238243103027344, 0.012971878051757812, 0.01670551300048828, 0.02043914794921875, 0.02417278289794922, 0.027906417846679688, 0.031640052795410156, 0.035373687744140625, 0.039107322692871094, 0.04284095764160156, 0.04657459259033203, 0.0503082275390625, 0.05404186248779297, 0.05777549743652344, 0.061509132385253906, 0.06524276733398438, 0.06897640228271484, 0.07271003723144531, 0.07644367218017578, 0.08017730712890625, 0.08391094207763672, 0.08764457702636719, 0.09137821197509766, 0.09511184692382812, 0.0988454818725586, 0.10257911682128906, 0.10631275177001953, 0.11004638671875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 3.0, 8.0, 6.0, 11.0, 10.0, 6.0, 18.0, 23.0, 18.0, 14.0, 29.0, 40.0, 39.0, 37.0, 23.0, 48.0, 60.0, 36.0, 53.0, 42.0, 56.0, 37.0, 43.0, 44.0, 31.0, 44.0, 29.0, 31.0, 33.0, 20.0, 27.0, 20.0, 14.0, 7.0, 10.0, 5.0, 9.0, 2.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.53515625, -2.465606689453125, -2.39605712890625, -2.326507568359375, -2.2569580078125, -2.187408447265625, -2.11785888671875, -2.048309326171875, -1.978759765625, -1.909210205078125, -1.83966064453125, -1.770111083984375, -1.7005615234375, -1.631011962890625, -1.56146240234375, -1.491912841796875, -1.42236328125, -1.352813720703125, -1.28326416015625, -1.213714599609375, -1.1441650390625, -1.074615478515625, -1.00506591796875, -0.935516357421875, -0.865966796875, -0.796417236328125, -0.72686767578125, -0.657318115234375, -0.5877685546875, -0.518218994140625, -0.44866943359375, -0.379119873046875, -0.3095703125, -0.240020751953125, -0.17047119140625, -0.100921630859375, -0.0313720703125, 0.038177490234375, 0.10772705078125, 0.177276611328125, 0.246826171875, 0.316375732421875, 0.38592529296875, 0.455474853515625, 0.5250244140625, 0.594573974609375, 0.66412353515625, 0.733673095703125, 0.80322265625, 0.872772216796875, 0.94232177734375, 1.011871337890625, 1.0814208984375, 1.150970458984375, 1.22052001953125, 1.290069580078125, 1.359619140625, 1.429168701171875, 1.49871826171875, 1.568267822265625, 1.6378173828125, 1.707366943359375, 1.77691650390625, 1.846466064453125, 1.916015625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 3.0, 10.0, 8.0, 6.0, 11.0, 22.0, 30.0, 57.0, 77.0, 155.0, 251.0, 515.0, 946.0, 2236.0, 5959.0, 24562.0, 178269.0, 743841.0, 70495.0, 13433.0, 4040.0, 1706.0, 860.0, 425.0, 248.0, 150.0, 85.0, 44.0, 38.0, 17.0, 13.0, 10.0, 2.0, 6.0, 3.0, 3.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0137939453125, -0.013391733169555664, -0.012989521026611328, -0.012587308883666992, -0.012185096740722656, -0.01178288459777832, -0.011380672454833984, -0.010978460311889648, -0.010576248168945312, -0.010174036026000977, -0.00977182388305664, -0.009369611740112305, -0.008967399597167969, -0.008565187454223633, -0.008162975311279297, -0.007760763168334961, -0.007358551025390625, -0.006956338882446289, -0.006554126739501953, -0.006151914596557617, -0.005749702453613281, -0.005347490310668945, -0.004945278167724609, -0.0045430660247802734, -0.0041408538818359375, -0.0037386417388916016, -0.0033364295959472656, -0.0029342174530029297, -0.0025320053100585938, -0.002129793167114258, -0.0017275810241699219, -0.001325368881225586, -0.00092315673828125, -0.0005209445953369141, -0.00011873245239257812, 0.0002834796905517578, 0.0006856918334960938, 0.0010879039764404297, 0.0014901161193847656, 0.0018923282623291016, 0.0022945404052734375, 0.0026967525482177734, 0.0030989646911621094, 0.0035011768341064453, 0.0039033889770507812, 0.004305601119995117, 0.004707813262939453, 0.005110025405883789, 0.005512237548828125, 0.005914449691772461, 0.006316661834716797, 0.006718873977661133, 0.007121086120605469, 0.007523298263549805, 0.00792551040649414, 0.008327722549438477, 0.008729934692382812, 0.009132146835327148, 0.009534358978271484, 0.00993657112121582, 0.010338783264160156, 0.010740995407104492, 0.011143207550048828, 0.011545419692993164, 0.0119476318359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 4.0, 9.0, 20.0, 15.0, 31.0, 56.0, 85.0, 146.0, 264.0, 156.0, 80.0, 27.0, 27.0, 16.0, 19.0, 10.0, 9.0, 4.0, 1.0, 9.0, 2.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.601478576660156e-05, -4.4821761548519135e-05, -4.3628737330436707e-05, -4.243571311235428e-05, -4.124268889427185e-05, -4.004966467618942e-05, -3.8856640458106995e-05, -3.766361624002457e-05, -3.647059202194214e-05, -3.527756780385971e-05, -3.408454358577728e-05, -3.2891519367694855e-05, -3.169849514961243e-05, -3.050547093153e-05, -2.931244671344757e-05, -2.8119422495365143e-05, -2.6926398277282715e-05, -2.5733374059200287e-05, -2.454034984111786e-05, -2.334732562303543e-05, -2.2154301404953003e-05, -2.0961277186870575e-05, -1.9768252968788147e-05, -1.857522875070572e-05, -1.738220453262329e-05, -1.6189180314540863e-05, -1.4996156096458435e-05, -1.3803131878376007e-05, -1.2610107660293579e-05, -1.1417083442211151e-05, -1.0224059224128723e-05, -9.031035006046295e-06, -7.838010787963867e-06, -6.644986569881439e-06, -5.451962351799011e-06, -4.258938133716583e-06, -3.0659139156341553e-06, -1.8728896975517273e-06, -6.798654794692993e-07, 5.131587386131287e-07, 1.7061829566955566e-06, 2.8992071747779846e-06, 4.092231392860413e-06, 5.2852556109428406e-06, 6.4782798290252686e-06, 7.671304047107697e-06, 8.864328265190125e-06, 1.0057352483272552e-05, 1.125037670135498e-05, 1.2443400919437408e-05, 1.3636425137519836e-05, 1.4829449355602264e-05, 1.6022473573684692e-05, 1.721549779176712e-05, 1.840852200984955e-05, 1.9601546227931976e-05, 2.0794570446014404e-05, 2.1987594664096832e-05, 2.318061888217926e-05, 2.4373643100261688e-05, 2.5566667318344116e-05, 2.6759691536426544e-05, 2.7952715754508972e-05, 2.91457399725914e-05, 3.0338764190673828e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 3.0, 0.0, 1.0, 3.0, 5.0, 7.0, 6.0, 9.0, 4.0, 15.0, 14.0, 25.0, 31.0, 34.0, 56.0, 78.0, 133.0, 295.0, 21390.0, 1024487.0, 1439.0, 168.0, 102.0, 64.0, 45.0, 30.0, 22.0, 20.0, 12.0, 6.0, 13.0, 8.0, 9.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06597900390625, -0.06355953216552734, -0.06114006042480469, -0.05872058868408203, -0.056301116943359375, -0.05388164520263672, -0.05146217346191406, -0.049042701721191406, -0.04662322998046875, -0.044203758239746094, -0.04178428649902344, -0.03936481475830078, -0.036945343017578125, -0.03452587127685547, -0.03210639953613281, -0.029686927795410156, -0.0272674560546875, -0.024847984313964844, -0.022428512573242188, -0.02000904083251953, -0.017589569091796875, -0.015170097351074219, -0.012750625610351562, -0.010331153869628906, -0.00791168212890625, -0.005492210388183594, -0.0030727386474609375, -0.0006532669067382812, 0.001766204833984375, 0.004185676574707031, 0.0066051483154296875, 0.009024620056152344, 0.011444091796875, 0.013863563537597656, 0.016283035278320312, 0.01870250701904297, 0.021121978759765625, 0.02354145050048828, 0.025960922241210938, 0.028380393981933594, 0.03079986572265625, 0.033219337463378906, 0.03563880920410156, 0.03805828094482422, 0.040477752685546875, 0.04289722442626953, 0.04531669616699219, 0.047736167907714844, 0.0501556396484375, 0.052575111389160156, 0.05499458312988281, 0.05741405487060547, 0.059833526611328125, 0.06225299835205078, 0.06467247009277344, 0.0670919418334961, 0.06951141357421875, 0.0719308853149414, 0.07435035705566406, 0.07676982879638672, 0.07918930053710938, 0.08160877227783203, 0.08402824401855469, 0.08644771575927734, 0.0888671875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 5.0, 8.0, 11.0, 7.0, 8.0, 14.0, 16.0, 24.0, 28.0, 24.0, 42.0, 57.0, 80.0, 70.0, 85.0, 81.0, 82.0, 80.0, 54.0, 52.0, 23.0, 19.0, 22.0, 22.0, 16.0, 6.0, 9.0, 7.0, 7.0, 5.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0029697418212890625, -0.0028603971004486084, -0.0027510523796081543, -0.0026417076587677, -0.002532362937927246, -0.002423018217086792, -0.002313673496246338, -0.002204328775405884, -0.0020949840545654297, -0.0019856393337249756, -0.0018762946128845215, -0.0017669498920440674, -0.0016576051712036133, -0.0015482604503631592, -0.001438915729522705, -0.001329571008682251, -0.0012202262878417969, -0.0011108815670013428, -0.0010015368461608887, -0.0008921921253204346, -0.0007828474044799805, -0.0006735026836395264, -0.0005641579627990723, -0.00045481324195861816, -0.00034546852111816406, -0.00023612380027770996, -0.00012677907943725586, -1.7434358596801758e-05, 9.191036224365234e-05, 0.00020125508308410645, 0.00031059980392456055, 0.00041994452476501465, 0.0005292892456054688, 0.0006386339664459229, 0.000747978687286377, 0.0008573234081268311, 0.0009666681289672852, 0.0010760128498077393, 0.0011853575706481934, 0.0012947022914886475, 0.0014040470123291016, 0.0015133917331695557, 0.0016227364540100098, 0.0017320811748504639, 0.001841425895690918, 0.001950770616531372, 0.002060115337371826, 0.0021694600582122803, 0.0022788047790527344, 0.0023881494998931885, 0.0024974942207336426, 0.0026068389415740967, 0.0027161836624145508, 0.002825528383255005, 0.002934873104095459, 0.003044217824935913, 0.003153562545776367, 0.0032629072666168213, 0.0033722519874572754, 0.0034815967082977295, 0.0035909414291381836, 0.0037002861499786377, 0.003809630870819092, 0.003918975591659546, 0.0040283203125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 7.0, 19.0, 31.0, 69.0, 146.0, 250.0, 252.0, 109.0, 58.0, 29.0, 11.0, 8.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.800173044204712, -1.714323878288269, -1.6284747123718262, -1.5426255464553833, -1.4567763805389404, -1.3709272146224976, -1.2850780487060547, -1.1992288827896118, -1.113379716873169, -1.027530550956726, -0.9416813850402832, -0.8558322191238403, -0.7699830532073975, -0.6841338872909546, -0.5982847213745117, -0.5124355554580688, -0.426586389541626, -0.3407372236251831, -0.25488805770874023, -0.16903889179229736, -0.08318972587585449, 0.002659440040588379, 0.08850860595703125, 0.17435777187347412, 0.260206937789917, 0.34605610370635986, 0.43190526962280273, 0.5177544355392456, 0.6036036014556885, 0.6894527673721313, 0.7753019332885742, 0.8611510992050171, 0.9470000267028809, 1.0328491926193237, 1.1186983585357666, 1.2045475244522095, 1.2903966903686523, 1.3762458562850952, 1.462095022201538, 1.547944188117981, 1.6337933540344238, 1.7196425199508667, 1.8054916858673096, 1.8913408517837524, 1.9771900177001953, 2.0630393028259277, 2.148888349533081, 2.2347373962402344, 2.320586681365967, 2.406435966491699, 2.4922850131988525, 2.578134059906006, 2.6639833450317383, 2.7498326301574707, 2.835681676864624, 2.9215307235717773, 3.0073800086975098, 3.093229293823242, 3.1790783405303955, 3.264927387237549, 3.3507766723632812, 3.4366259574890137, 3.522475004196167, 3.6083240509033203, 3.6941733360290527]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 5.0, 8.0, 11.0, 11.0, 13.0, 15.0, 23.0, 21.0, 38.0, 35.0, 38.0, 42.0, 53.0, 34.0, 53.0, 61.0, 58.0, 55.0, 50.0, 47.0, 41.0, 43.0, 45.0, 33.0, 29.0, 31.0, 15.0, 17.0, 15.0, 14.0, 13.0, 7.0, 5.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5968492031097412, -1.5504605770111084, -1.5040719509124756, -1.4576833248138428, -1.41129469871521, -1.3649060726165771, -1.3185174465179443, -1.2721288204193115, -1.2257401943206787, -1.179351568222046, -1.132962942123413, -1.0865743160247803, -1.0401856899261475, -0.9937970638275146, -0.9474084377288818, -0.901019811630249, -0.854631245136261, -0.8082426190376282, -0.7618539929389954, -0.7154653668403625, -0.6690767407417297, -0.6226881146430969, -0.5762995481491089, -0.5299109220504761, -0.4835222661495209, -0.43713364005088806, -0.39074501395225525, -0.3443564176559448, -0.297967791557312, -0.2515791654586792, -0.2051905393600464, -0.15880191326141357, -0.11241328716278076, -0.06602466106414795, -0.019636042416095734, 0.026752576231956482, 0.0731412023305893, 0.1195298284292221, 0.16591843962669373, 0.21230706572532654, 0.25869569182395935, 0.30508431792259216, 0.351472944021225, 0.3978615403175354, 0.4442501664161682, 0.490638792514801, 0.5370274186134338, 0.5834160447120667, 0.6298046708106995, 0.6761932969093323, 0.7225819230079651, 0.7689705491065979, 0.8153591752052307, 0.8617478013038635, 0.9081363677978516, 0.9545249938964844, 1.0009136199951172, 1.04730224609375, 1.0936908721923828, 1.1400794982910156, 1.1864681243896484, 1.2328567504882812, 1.279245376586914, 1.3256340026855469, 1.3720226287841797]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 0.0, 4.0, 6.0, 11.0, 7.0, 13.0, 17.0, 26.0, 40.0, 46.0, 65.0, 93.0, 138.0, 225.0, 346.0, 504.0, 842.0, 1332.0, 2273.0, 3921.0, 7421.0, 15008.0, 35243.0, 103236.0, 439461.0, 304714.0, 77660.0, 28429.0, 12370.0, 6301.0, 3486.0, 1968.0, 1202.0, 772.0, 456.0, 293.0, 188.0, 121.0, 94.0, 66.0, 45.0, 27.0, 26.0, 15.0, 14.0, 11.0, 4.0, 11.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.4794921875, -1.43157958984375, -1.3836669921875, -1.33575439453125, -1.287841796875, -1.23992919921875, -1.1920166015625, -1.14410400390625, -1.09619140625, -1.04827880859375, -1.0003662109375, -0.95245361328125, -0.904541015625, -0.85662841796875, -0.8087158203125, -0.76080322265625, -0.712890625, -0.66497802734375, -0.6170654296875, -0.56915283203125, -0.521240234375, -0.47332763671875, -0.4254150390625, -0.37750244140625, -0.32958984375, -0.28167724609375, -0.2337646484375, -0.18585205078125, -0.137939453125, -0.09002685546875, -0.0421142578125, 0.00579833984375, 0.0537109375, 0.10162353515625, 0.1495361328125, 0.19744873046875, 0.245361328125, 0.29327392578125, 0.3411865234375, 0.38909912109375, 0.43701171875, 0.48492431640625, 0.5328369140625, 0.58074951171875, 0.628662109375, 0.67657470703125, 0.7244873046875, 0.77239990234375, 0.8203125, 0.86822509765625, 0.9161376953125, 0.96405029296875, 1.011962890625, 1.05987548828125, 1.1077880859375, 1.15570068359375, 1.20361328125, 1.25152587890625, 1.2994384765625, 1.34735107421875, 1.395263671875, 1.44317626953125, 1.4910888671875, 1.53900146484375, 1.5869140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 6.0, 4.0, 4.0, 14.0, 10.0, 12.0, 16.0, 11.0, 20.0, 23.0, 29.0, 26.0, 35.0, 33.0, 44.0, 41.0, 56.0, 53.0, 54.0, 46.0, 44.0, 39.0, 53.0, 50.0, 22.0, 39.0, 31.0, 32.0, 26.0, 28.0, 19.0, 12.0, 19.0, 11.0, 8.0, 5.0, 7.0, 5.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.859375, -9.5712890625, -9.283203125, -8.9951171875, -8.70703125, -8.4189453125, -8.130859375, -7.8427734375, -7.5546875, -7.2666015625, -6.978515625, -6.6904296875, -6.40234375, -6.1142578125, -5.826171875, -5.5380859375, -5.25, -4.9619140625, -4.673828125, -4.3857421875, -4.09765625, -3.8095703125, -3.521484375, -3.2333984375, -2.9453125, -2.6572265625, -2.369140625, -2.0810546875, -1.79296875, -1.5048828125, -1.216796875, -0.9287109375, -0.640625, -0.3525390625, -0.064453125, 0.2236328125, 0.51171875, 0.7998046875, 1.087890625, 1.3759765625, 1.6640625, 1.9521484375, 2.240234375, 2.5283203125, 2.81640625, 3.1044921875, 3.392578125, 3.6806640625, 3.96875, 4.2568359375, 4.544921875, 4.8330078125, 5.12109375, 5.4091796875, 5.697265625, 5.9853515625, 6.2734375, 6.5615234375, 6.849609375, 7.1376953125, 7.42578125, 7.7138671875, 8.001953125, 8.2900390625, 8.578125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 8.0, 4.0, 13.0, 9.0, 13.0, 12.0, 28.0, 14.0, 29.0, 43.0, 44.0, 55.0, 81.0, 138.0, 194.0, 361.0, 621.0, 14672.0, 1028466.0, 2302.0, 498.0, 286.0, 198.0, 117.0, 66.0, 55.0, 41.0, 33.0, 31.0, 24.0, 13.0, 17.0, 14.0, 8.0, 8.0, 10.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.5078125, -11.1822509765625, -10.856689453125, -10.5311279296875, -10.20556640625, -9.8800048828125, -9.554443359375, -9.2288818359375, -8.9033203125, -8.5777587890625, -8.252197265625, -7.9266357421875, -7.60107421875, -7.2755126953125, -6.949951171875, -6.6243896484375, -6.298828125, -5.9732666015625, -5.647705078125, -5.3221435546875, -4.99658203125, -4.6710205078125, -4.345458984375, -4.0198974609375, -3.6943359375, -3.3687744140625, -3.043212890625, -2.7176513671875, -2.39208984375, -2.0665283203125, -1.740966796875, -1.4154052734375, -1.08984375, -0.7642822265625, -0.438720703125, -0.1131591796875, 0.21240234375, 0.5379638671875, 0.863525390625, 1.1890869140625, 1.5146484375, 1.8402099609375, 2.165771484375, 2.4913330078125, 2.81689453125, 3.1424560546875, 3.468017578125, 3.7935791015625, 4.119140625, 4.4447021484375, 4.770263671875, 5.0958251953125, 5.42138671875, 5.7469482421875, 6.072509765625, 6.3980712890625, 6.7236328125, 7.0491943359375, 7.374755859375, 7.7003173828125, 8.02587890625, 8.3514404296875, 8.677001953125, 9.0025634765625, 9.328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 8.0, 7.0, 9.0, 14.0, 12.0, 11.0, 10.0, 18.0, 21.0, 25.0, 31.0, 33.0, 32.0, 34.0, 59.0, 42.0, 45.0, 43.0, 37.0, 55.0, 60.0, 35.0, 45.0, 37.0, 28.0, 38.0, 28.0, 24.0, 22.0, 27.0, 21.0, 20.0, 14.0, 8.0, 16.0, 2.0, 8.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6953125, -9.4166259765625, -9.137939453125, -8.8592529296875, -8.58056640625, -8.3018798828125, -8.023193359375, -7.7445068359375, -7.4658203125, -7.1871337890625, -6.908447265625, -6.6297607421875, -6.35107421875, -6.0723876953125, -5.793701171875, -5.5150146484375, -5.236328125, -4.9576416015625, -4.678955078125, -4.4002685546875, -4.12158203125, -3.8428955078125, -3.564208984375, -3.2855224609375, -3.0068359375, -2.7281494140625, -2.449462890625, -2.1707763671875, -1.89208984375, -1.6134033203125, -1.334716796875, -1.0560302734375, -0.77734375, -0.4986572265625, -0.219970703125, 0.0587158203125, 0.33740234375, 0.6160888671875, 0.894775390625, 1.1734619140625, 1.4521484375, 1.7308349609375, 2.009521484375, 2.2882080078125, 2.56689453125, 2.8455810546875, 3.124267578125, 3.4029541015625, 3.681640625, 3.9603271484375, 4.239013671875, 4.5177001953125, 4.79638671875, 5.0750732421875, 5.353759765625, 5.6324462890625, 5.9111328125, 6.1898193359375, 6.468505859375, 6.7471923828125, 7.02587890625, 7.3045654296875, 7.583251953125, 7.8619384765625, 8.140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 18.0, 91.0, 1116.0, 1046239.0, 961.0, 84.0, 27.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-3.60546875, -3.529541015625, -3.45361328125, -3.377685546875, -3.3017578125, -3.225830078125, -3.14990234375, -3.073974609375, -2.998046875, -2.922119140625, -2.84619140625, -2.770263671875, -2.6943359375, -2.618408203125, -2.54248046875, -2.466552734375, -2.390625, -2.314697265625, -2.23876953125, -2.162841796875, -2.0869140625, -2.010986328125, -1.93505859375, -1.859130859375, -1.783203125, -1.707275390625, -1.63134765625, -1.555419921875, -1.4794921875, -1.403564453125, -1.32763671875, -1.251708984375, -1.17578125, -1.099853515625, -1.02392578125, -0.947998046875, -0.8720703125, -0.796142578125, -0.72021484375, -0.644287109375, -0.568359375, -0.492431640625, -0.41650390625, -0.340576171875, -0.2646484375, -0.188720703125, -0.11279296875, -0.036865234375, 0.0390625, 0.114990234375, 0.19091796875, 0.266845703125, 0.3427734375, 0.418701171875, 0.49462890625, 0.570556640625, 0.646484375, 0.722412109375, 0.79833984375, 0.874267578125, 0.9501953125, 1.026123046875, 1.10205078125, 1.177978515625, 1.25390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 5.0, 7.0, 11.0, 21.0, 44.0, 211.0, 480.0, 118.0, 43.0, 18.0, 6.0, 15.0, 10.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.59634780883789e-05, -9.308569133281708e-05, -9.020790457725525e-05, -8.733011782169342e-05, -8.445233106613159e-05, -8.157454431056976e-05, -7.869675755500793e-05, -7.58189707994461e-05, -7.294118404388428e-05, -7.006339728832245e-05, -6.718561053276062e-05, -6.430782377719879e-05, -6.143003702163696e-05, -5.8552250266075134e-05, -5.5674463510513306e-05, -5.279667675495148e-05, -4.991888999938965e-05, -4.704110324382782e-05, -4.416331648826599e-05, -4.128552973270416e-05, -3.8407742977142334e-05, -3.5529956221580505e-05, -3.265216946601868e-05, -2.9774382710456848e-05, -2.689659595489502e-05, -2.401880919933319e-05, -2.1141022443771362e-05, -1.8263235688209534e-05, -1.5385448932647705e-05, -1.2507662177085876e-05, -9.629875421524048e-06, -6.752088665962219e-06, -3.874301910400391e-06, -9.96515154838562e-07, 1.8812716007232666e-06, 4.759058356285095e-06, 7.636845111846924e-06, 1.0514631867408752e-05, 1.3392418622970581e-05, 1.627020537853241e-05, 1.9147992134094238e-05, 2.2025778889656067e-05, 2.4903565645217896e-05, 2.7781352400779724e-05, 3.065913915634155e-05, 3.353692591190338e-05, 3.641471266746521e-05, 3.929249942302704e-05, 4.217028617858887e-05, 4.5048072934150696e-05, 4.7925859689712524e-05, 5.080364644527435e-05, 5.368143320083618e-05, 5.655921995639801e-05, 5.943700671195984e-05, 6.231479346752167e-05, 6.51925802230835e-05, 6.807036697864532e-05, 7.094815373420715e-05, 7.382594048976898e-05, 7.670372724533081e-05, 7.958151400089264e-05, 8.245930075645447e-05, 8.53370875120163e-05, 8.821487426757812e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 7.0, 1.0, 2.0, 8.0, 8.0, 5.0, 31.0, 192.0, 6786.0, 1040186.0, 1154.0, 89.0, 26.0, 14.0, 9.0, 6.0, 8.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5576171875, -0.5434303283691406, -0.5292434692382812, -0.5150566101074219, -0.5008697509765625, -0.4866828918457031, -0.47249603271484375, -0.4583091735839844, -0.444122314453125, -0.4299354553222656, -0.41574859619140625, -0.4015617370605469, -0.3873748779296875, -0.3731880187988281, -0.35900115966796875, -0.3448143005371094, -0.33062744140625, -0.3164405822753906, -0.30225372314453125, -0.2880668640136719, -0.2738800048828125, -0.2596931457519531, -0.24550628662109375, -0.23131942749023438, -0.217132568359375, -0.20294570922851562, -0.18875885009765625, -0.17457199096679688, -0.1603851318359375, -0.14619827270507812, -0.13201141357421875, -0.11782455444335938, -0.1036376953125, -0.08945083618164062, -0.07526397705078125, -0.061077117919921875, -0.0468902587890625, -0.032703399658203125, -0.01851654052734375, -0.004329681396484375, 0.009857177734375, 0.024044036865234375, 0.03823089599609375, 0.052417755126953125, 0.0666046142578125, 0.08079147338867188, 0.09497833251953125, 0.10916519165039062, 0.12335205078125, 0.13753890991210938, 0.15172576904296875, 0.16591262817382812, 0.1800994873046875, 0.19428634643554688, 0.20847320556640625, 0.22266006469726562, 0.236846923828125, 0.2510337829589844, 0.26522064208984375, 0.2794075012207031, 0.2935943603515625, 0.3077812194824219, 0.32196807861328125, 0.3361549377441406, 0.350341796875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 6.0, 6.0, 14.0, 13.0, 9.0, 29.0, 45.0, 84.0, 228.0, 264.0, 120.0, 49.0, 28.0, 15.0, 11.0, 11.0, 12.0, 8.0, 5.0, 5.0, 6.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039337158203125, -0.03763628005981445, -0.035935401916503906, -0.03423452377319336, -0.03253364562988281, -0.030832767486572266, -0.02913188934326172, -0.027431011199951172, -0.025730133056640625, -0.024029254913330078, -0.02232837677001953, -0.020627498626708984, -0.018926620483398438, -0.01722574234008789, -0.015524864196777344, -0.013823986053466797, -0.01212310791015625, -0.010422229766845703, -0.008721351623535156, -0.007020473480224609, -0.0053195953369140625, -0.0036187171936035156, -0.0019178390502929688, -0.00021696090698242188, 0.001483917236328125, 0.003184795379638672, 0.004885673522949219, 0.006586551666259766, 0.008287429809570312, 0.00998830795288086, 0.011689186096191406, 0.013390064239501953, 0.0150909423828125, 0.016791820526123047, 0.018492698669433594, 0.02019357681274414, 0.021894454956054688, 0.023595333099365234, 0.02529621124267578, 0.026997089385986328, 0.028697967529296875, 0.030398845672607422, 0.03209972381591797, 0.033800601959228516, 0.03550148010253906, 0.03720235824584961, 0.038903236389160156, 0.0406041145324707, 0.04230499267578125, 0.0440058708190918, 0.045706748962402344, 0.04740762710571289, 0.04910850524902344, 0.050809383392333984, 0.05251026153564453, 0.05421113967895508, 0.055912017822265625, 0.05761289596557617, 0.05931377410888672, 0.061014652252197266, 0.06271553039550781, 0.06441640853881836, 0.0661172866821289, 0.06781816482543945, 0.06951904296875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 79.0, 807.0, 119.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9333388805389404, -2.4048168659210205, -1.876294732093811, -1.3477725982666016, -0.8192505836486816, -0.2907285690307617, 0.2377936840057373, 0.7663156986236572, 1.2948377132415771, 1.823359727859497, 2.351881980895996, 2.880403995513916, 3.408926010131836, 3.937448024749756, 4.465970039367676, 4.994492530822754, 5.523014068603516, 6.0515360832214355, 6.5800580978393555, 7.108580589294434, 7.637102127075195, 8.165624618530273, 8.694147109985352, 9.222668647766113, 9.751191139221191, 10.27971363067627, 10.808235168457031, 11.33675765991211, 11.865279197692871, 12.39380168914795, 12.922323226928711, 13.450845718383789, 13.979366302490234, 14.507888793945312, 15.036410331726074, 15.564932823181152, 16.093454360961914, 16.621976852416992, 17.15049934387207, 17.679019927978516, 18.207542419433594, 18.736064910888672, 19.26458740234375, 19.793107986450195, 20.321630477905273, 20.85015296936035, 21.37867546081543, 21.907196044921875, 22.435718536376953, 22.96424102783203, 23.49276351928711, 24.021284103393555, 24.549806594848633, 25.07832908630371, 25.60685157775879, 26.135372161865234, 26.663896560668945, 27.192419052124023, 27.7209415435791, 28.249462127685547, 28.777984619140625, 29.306507110595703, 29.83502960205078, 30.36355209350586, 30.892072677612305]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 4.0, 8.0, 5.0, 10.0, 10.0, 10.0, 14.0, 17.0, 17.0, 27.0, 23.0, 17.0, 21.0, 24.0, 32.0, 33.0, 28.0, 39.0, 43.0, 41.0, 38.0, 27.0, 39.0, 33.0, 37.0, 41.0, 32.0, 33.0, 35.0, 26.0, 38.0, 32.0, 19.0, 20.0, 16.0, 22.0, 20.0, 15.0, 16.0, 13.0, 6.0, 5.0, 5.0, 2.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.561980247497559, -12.118780136108398, -11.675579071044922, -11.232378959655762, -10.789178848266602, -10.345978736877441, -9.902778625488281, -9.459577560424805, -9.016377449035645, -8.573177337646484, -8.129976272583008, -7.686776161193848, -7.2435760498046875, -6.800375938415527, -6.357175350189209, -5.913974761962891, -5.4707746505737305, -5.02757453918457, -4.584373950958252, -4.141173362731934, -3.6979732513427734, -3.254772901535034, -2.811572551727295, -2.3683722019195557, -1.9251718521118164, -1.4819715023040771, -1.038771152496338, -0.5955708026885986, -0.15237045288085938, 0.2908298969268799, 0.7340302467346191, 1.1772305965423584, 1.6204309463500977, 2.063631296157837, 2.506831645965576, 2.9500319957733154, 3.3932323455810547, 3.836432695388794, 4.279633045196533, 4.722833633422852, 5.166033744812012, 5.609233856201172, 6.05243444442749, 6.495635032653809, 6.938835144042969, 7.382035255432129, 7.825235843658447, 8.268436431884766, 8.711636543273926, 9.154836654663086, 9.598037719726562, 10.041237831115723, 10.484437942504883, 10.927638053894043, 11.370838165283203, 11.81403923034668, 12.25723934173584, 12.700439453125, 13.143640518188477, 13.586840629577637, 14.030040740966797, 14.473240852355957, 14.916440963745117, 15.359642028808594, 15.802842140197754]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 7.0, 7.0, 6.0, 4.0, 15.0, 20.0, 17.0, 18.0, 24.0, 15.0, 24.0, 23.0, 33.0, 30.0, 50.0, 66.0, 156.0, 264.0, 586.0, 2448.0, 4185287.0, 3665.0, 698.0, 289.0, 135.0, 80.0, 60.0, 30.0, 37.0, 36.0, 19.0, 19.0, 18.0, 21.0, 15.0, 14.0, 5.0, 10.0, 7.0, 5.0, 4.0, 9.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6875, -8.4034423828125, -8.119384765625, -7.8353271484375, -7.55126953125, -7.2672119140625, -6.983154296875, -6.6990966796875, -6.4150390625, -6.1309814453125, -5.846923828125, -5.5628662109375, -5.27880859375, -4.9947509765625, -4.710693359375, -4.4266357421875, -4.142578125, -3.8585205078125, -3.574462890625, -3.2904052734375, -3.00634765625, -2.7222900390625, -2.438232421875, -2.1541748046875, -1.8701171875, -1.5860595703125, -1.302001953125, -1.0179443359375, -0.73388671875, -0.4498291015625, -0.165771484375, 0.1182861328125, 0.40234375, 0.6864013671875, 0.970458984375, 1.2545166015625, 1.53857421875, 1.8226318359375, 2.106689453125, 2.3907470703125, 2.6748046875, 2.9588623046875, 3.242919921875, 3.5269775390625, 3.81103515625, 4.0950927734375, 4.379150390625, 4.6632080078125, 4.947265625, 5.2313232421875, 5.515380859375, 5.7994384765625, 6.08349609375, 6.3675537109375, 6.651611328125, 6.9356689453125, 7.2197265625, 7.5037841796875, 7.787841796875, 8.0718994140625, 8.35595703125, 8.6400146484375, 8.924072265625, 9.2081298828125, 9.4921875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 5.0, 1.0, 6.0, 11.0, 17.0, 14.0, 14.0, 20.0, 18.0, 25.0, 21.0, 30.0, 34.0, 28.0, 31.0, 39.0, 42.0, 47.0, 54.0, 49.0, 42.0, 41.0, 45.0, 42.0, 41.0, 34.0, 39.0, 39.0, 27.0, 30.0, 17.0, 26.0, 20.0, 13.0, 10.0, 8.0, 10.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.62890625, -0.6104202270507812, -0.5919342041015625, -0.5734481811523438, -0.554962158203125, -0.5364761352539062, -0.5179901123046875, -0.49950408935546875, -0.48101806640625, -0.46253204345703125, -0.4440460205078125, -0.42555999755859375, -0.407073974609375, -0.38858795166015625, -0.3701019287109375, -0.35161590576171875, -0.3331298828125, -0.31464385986328125, -0.2961578369140625, -0.27767181396484375, -0.259185791015625, -0.24069976806640625, -0.2222137451171875, -0.20372772216796875, -0.18524169921875, -0.16675567626953125, -0.1482696533203125, -0.12978363037109375, -0.111297607421875, -0.09281158447265625, -0.0743255615234375, -0.05583953857421875, -0.037353515625, -0.01886749267578125, -0.0003814697265625, 0.01810455322265625, 0.036590576171875, 0.05507659912109375, 0.0735626220703125, 0.09204864501953125, 0.11053466796875, 0.12902069091796875, 0.1475067138671875, 0.16599273681640625, 0.184478759765625, 0.20296478271484375, 0.2214508056640625, 0.23993682861328125, 0.2584228515625, 0.27690887451171875, 0.2953948974609375, 0.31388092041015625, 0.332366943359375, 0.35085296630859375, 0.3693389892578125, 0.38782501220703125, 0.40631103515625, 0.42479705810546875, 0.4432830810546875, 0.46176910400390625, 0.480255126953125, 0.49874114990234375, 0.5172271728515625, 0.5357131958007812, 0.55419921875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 0.0, 4.0, 1.0, 7.0, 8.0, 21.0, 74.0, 329.0, 4191090.0, 2531.0, 141.0, 41.0, 14.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.9375, -26.24365234375, -25.5498046875, -24.85595703125, -24.162109375, -23.46826171875, -22.7744140625, -22.08056640625, -21.38671875, -20.69287109375, -19.9990234375, -19.30517578125, -18.611328125, -17.91748046875, -17.2236328125, -16.52978515625, -15.8359375, -15.14208984375, -14.4482421875, -13.75439453125, -13.060546875, -12.36669921875, -11.6728515625, -10.97900390625, -10.28515625, -9.59130859375, -8.8974609375, -8.20361328125, -7.509765625, -6.81591796875, -6.1220703125, -5.42822265625, -4.734375, -4.04052734375, -3.3466796875, -2.65283203125, -1.958984375, -1.26513671875, -0.5712890625, 0.12255859375, 0.81640625, 1.51025390625, 2.2041015625, 2.89794921875, 3.591796875, 4.28564453125, 4.9794921875, 5.67333984375, 6.3671875, 7.06103515625, 7.7548828125, 8.44873046875, 9.142578125, 9.83642578125, 10.5302734375, 11.22412109375, 11.91796875, 12.61181640625, 13.3056640625, 13.99951171875, 14.693359375, 15.38720703125, 16.0810546875, 16.77490234375, 17.46875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 6.0, 20.0, 34.0, 96.0, 262.0, 970.0, 1997.0, 465.0, 128.0, 36.0, 15.0, 9.0, 10.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27490234375, -0.26517486572265625, -0.2554473876953125, -0.24571990966796875, -0.235992431640625, -0.22626495361328125, -0.2165374755859375, -0.20680999755859375, -0.19708251953125, -0.18735504150390625, -0.1776275634765625, -0.16790008544921875, -0.158172607421875, -0.14844512939453125, -0.1387176513671875, -0.12899017333984375, -0.1192626953125, -0.10953521728515625, -0.0998077392578125, -0.09008026123046875, -0.080352783203125, -0.07062530517578125, -0.0608978271484375, -0.05117034912109375, -0.04144287109375, -0.03171539306640625, -0.0219879150390625, -0.01226043701171875, -0.002532958984375, 0.00719451904296875, 0.0169219970703125, 0.02664947509765625, 0.036376953125, 0.04610443115234375, 0.0558319091796875, 0.06555938720703125, 0.075286865234375, 0.08501434326171875, 0.0947418212890625, 0.10446929931640625, 0.11419677734375, 0.12392425537109375, 0.1336517333984375, 0.14337921142578125, 0.153106689453125, 0.16283416748046875, 0.1725616455078125, 0.18228912353515625, 0.1920166015625, 0.20174407958984375, 0.2114715576171875, 0.22119903564453125, 0.230926513671875, 0.24065399169921875, 0.2503814697265625, 0.26010894775390625, 0.26983642578125, 0.27956390380859375, 0.2892913818359375, 0.29901885986328125, 0.308746337890625, 0.31847381591796875, 0.3282012939453125, 0.33792877197265625, 0.34765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 13.0, 23.0, 41.0, 77.0, 139.0, 277.0, 205.0, 101.0, 44.0, 31.0, 20.0, 15.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6656585931777954, -0.6136078834533691, -0.5615571141242981, -0.5095064043998718, -0.45745566487312317, -0.4054049253463745, -0.35335421562194824, -0.3013034760951996, -0.24925273656845093, -0.19720199704170227, -0.1451512724161148, -0.09310054779052734, -0.041049808263778687, 0.01100093126296997, 0.06305164098739624, 0.1151023805141449, 0.16715312004089355, 0.2192038595676422, 0.27125459909439087, 0.32330530881881714, 0.3753560483455658, 0.42740678787231445, 0.4794574975967407, 0.531508207321167, 0.583558976650238, 0.6356096863746643, 0.6876604557037354, 0.7397111654281616, 0.7917618751525879, 0.8438126444816589, 0.8958633542060852, 0.9479141235351562, 0.9999649524688721, 1.0520156621932983, 1.1040663719177246, 1.1561172008514404, 1.2081679105758667, 1.260218620300293, 1.3122693300247192, 1.3643200397491455, 1.4163708686828613, 1.4684215784072876, 1.5204722881317139, 1.5725231170654297, 1.624573826789856, 1.6766245365142822, 1.7286752462387085, 1.7807259559631348, 1.832776665687561, 1.8848273754119873, 1.9368780851364136, 1.9889287948608398, 2.0409796237945557, 2.0930304527282715, 2.145081043243408, 2.197131872177124, 2.2491824626922607, 2.3012332916259766, 2.3532838821411133, 2.405334711074829, 2.457385301589966, 2.5094361305236816, 2.5614867210388184, 2.613537549972534, 2.66558837890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 6.0, 10.0, 3.0, 10.0, 13.0, 10.0, 13.0, 15.0, 20.0, 22.0, 17.0, 23.0, 29.0, 36.0, 35.0, 29.0, 36.0, 51.0, 40.0, 49.0, 44.0, 33.0, 38.0, 42.0, 34.0, 33.0, 35.0, 36.0, 46.0, 22.0, 27.0, 21.0, 24.0, 25.0, 18.0, 13.0, 12.0, 8.0, 7.0, 10.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6245119571685791, -0.6054648756980896, -0.5864178538322449, -0.5673707723617554, -0.5483236908912659, -0.5292766094207764, -0.5102295875549316, -0.49118250608444214, -0.472135454416275, -0.4530884027481079, -0.4340413212776184, -0.4149942696094513, -0.3959472179412842, -0.3769001364707947, -0.35785308480262756, -0.33880603313446045, -0.31975895166397095, -0.30071189999580383, -0.28166481852531433, -0.2626177668571472, -0.2435707002878189, -0.2245236337184906, -0.2054765820503235, -0.18642951548099518, -0.16738244891166687, -0.14833538234233856, -0.12928831577301025, -0.11024126410484314, -0.09119419753551483, -0.07214713096618652, -0.05310007184743881, -0.0340530127286911, -0.015005886554718018, 0.004041176289319992, 0.023088239133358, 0.04213530197739601, 0.06118236482143402, 0.08022943139076233, 0.09927649050951004, 0.11832354962825775, 0.13737061619758606, 0.15641768276691437, 0.17546474933624268, 0.1945118010044098, 0.2135588675737381, 0.2326059341430664, 0.2516529858112335, 0.27070003747940063, 0.28974711894989014, 0.30879417061805725, 0.32784125208854675, 0.34688830375671387, 0.36593538522720337, 0.3849824368953705, 0.4040294885635376, 0.4230765700340271, 0.4421236217021942, 0.46117067337036133, 0.48021775484085083, 0.49926480650901794, 0.5183118581771851, 0.5373589396476746, 0.5564060211181641, 0.5754530429840088, 0.5945001244544983]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 7.0, 11.0, 5.0, 23.0, 33.0, 40.0, 62.0, 74.0, 106.0, 157.0, 209.0, 316.0, 442.0, 632.0, 1097.0, 1872.0, 3672.0, 8693.0, 26567.0, 102667.0, 594807.0, 232489.0, 48241.0, 14356.0, 5340.0, 2618.0, 1356.0, 886.0, 543.0, 351.0, 249.0, 179.0, 130.0, 91.0, 78.0, 50.0, 34.0, 21.0, 13.0, 11.0, 3.0, 7.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.154541015625, -0.14982032775878906, -0.14509963989257812, -0.1403789520263672, -0.13565826416015625, -0.1309375762939453, -0.12621688842773438, -0.12149620056152344, -0.1167755126953125, -0.11205482482910156, -0.10733413696289062, -0.10261344909667969, -0.09789276123046875, -0.09317207336425781, -0.08845138549804688, -0.08373069763183594, -0.079010009765625, -0.07428932189941406, -0.06956863403320312, -0.06484794616699219, -0.06012725830078125, -0.05540657043457031, -0.050685882568359375, -0.04596519470214844, -0.0412445068359375, -0.03652381896972656, -0.031803131103515625, -0.027082443237304688, -0.02236175537109375, -0.017641067504882812, -0.012920379638671875, -0.008199691772460938, -0.00347900390625, 0.0012416839599609375, 0.005962371826171875, 0.010683059692382812, 0.01540374755859375, 0.020124435424804688, 0.024845123291015625, 0.029565811157226562, 0.0342864990234375, 0.03900718688964844, 0.043727874755859375, 0.04844856262207031, 0.05316925048828125, 0.05788993835449219, 0.06261062622070312, 0.06733131408691406, 0.072052001953125, 0.07677268981933594, 0.08149337768554688, 0.08621406555175781, 0.09093475341796875, 0.09565544128417969, 0.10037612915039062, 0.10509681701660156, 0.1098175048828125, 0.11453819274902344, 0.11925888061523438, 0.12397956848144531, 0.12870025634765625, 0.1334209442138672, 0.13814163208007812, 0.14286231994628906, 0.1475830078125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 8.0, 14.0, 12.0, 12.0, 15.0, 18.0, 26.0, 20.0, 31.0, 42.0, 35.0, 42.0, 48.0, 56.0, 57.0, 36.0, 57.0, 59.0, 47.0, 32.0, 49.0, 43.0, 40.0, 37.0, 19.0, 27.0, 31.0, 24.0, 14.0, 4.0, 11.0, 8.0, 4.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4638671875, -0.4498481750488281, -0.43582916259765625, -0.4218101501464844, -0.4077911376953125, -0.3937721252441406, -0.37975311279296875, -0.3657341003417969, -0.351715087890625, -0.3376960754394531, -0.32367706298828125, -0.3096580505371094, -0.2956390380859375, -0.2816200256347656, -0.26760101318359375, -0.2535820007324219, -0.23956298828125, -0.22554397583007812, -0.21152496337890625, -0.19750595092773438, -0.1834869384765625, -0.16946792602539062, -0.15544891357421875, -0.14142990112304688, -0.127410888671875, -0.11339187622070312, -0.09937286376953125, -0.08535385131835938, -0.0713348388671875, -0.057315826416015625, -0.04329681396484375, -0.029277801513671875, -0.0152587890625, -0.001239776611328125, 0.01277923583984375, 0.026798248291015625, 0.0408172607421875, 0.054836273193359375, 0.06885528564453125, 0.08287429809570312, 0.096893310546875, 0.11091232299804688, 0.12493133544921875, 0.13895034790039062, 0.1529693603515625, 0.16698837280273438, 0.18100738525390625, 0.19502639770507812, 0.20904541015625, 0.22306442260742188, 0.23708343505859375, 0.2511024475097656, 0.2651214599609375, 0.2791404724121094, 0.29315948486328125, 0.3071784973144531, 0.321197509765625, 0.3352165222167969, 0.34923553466796875, 0.3632545471191406, 0.3772735595703125, 0.3912925720214844, 0.40531158447265625, 0.4193305969238281, 0.433349609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 10.0, 9.0, 8.0, 17.0, 23.0, 23.0, 48.0, 73.0, 94.0, 129.0, 206.0, 278.0, 396.0, 681.0, 1098.0, 1637.0, 2714.0, 4398.0, 7427.0, 12361.0, 21388.0, 36533.0, 64803.0, 127234.0, 298522.0, 236787.0, 101838.0, 53512.0, 30511.0, 18349.0, 10952.0, 6595.0, 3833.0, 2301.0, 1285.0, 876.0, 535.0, 355.0, 244.0, 164.0, 110.0, 67.0, 43.0, 34.0, 14.0, 11.0, 7.0, 10.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.032806396484375, -0.03177642822265625, -0.0307464599609375, -0.02971649169921875, -0.0286865234375, -0.02765655517578125, -0.0266265869140625, -0.02559661865234375, -0.024566650390625, -0.02353668212890625, -0.0225067138671875, -0.02147674560546875, -0.02044677734375, -0.01941680908203125, -0.0183868408203125, -0.01735687255859375, -0.016326904296875, -0.01529693603515625, -0.0142669677734375, -0.01323699951171875, -0.01220703125, -0.01117706298828125, -0.0101470947265625, -0.00911712646484375, -0.008087158203125, -0.00705718994140625, -0.0060272216796875, -0.00499725341796875, -0.00396728515625, -0.00293731689453125, -0.0019073486328125, -0.00087738037109375, 0.000152587890625, 0.00118255615234375, 0.0022125244140625, 0.00324249267578125, 0.0042724609375, 0.00530242919921875, 0.0063323974609375, 0.00736236572265625, 0.008392333984375, 0.00942230224609375, 0.0104522705078125, 0.01148223876953125, 0.01251220703125, 0.01354217529296875, 0.0145721435546875, 0.01560211181640625, 0.016632080078125, 0.01766204833984375, 0.0186920166015625, 0.01972198486328125, 0.020751953125, 0.02178192138671875, 0.0228118896484375, 0.02384185791015625, 0.024871826171875, 0.02590179443359375, 0.0269317626953125, 0.02796173095703125, 0.02899169921875, 0.03002166748046875, 0.0310516357421875, 0.03208160400390625, 0.033111572265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 5.0, 12.0, 7.0, 7.0, 22.0, 15.0, 15.0, 23.0, 24.0, 22.0, 31.0, 38.0, 41.0, 39.0, 40.0, 50.0, 38.0, 44.0, 48.0, 31.0, 60.0, 39.0, 46.0, 32.0, 34.0, 28.0, 30.0, 21.0, 28.0, 23.0, 18.0, 16.0, 20.0, 13.0, 13.0, 14.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59716796875, -0.5775833129882812, -0.5579986572265625, -0.5384140014648438, -0.518829345703125, -0.49924468994140625, -0.4796600341796875, -0.46007537841796875, -0.44049072265625, -0.42090606689453125, -0.4013214111328125, -0.38173675537109375, -0.362152099609375, -0.34256744384765625, -0.3229827880859375, -0.30339813232421875, -0.2838134765625, -0.26422882080078125, -0.2446441650390625, -0.22505950927734375, -0.205474853515625, -0.18589019775390625, -0.1663055419921875, -0.14672088623046875, -0.12713623046875, -0.10755157470703125, -0.0879669189453125, -0.06838226318359375, -0.048797607421875, -0.02921295166015625, -0.0096282958984375, 0.00995635986328125, 0.029541015625, 0.04912567138671875, 0.0687103271484375, 0.08829498291015625, 0.107879638671875, 0.12746429443359375, 0.1470489501953125, 0.16663360595703125, 0.18621826171875, 0.20580291748046875, 0.2253875732421875, 0.24497222900390625, 0.264556884765625, 0.28414154052734375, 0.3037261962890625, 0.32331085205078125, 0.3428955078125, 0.36248016357421875, 0.3820648193359375, 0.40164947509765625, 0.421234130859375, 0.44081878662109375, 0.4604034423828125, 0.47998809814453125, 0.49957275390625, 0.5191574096679688, 0.5387420654296875, 0.5583267211914062, 0.577911376953125, 0.5974960327148438, 0.6170806884765625, 0.6366653442382812, 0.65625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 7.0, 10.0, 12.0, 22.0, 18.0, 51.0, 64.0, 102.0, 174.0, 274.0, 474.0, 820.0, 1543.0, 3208.0, 8947.0, 76542.0, 906394.0, 37791.0, 6494.0, 2581.0, 1263.0, 697.0, 391.0, 252.0, 154.0, 92.0, 51.0, 33.0, 21.0, 11.0, 17.0, 5.0, 9.0, 4.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01157379150390625, -0.011192798614501953, -0.010811805725097656, -0.01043081283569336, -0.010049819946289062, -0.009668827056884766, -0.009287834167480469, -0.008906841278076172, -0.008525848388671875, -0.008144855499267578, -0.007763862609863281, -0.007382869720458984, -0.0070018768310546875, -0.006620883941650391, -0.006239891052246094, -0.005858898162841797, -0.0054779052734375, -0.005096912384033203, -0.004715919494628906, -0.004334926605224609, -0.0039539337158203125, -0.0035729408264160156, -0.0031919479370117188, -0.002810955047607422, -0.002429962158203125, -0.002048969268798828, -0.0016679763793945312, -0.0012869834899902344, -0.0009059906005859375, -0.0005249977111816406, -0.00014400482177734375, 0.00023698806762695312, 0.00061798095703125, 0.0009989738464355469, 0.0013799667358398438, 0.0017609596252441406, 0.0021419525146484375, 0.0025229454040527344, 0.0029039382934570312, 0.003284931182861328, 0.003665924072265625, 0.004046916961669922, 0.004427909851074219, 0.004808902740478516, 0.0051898956298828125, 0.005570888519287109, 0.005951881408691406, 0.006332874298095703, 0.0067138671875, 0.007094860076904297, 0.007475852966308594, 0.00785684585571289, 0.008237838745117188, 0.008618831634521484, 0.008999824523925781, 0.009380817413330078, 0.009761810302734375, 0.010142803192138672, 0.010523796081542969, 0.010904788970947266, 0.011285781860351562, 0.01166677474975586, 0.012047767639160156, 0.012428760528564453, 0.01280975341796875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 5.0, 3.0, 9.0, 15.0, 12.0, 31.0, 75.0, 174.0, 312.0, 170.0, 81.0, 44.0, 16.0, 13.0, 4.0, 8.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8252601623535156e-05, -2.7457252144813538e-05, -2.666190266609192e-05, -2.58665531873703e-05, -2.507120370864868e-05, -2.4275854229927063e-05, -2.3480504751205444e-05, -2.2685155272483826e-05, -2.1889805793762207e-05, -2.109445631504059e-05, -2.029910683631897e-05, -1.950375735759735e-05, -1.8708407878875732e-05, -1.7913058400154114e-05, -1.7117708921432495e-05, -1.6322359442710876e-05, -1.5527009963989258e-05, -1.473166048526764e-05, -1.393631100654602e-05, -1.3140961527824402e-05, -1.2345612049102783e-05, -1.1550262570381165e-05, -1.0754913091659546e-05, -9.959563612937927e-06, -9.164214134216309e-06, -8.36886465549469e-06, -7.573515176773071e-06, -6.778165698051453e-06, -5.982816219329834e-06, -5.187466740608215e-06, -4.392117261886597e-06, -3.596767783164978e-06, -2.8014183044433594e-06, -2.0060688257217407e-06, -1.210719347000122e-06, -4.153698682785034e-07, 3.7997961044311523e-07, 1.1753290891647339e-06, 1.9706785678863525e-06, 2.766028046607971e-06, 3.56137752532959e-06, 4.3567270040512085e-06, 5.152076482772827e-06, 5.947425961494446e-06, 6.7427754402160645e-06, 7.538124918937683e-06, 8.333474397659302e-06, 9.12882387638092e-06, 9.924173355102539e-06, 1.0719522833824158e-05, 1.1514872312545776e-05, 1.2310221791267395e-05, 1.3105571269989014e-05, 1.3900920748710632e-05, 1.4696270227432251e-05, 1.549161970615387e-05, 1.6286969184875488e-05, 1.7082318663597107e-05, 1.7877668142318726e-05, 1.8673017621040344e-05, 1.9468367099761963e-05, 2.026371657848358e-05, 2.10590660572052e-05, 2.185441553592682e-05, 2.2649765014648438e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 2.0, 1.0, 8.0, 6.0, 9.0, 27.0, 29.0, 88.0, 318.0, 1536.0, 39087.0, 1003594.0, 3027.0, 537.0, 158.0, 40.0, 26.0, 12.0, 15.0, 5.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05267333984375, -0.05103588104248047, -0.04939842224121094, -0.047760963439941406, -0.046123504638671875, -0.044486045837402344, -0.04284858703613281, -0.04121112823486328, -0.03957366943359375, -0.03793621063232422, -0.03629875183105469, -0.034661293029785156, -0.033023834228515625, -0.031386375427246094, -0.029748916625976562, -0.02811145782470703, -0.0264739990234375, -0.02483654022216797, -0.023199081420898438, -0.021561622619628906, -0.019924163818359375, -0.018286705017089844, -0.016649246215820312, -0.015011787414550781, -0.01337432861328125, -0.011736869812011719, -0.010099411010742188, -0.008461952209472656, -0.006824493408203125, -0.005187034606933594, -0.0035495758056640625, -0.0019121170043945312, -0.000274658203125, 0.0013628005981445312, 0.0030002593994140625, 0.004637718200683594, 0.006275177001953125, 0.007912635803222656, 0.009550094604492188, 0.011187553405761719, 0.01282501220703125, 0.014462471008300781, 0.016099929809570312, 0.017737388610839844, 0.019374847412109375, 0.021012306213378906, 0.022649765014648438, 0.02428722381591797, 0.0259246826171875, 0.02756214141845703, 0.029199600219726562, 0.030837059020996094, 0.032474517822265625, 0.034111976623535156, 0.03574943542480469, 0.03738689422607422, 0.03902435302734375, 0.04066181182861328, 0.04229927062988281, 0.043936729431152344, 0.045574188232421875, 0.047211647033691406, 0.04884910583496094, 0.05048656463623047, 0.0521240234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 19.0, 43.0, 103.0, 263.0, 339.0, 106.0, 56.0, 27.0, 9.0, 7.0, 3.0, 1.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004779815673828125, -0.004630982875823975, -0.004482150077819824, -0.004333317279815674, -0.0041844844818115234, -0.004035651683807373, -0.0038868188858032227, -0.0037379860877990723, -0.003589153289794922, -0.0034403204917907715, -0.003291487693786621, -0.0031426548957824707, -0.0029938220977783203, -0.00284498929977417, -0.0026961565017700195, -0.002547323703765869, -0.0023984909057617188, -0.0022496581077575684, -0.002100825309753418, -0.0019519925117492676, -0.0018031597137451172, -0.0016543269157409668, -0.0015054941177368164, -0.001356661319732666, -0.0012078285217285156, -0.0010589957237243652, -0.0009101629257202148, -0.0007613301277160645, -0.0006124973297119141, -0.00046366453170776367, -0.0003148317337036133, -0.0001659989356994629, -1.71661376953125e-05, 0.0001316666603088379, 0.0002804994583129883, 0.00042933225631713867, 0.0005781650543212891, 0.0007269978523254395, 0.0008758306503295898, 0.0010246634483337402, 0.0011734962463378906, 0.001322329044342041, 0.0014711618423461914, 0.0016199946403503418, 0.0017688274383544922, 0.0019176602363586426, 0.002066493034362793, 0.0022153258323669434, 0.0023641586303710938, 0.002512991428375244, 0.0026618242263793945, 0.002810657024383545, 0.0029594898223876953, 0.0031083226203918457, 0.003257155418395996, 0.0034059882164001465, 0.003554821014404297, 0.0037036538124084473, 0.0038524866104125977, 0.004001319408416748, 0.0041501522064208984, 0.004298985004425049, 0.004447817802429199, 0.00459665060043335, 0.0047454833984375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 6.0, 14.0, 32.0, 63.0, 122.0, 268.0, 269.0, 127.0, 42.0, 24.0, 18.0, 16.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4854736030101776, -0.4483156204223633, -0.41115760803222656, -0.37399962544441223, -0.3368416428565979, -0.2996836304664612, -0.26252564787864685, -0.22536763548851013, -0.1882096529006958, -0.15105165541172028, -0.11389366537332535, -0.07673567533493042, -0.039577677845954895, -0.00241968035697937, 0.03473830223083496, 0.07189631462097168, 0.10905429720878601, 0.14621229469776154, 0.18337029218673706, 0.2205282747745514, 0.2576862573623657, 0.29484426975250244, 0.3320022523403168, 0.3691602647304535, 0.4063182473182678, 0.44347622990608215, 0.48063424229621887, 0.5177922248840332, 0.5549502372741699, 0.5921082496643066, 0.6292662024497986, 0.6664242148399353, 0.7035822868347168, 0.7407402992248535, 0.7778982520103455, 0.8150562644004822, 0.8522142767906189, 0.8893722295761108, 0.9265302419662476, 0.9636882543563843, 1.000846266746521, 1.0380042791366577, 1.0751622915267944, 1.1123201847076416, 1.1494781970977783, 1.186636209487915, 1.2237942218780518, 1.2609522342681885, 1.2981102466583252, 1.335268259048462, 1.3724262714385986, 1.4095842838287354, 1.4467421770095825, 1.4839001893997192, 1.521058201789856, 1.5582162141799927, 1.5953741073608398, 1.6325321197509766, 1.6696901321411133, 1.70684814453125, 1.7440060377120972, 1.7811640501022339, 1.8183220624923706, 1.8554800748825073, 1.892638087272644]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 7.0, 5.0, 12.0, 6.0, 15.0, 13.0, 13.0, 14.0, 20.0, 22.0, 23.0, 28.0, 45.0, 38.0, 35.0, 36.0, 54.0, 51.0, 48.0, 47.0, 41.0, 46.0, 40.0, 38.0, 49.0, 39.0, 34.0, 31.0, 30.0, 28.0, 26.0, 13.0, 13.0, 9.0, 14.0, 6.0, 7.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.42314109206199646, -0.41045239567756653, -0.397763729095459, -0.38507503271102905, -0.3723863363265991, -0.3596976697444916, -0.34700897336006165, -0.3343203067779541, -0.32163161039352417, -0.30894291400909424, -0.2962542474269867, -0.28356555104255676, -0.2708768844604492, -0.2581881880760193, -0.24549949169158936, -0.23281081020832062, -0.22012212872505188, -0.20743344724178314, -0.1947447657585144, -0.18205606937408447, -0.16936738789081573, -0.156678706407547, -0.14399001002311707, -0.13130132853984833, -0.11861264705657959, -0.10592396557331085, -0.09323527663946152, -0.08054658770561218, -0.06785790622234344, -0.05516922473907471, -0.04248053580522537, -0.029791846871376038, -0.017103135585784912, -0.004414450377225876, 0.00827423483133316, 0.020962920039892197, 0.03365160524845123, 0.04634028673171997, 0.059028975665569305, 0.07171766459941864, 0.08440634608268738, 0.09709502756595612, 0.10978371649980545, 0.12247240543365479, 0.13516108691692352, 0.14784976840019226, 0.1605384647846222, 0.17322714626789093, 0.18591582775115967, 0.1986045092344284, 0.21129319071769714, 0.22398188710212708, 0.2366705685853958, 0.24935925006866455, 0.2620479464530945, 0.2747366428375244, 0.28742530941963196, 0.3001140058040619, 0.31280267238616943, 0.32549136877059937, 0.3381800651550293, 0.35086873173713684, 0.3635574281215668, 0.3762460947036743, 0.38893479108810425]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 11.0, 10.0, 12.0, 20.0, 25.0, 50.0, 77.0, 102.0, 152.0, 239.0, 421.0, 740.0, 1307.0, 2256.0, 4692.0, 10766.0, 31385.0, 136103.0, 640323.0, 161403.0, 35844.0, 11791.0, 5011.0, 2416.0, 1397.0, 779.0, 434.0, 252.0, 157.0, 114.0, 94.0, 46.0, 37.0, 32.0, 13.0, 16.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.841796875, -0.810089111328125, -0.77838134765625, -0.746673583984375, -0.7149658203125, -0.683258056640625, -0.65155029296875, -0.619842529296875, -0.588134765625, -0.556427001953125, -0.52471923828125, -0.493011474609375, -0.4613037109375, -0.429595947265625, -0.39788818359375, -0.366180419921875, -0.33447265625, -0.302764892578125, -0.27105712890625, -0.239349365234375, -0.2076416015625, -0.175933837890625, -0.14422607421875, -0.112518310546875, -0.080810546875, -0.049102783203125, -0.01739501953125, 0.014312744140625, 0.0460205078125, 0.077728271484375, 0.10943603515625, 0.141143798828125, 0.1728515625, 0.204559326171875, 0.23626708984375, 0.267974853515625, 0.2996826171875, 0.331390380859375, 0.36309814453125, 0.394805908203125, 0.426513671875, 0.458221435546875, 0.48992919921875, 0.521636962890625, 0.5533447265625, 0.585052490234375, 0.61676025390625, 0.648468017578125, 0.68017578125, 0.711883544921875, 0.74359130859375, 0.775299072265625, 0.8070068359375, 0.838714599609375, 0.87042236328125, 0.902130126953125, 0.933837890625, 0.965545654296875, 0.99725341796875, 1.028961181640625, 1.0606689453125, 1.092376708984375, 1.12408447265625, 1.155792236328125, 1.1875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 4.0, 5.0, 5.0, 13.0, 11.0, 10.0, 21.0, 15.0, 26.0, 34.0, 36.0, 37.0, 50.0, 62.0, 64.0, 51.0, 72.0, 59.0, 51.0, 50.0, 59.0, 48.0, 41.0, 25.0, 39.0, 29.0, 17.0, 17.0, 12.0, 12.0, 8.0, 8.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0], "bins": [-1.0771484375, -1.0514297485351562, -1.0257110595703125, -0.9999923706054688, -0.974273681640625, -0.9485549926757812, -0.9228363037109375, -0.8971176147460938, -0.87139892578125, -0.8456802368164062, -0.8199615478515625, -0.7942428588867188, -0.768524169921875, -0.7428054809570312, -0.7170867919921875, -0.6913681030273438, -0.6656494140625, -0.6399307250976562, -0.6142120361328125, -0.5884933471679688, -0.562774658203125, -0.5370559692382812, -0.5113372802734375, -0.48561859130859375, -0.45989990234375, -0.43418121337890625, -0.4084625244140625, -0.38274383544921875, -0.357025146484375, -0.33130645751953125, -0.3055877685546875, -0.27986907958984375, -0.254150390625, -0.22843170166015625, -0.2027130126953125, -0.17699432373046875, -0.151275634765625, -0.12555694580078125, -0.0998382568359375, -0.07411956787109375, -0.04840087890625, -0.02268218994140625, 0.0030364990234375, 0.02875518798828125, 0.054473876953125, 0.08019256591796875, 0.1059112548828125, 0.13162994384765625, 0.1573486328125, 0.18306732177734375, 0.2087860107421875, 0.23450469970703125, 0.260223388671875, 0.28594207763671875, 0.3116607666015625, 0.33737945556640625, 0.36309814453125, 0.38881683349609375, 0.4145355224609375, 0.44025421142578125, 0.465972900390625, 0.49169158935546875, 0.5174102783203125, 0.5431289672851562, 0.56884765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 5.0, 4.0, 6.0, 8.0, 6.0, 10.0, 29.0, 40.0, 60.0, 111.0, 395.0, 2909.0, 974936.0, 68322.0, 1236.0, 238.0, 91.0, 45.0, 35.0, 24.0, 14.0, 7.0, 7.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25390625, -5.10308837890625, -4.9522705078125, -4.80145263671875, -4.650634765625, -4.49981689453125, -4.3489990234375, -4.19818115234375, -4.04736328125, -3.89654541015625, -3.7457275390625, -3.59490966796875, -3.444091796875, -3.29327392578125, -3.1424560546875, -2.99163818359375, -2.8408203125, -2.69000244140625, -2.5391845703125, -2.38836669921875, -2.237548828125, -2.08673095703125, -1.9359130859375, -1.78509521484375, -1.63427734375, -1.48345947265625, -1.3326416015625, -1.18182373046875, -1.031005859375, -0.88018798828125, -0.7293701171875, -0.57855224609375, -0.427734375, -0.27691650390625, -0.1260986328125, 0.02471923828125, 0.175537109375, 0.32635498046875, 0.4771728515625, 0.62799072265625, 0.77880859375, 0.92962646484375, 1.0804443359375, 1.23126220703125, 1.382080078125, 1.53289794921875, 1.6837158203125, 1.83453369140625, 1.9853515625, 2.13616943359375, 2.2869873046875, 2.43780517578125, 2.588623046875, 2.73944091796875, 2.8902587890625, 3.04107666015625, 3.19189453125, 3.34271240234375, 3.4935302734375, 3.64434814453125, 3.795166015625, 3.94598388671875, 4.0968017578125, 4.24761962890625, 4.3984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 5.0, 7.0, 9.0, 6.0, 20.0, 34.0, 47.0, 71.0, 79.0, 108.0, 116.0, 106.0, 99.0, 73.0, 73.0, 35.0, 38.0, 22.0, 17.0, 7.0, 10.0, 1.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84375, -1.7911834716796875, -1.738616943359375, -1.6860504150390625, -1.63348388671875, -1.5809173583984375, -1.528350830078125, -1.4757843017578125, -1.4232177734375, -1.3706512451171875, -1.318084716796875, -1.2655181884765625, -1.21295166015625, -1.1603851318359375, -1.107818603515625, -1.0552520751953125, -1.002685546875, -0.9501190185546875, -0.897552490234375, -0.8449859619140625, -0.79241943359375, -0.7398529052734375, -0.687286376953125, -0.6347198486328125, -0.5821533203125, -0.5295867919921875, -0.477020263671875, -0.4244537353515625, -0.37188720703125, -0.3193206787109375, -0.266754150390625, -0.2141876220703125, -0.16162109375, -0.1090545654296875, -0.056488037109375, -0.0039215087890625, 0.04864501953125, 0.1012115478515625, 0.153778076171875, 0.2063446044921875, 0.2589111328125, 0.3114776611328125, 0.364044189453125, 0.4166107177734375, 0.46917724609375, 0.5217437744140625, 0.574310302734375, 0.6268768310546875, 0.679443359375, 0.7320098876953125, 0.784576416015625, 0.8371429443359375, 0.88970947265625, 0.9422760009765625, 0.994842529296875, 1.0474090576171875, 1.0999755859375, 1.1525421142578125, 1.205108642578125, 1.2576751708984375, 1.31024169921875, 1.3628082275390625, 1.415374755859375, 1.4679412841796875, 1.5205078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 12.0, 18.0, 15.0, 30.0, 54.0, 81.0, 145.0, 284.0, 577.0, 1427.0, 4031.0, 15377.0, 128634.0, 833256.0, 50794.0, 9116.0, 2702.0, 1034.0, 433.0, 241.0, 113.0, 65.0, 49.0, 20.0, 11.0, 12.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033477783203125, -0.03229570388793945, -0.031113624572753906, -0.02993154525756836, -0.028749465942382812, -0.027567386627197266, -0.02638530731201172, -0.025203227996826172, -0.024021148681640625, -0.022839069366455078, -0.02165699005126953, -0.020474910736083984, -0.019292831420898438, -0.01811075210571289, -0.016928672790527344, -0.015746593475341797, -0.01456451416015625, -0.013382434844970703, -0.012200355529785156, -0.01101827621459961, -0.009836196899414062, -0.008654117584228516, -0.007472038269042969, -0.006289958953857422, -0.005107879638671875, -0.003925800323486328, -0.0027437210083007812, -0.0015616416931152344, -0.0003795623779296875, 0.0008025169372558594, 0.0019845962524414062, 0.003166675567626953, 0.0043487548828125, 0.005530834197998047, 0.006712913513183594, 0.00789499282836914, 0.009077072143554688, 0.010259151458740234, 0.011441230773925781, 0.012623310089111328, 0.013805389404296875, 0.014987468719482422, 0.01616954803466797, 0.017351627349853516, 0.018533706665039062, 0.01971578598022461, 0.020897865295410156, 0.022079944610595703, 0.02326202392578125, 0.024444103240966797, 0.025626182556152344, 0.02680826187133789, 0.027990341186523438, 0.029172420501708984, 0.03035449981689453, 0.03153657913208008, 0.032718658447265625, 0.03390073776245117, 0.03508281707763672, 0.036264896392822266, 0.03744697570800781, 0.03862905502319336, 0.039811134338378906, 0.04099321365356445, 0.04217529296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 19.0, 20.0, 51.0, 100.0, 262.0, 311.0, 113.0, 55.0, 32.0, 10.0, 5.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.110004425048828e-05, -2.0531006157398224e-05, -1.9961968064308167e-05, -1.939292997121811e-05, -1.8823891878128052e-05, -1.8254853785037994e-05, -1.7685815691947937e-05, -1.711677759885788e-05, -1.6547739505767822e-05, -1.5978701412677765e-05, -1.5409663319587708e-05, -1.484062522649765e-05, -1.4271587133407593e-05, -1.3702549040317535e-05, -1.3133510947227478e-05, -1.256447285413742e-05, -1.1995434761047363e-05, -1.1426396667957306e-05, -1.0857358574867249e-05, -1.0288320481777191e-05, -9.719282388687134e-06, -9.150244295597076e-06, -8.581206202507019e-06, -8.012168109416962e-06, -7.443130016326904e-06, -6.874091923236847e-06, -6.3050538301467896e-06, -5.736015737056732e-06, -5.166977643966675e-06, -4.5979395508766174e-06, -4.02890145778656e-06, -3.4598633646965027e-06, -2.8908252716064453e-06, -2.321787178516388e-06, -1.7527490854263306e-06, -1.1837109923362732e-06, -6.146728992462158e-07, -4.563480615615845e-08, 5.234032869338989e-07, 1.0924413800239563e-06, 1.6614794731140137e-06, 2.230517566204071e-06, 2.7995556592941284e-06, 3.368593752384186e-06, 3.937631845474243e-06, 4.5066699385643005e-06, 5.075708031654358e-06, 5.644746124744415e-06, 6.213784217834473e-06, 6.78282231092453e-06, 7.351860404014587e-06, 7.920898497104645e-06, 8.489936590194702e-06, 9.05897468328476e-06, 9.628012776374817e-06, 1.0197050869464874e-05, 1.0766088962554932e-05, 1.1335127055644989e-05, 1.1904165148735046e-05, 1.2473203241825104e-05, 1.3042241334915161e-05, 1.3611279428005219e-05, 1.4180317521095276e-05, 1.4749355614185333e-05, 1.531839370727539e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 10.0, 9.0, 15.0, 25.0, 32.0, 40.0, 66.0, 73.0, 113.0, 158.0, 250.0, 360.0, 624.0, 1045.0, 2144.0, 5111.0, 17327.0, 181599.0, 791057.0, 34510.0, 7588.0, 2799.0, 1388.0, 830.0, 479.0, 318.0, 194.0, 123.0, 69.0, 49.0, 40.0, 30.0, 22.0, 14.0, 10.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0285797119140625, -0.027600526809692383, -0.026621341705322266, -0.02564215660095215, -0.02466297149658203, -0.023683786392211914, -0.022704601287841797, -0.02172541618347168, -0.020746231079101562, -0.019767045974731445, -0.018787860870361328, -0.01780867576599121, -0.016829490661621094, -0.015850305557250977, -0.01487112045288086, -0.013891935348510742, -0.012912750244140625, -0.011933565139770508, -0.01095438003540039, -0.009975194931030273, -0.008996009826660156, -0.008016824722290039, -0.007037639617919922, -0.006058454513549805, -0.0050792694091796875, -0.00410008430480957, -0.003120899200439453, -0.002141714096069336, -0.0011625289916992188, -0.00018334388732910156, 0.0007958412170410156, 0.0017750263214111328, 0.00275421142578125, 0.003733396530151367, 0.004712581634521484, 0.0056917667388916016, 0.006670951843261719, 0.007650136947631836, 0.008629322052001953, 0.00960850715637207, 0.010587692260742188, 0.011566877365112305, 0.012546062469482422, 0.013525247573852539, 0.014504432678222656, 0.015483617782592773, 0.01646280288696289, 0.017441987991333008, 0.018421173095703125, 0.019400358200073242, 0.02037954330444336, 0.021358728408813477, 0.022337913513183594, 0.02331709861755371, 0.024296283721923828, 0.025275468826293945, 0.026254653930664062, 0.02723383903503418, 0.028213024139404297, 0.029192209243774414, 0.03017139434814453, 0.03115057945251465, 0.032129764556884766, 0.03310894966125488, 0.034088134765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 4.0, 10.0, 9.0, 8.0, 4.0, 4.0, 15.0, 24.0, 36.0, 46.0, 75.0, 120.0, 206.0, 160.0, 92.0, 63.0, 35.0, 21.0, 16.0, 7.0, 15.0, 5.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01165771484375, -0.011183977127075195, -0.01071023941040039, -0.010236501693725586, -0.009762763977050781, -0.009289026260375977, -0.008815288543701172, -0.008341550827026367, -0.007867813110351562, -0.007394075393676758, -0.006920337677001953, -0.0064465999603271484, -0.005972862243652344, -0.005499124526977539, -0.005025386810302734, -0.00455164909362793, -0.004077911376953125, -0.0036041736602783203, -0.0031304359436035156, -0.002656698226928711, -0.0021829605102539062, -0.0017092227935791016, -0.0012354850769042969, -0.0007617473602294922, -0.0002880096435546875, 0.0001857280731201172, 0.0006594657897949219, 0.0011332035064697266, 0.0016069412231445312, 0.002080678939819336, 0.0025544166564941406, 0.0030281543731689453, 0.00350189208984375, 0.003975629806518555, 0.004449367523193359, 0.004923105239868164, 0.005396842956542969, 0.0058705806732177734, 0.006344318389892578, 0.006818056106567383, 0.0072917938232421875, 0.007765531539916992, 0.008239269256591797, 0.008713006973266602, 0.009186744689941406, 0.009660482406616211, 0.010134220123291016, 0.01060795783996582, 0.011081695556640625, 0.01155543327331543, 0.012029170989990234, 0.012502908706665039, 0.012976646423339844, 0.013450384140014648, 0.013924121856689453, 0.014397859573364258, 0.014871597290039062, 0.015345335006713867, 0.015819072723388672, 0.016292810440063477, 0.01676654815673828, 0.017240285873413086, 0.01771402359008789, 0.018187761306762695, 0.0186614990234375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 61.0, 939.0, 20.0], "bins": [-20.553619384765625, -20.2238826751709, -19.894145965576172, -19.564411163330078, -19.23467445373535, -18.904937744140625, -18.5752010345459, -18.245464324951172, -17.915729522705078, -17.58599281311035, -17.256256103515625, -16.92652130126953, -16.596784591674805, -16.267047882080078, -15.937311172485352, -15.607574462890625, -15.277837753295898, -14.948101043701172, -14.618365287780762, -14.288628578186035, -13.958892822265625, -13.629156112670898, -13.299419403076172, -12.969682693481445, -12.639946937561035, -12.310210227966309, -11.980474472045898, -11.650737762451172, -11.321001052856445, -10.991265296936035, -10.661528587341309, -10.331792831420898, -10.002056121826172, -9.672319412231445, -9.342583656311035, -9.012846946716309, -8.683111190795898, -8.353374481201172, -8.023637771606445, -7.693901538848877, -7.364165782928467, -7.034429550170898, -6.704692840576172, -6.3749566078186035, -6.045220375061035, -5.715484142303467, -5.385747909545898, -5.056011199951172, -4.7262749671936035, -4.396538734436035, -4.066802024841309, -3.7370657920837402, -3.407329559326172, -3.0775933265686035, -2.747856855392456, -2.4181203842163086, -2.088383913040161, -1.7586475610733032, -1.4289112091064453, -1.0991748571395874, -0.7694385051727295, -0.4397021532058716, -0.10996580123901367, 0.2197706699371338, 0.5495068430900574]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 7.0, 10.0, 15.0, 23.0, 23.0, 31.0, 43.0, 59.0, 62.0, 69.0, 89.0, 71.0, 84.0, 85.0, 71.0, 52.0, 54.0, 46.0, 32.0, 19.0, 17.0, 18.0, 11.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-3.5020909309387207, -3.4236693382263184, -3.345247507095337, -3.2668256759643555, -3.188404083251953, -3.109982490539551, -3.0315606594085693, -2.953138828277588, -2.8747172355651855, -2.796295642852783, -2.7178738117218018, -2.6394519805908203, -2.561030387878418, -2.4826087951660156, -2.404186964035034, -2.3257651329040527, -2.2473435401916504, -2.168921947479248, -2.0905001163482666, -2.012078285217285, -1.9336566925048828, -1.855234980583191, -1.776813268661499, -1.6983915567398071, -1.6199698448181152, -1.5415481328964233, -1.4631264209747314, -1.3847047090530396, -1.3062829971313477, -1.2278612852096558, -1.1494395732879639, -1.071017861366272, -0.9925963878631592, -0.9141746759414673, -0.8357529640197754, -0.7573312520980835, -0.6789095401763916, -0.6004878282546997, -0.5220661163330078, -0.4436444044113159, -0.365222692489624, -0.28680098056793213, -0.20837926864624023, -0.12995755672454834, -0.051535844802856445, 0.02688586711883545, 0.10530757904052734, 0.18372929096221924, 0.26215100288391113, 0.340572714805603, 0.4189944267272949, 0.4974161386489868, 0.5758378505706787, 0.6542595624923706, 0.7326812744140625, 0.8111029863357544, 0.8895246982574463, 0.9679464101791382, 1.04636812210083, 1.124789834022522, 1.2032115459442139, 1.2816332578659058, 1.3600549697875977, 1.4384766817092896, 1.5168983936309814]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 10.0, 14.0, 26.0, 41.0, 57.0, 100.0, 154.0, 1067.0, 4190978.0, 1549.0, 92.0, 58.0, 46.0, 34.0, 33.0, 20.0, 9.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-12.515625, -12.267822265625, -12.02001953125, -11.772216796875, -11.5244140625, -11.276611328125, -11.02880859375, -10.781005859375, -10.533203125, -10.285400390625, -10.03759765625, -9.789794921875, -9.5419921875, -9.294189453125, -9.04638671875, -8.798583984375, -8.55078125, -8.302978515625, -8.05517578125, -7.807373046875, -7.5595703125, -7.311767578125, -7.06396484375, -6.816162109375, -6.568359375, -6.320556640625, -6.07275390625, -5.824951171875, -5.5771484375, -5.329345703125, -5.08154296875, -4.833740234375, -4.5859375, -4.338134765625, -4.09033203125, -3.842529296875, -3.5947265625, -3.346923828125, -3.09912109375, -2.851318359375, -2.603515625, -2.355712890625, -2.10791015625, -1.860107421875, -1.6123046875, -1.364501953125, -1.11669921875, -0.868896484375, -0.62109375, -0.373291015625, -0.12548828125, 0.122314453125, 0.3701171875, 0.617919921875, 0.86572265625, 1.113525390625, 1.361328125, 1.609130859375, 1.85693359375, 2.104736328125, 2.3525390625, 2.600341796875, 2.84814453125, 3.095947265625, 3.34375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 15.0, 23.0, 38.0, 60.0, 81.0, 139.0, 163.0, 146.0, 105.0, 95.0, 52.0, 39.0, 30.0, 14.0, 3.0, 4.0, 3.0], "bins": [-0.71728515625, -0.7039737701416016, -0.6906623840332031, -0.6773509979248047, -0.6640396118164062, -0.6507282257080078, -0.6374168395996094, -0.6241054534912109, -0.6107940673828125, -0.5974826812744141, -0.5841712951660156, -0.5708599090576172, -0.5575485229492188, -0.5442371368408203, -0.5309257507324219, -0.5176143646240234, -0.504302978515625, -0.49099159240722656, -0.4776802062988281, -0.4643688201904297, -0.45105743408203125, -0.4377460479736328, -0.4244346618652344, -0.41112327575683594, -0.3978118896484375, -0.38450050354003906, -0.3711891174316406, -0.3578777313232422, -0.34456634521484375, -0.3312549591064453, -0.3179435729980469, -0.30463218688964844, -0.29132080078125, -0.27800941467285156, -0.2646980285644531, -0.2513866424560547, -0.23807525634765625, -0.2247638702392578, -0.21145248413085938, -0.19814109802246094, -0.1848297119140625, -0.17151832580566406, -0.15820693969726562, -0.1448955535888672, -0.13158416748046875, -0.11827278137207031, -0.10496139526367188, -0.09165000915527344, -0.078338623046875, -0.06502723693847656, -0.051715850830078125, -0.03840446472167969, -0.02509307861328125, -0.011781692504882812, 0.001529693603515625, 0.014841079711914062, 0.0281524658203125, 0.04146385192871094, 0.054775238037109375, 0.06808662414550781, 0.08139801025390625, 0.09470939636230469, 0.10802078247070312, 0.12133216857910156, 0.1346435546875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 4.0, 7.0, 11.0, 20.0, 62.0, 333.0, 4187872.0, 5375.0, 220.0, 104.0, 51.0, 36.0, 37.0, 20.0, 21.0, 25.0, 15.0, 9.0, 11.0, 7.0, 8.0, 5.0, 7.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.03125, -14.193359375, -13.35546875, -12.517578125, -11.6796875, -10.841796875, -10.00390625, -9.166015625, -8.328125, -7.490234375, -6.65234375, -5.814453125, -4.9765625, -4.138671875, -3.30078125, -2.462890625, -1.625, -0.787109375, 0.05078125, 0.888671875, 1.7265625, 2.564453125, 3.40234375, 4.240234375, 5.078125, 5.916015625, 6.75390625, 7.591796875, 8.4296875, 9.267578125, 10.10546875, 10.943359375, 11.78125, 12.619140625, 13.45703125, 14.294921875, 15.1328125, 15.970703125, 16.80859375, 17.646484375, 18.484375, 19.322265625, 20.16015625, 20.998046875, 21.8359375, 22.673828125, 23.51171875, 24.349609375, 25.1875, 26.025390625, 26.86328125, 27.701171875, 28.5390625, 29.376953125, 30.21484375, 31.052734375, 31.890625, 32.728515625, 33.56640625, 34.404296875, 35.2421875, 36.080078125, 36.91796875, 37.755859375, 38.59375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 8.0, 6.0, 14.0, 19.0, 48.0, 193.0, 507.0, 1367.0, 1080.0, 356.0, 110.0, 71.0, 41.0, 40.0, 33.0, 23.0, 13.0, 17.0, 17.0, 14.0, 15.0, 9.0, 6.0, 10.0, 7.0, 6.0, 2.0, 3.0, 6.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1019287109375, -0.09728431701660156, -0.09263992309570312, -0.08799552917480469, -0.08335113525390625, -0.07870674133300781, -0.07406234741210938, -0.06941795349121094, -0.0647735595703125, -0.06012916564941406, -0.055484771728515625, -0.05084037780761719, -0.04619598388671875, -0.04155158996582031, -0.036907196044921875, -0.03226280212402344, -0.027618408203125, -0.022974014282226562, -0.018329620361328125, -0.013685226440429688, -0.00904083251953125, -0.0043964385986328125, 0.000247955322265625, 0.0048923492431640625, 0.0095367431640625, 0.014181137084960938, 0.018825531005859375, 0.023469924926757812, 0.02811431884765625, 0.03275871276855469, 0.037403106689453125, 0.04204750061035156, 0.04669189453125, 0.05133628845214844, 0.055980682373046875, 0.06062507629394531, 0.06526947021484375, 0.06991386413574219, 0.07455825805664062, 0.07920265197753906, 0.0838470458984375, 0.08849143981933594, 0.09313583374023438, 0.09778022766113281, 0.10242462158203125, 0.10706901550292969, 0.11171340942382812, 0.11635780334472656, 0.121002197265625, 0.12564659118652344, 0.13029098510742188, 0.1349353790283203, 0.13957977294921875, 0.1442241668701172, 0.14886856079101562, 0.15351295471191406, 0.1581573486328125, 0.16280174255371094, 0.16744613647460938, 0.1720905303955078, 0.17673492431640625, 0.1813793182373047, 0.18602371215820312, 0.19066810607910156, 0.1953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 198.0, 779.0, 32.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.541913986206055, -10.350611686706543, -10.159309387207031, -9.968008041381836, -9.776705741882324, -9.585403442382812, -9.3941011428833, -9.202798843383789, -9.011497497558594, -8.820195198059082, -8.62889289855957, -8.437591552734375, -8.246289253234863, -8.054986953735352, -7.86368465423584, -7.672382354736328, -7.481080055236816, -7.289777755737305, -7.098475933074951, -6.9071736335754395, -6.715871810913086, -6.524569511413574, -6.3332672119140625, -6.141964912414551, -5.950663089752197, -5.7593607902526855, -5.568058967590332, -5.37675666809082, -5.185454368591309, -4.994152545928955, -4.802850246429443, -4.61154842376709, -4.420246124267578, -4.228943824768066, -4.037642002105713, -3.846339702606201, -3.6550376415252686, -3.463735580444336, -3.272433280944824, -3.0811312198638916, -2.88982892036438, -2.6985268592834473, -2.5072245597839355, -2.315922498703003, -2.1246204376220703, -1.9333183765411377, -1.7420161962509155, -1.5507140159606934, -1.3594119548797607, -1.1681098937988281, -0.976807713508606, -0.7855055928230286, -0.5942034721374512, -0.4029013514518738, -0.2115992307662964, -0.02029705047607422, 0.1710050106048584, 0.3623071312904358, 0.5536092519760132, 0.7449113726615906, 0.936213493347168, 1.1275155544281006, 1.3188177347183228, 1.510119915008545, 1.7014219760894775]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 7.0, 18.0, 28.0, 25.0, 37.0, 65.0, 83.0, 85.0, 104.0, 99.0, 97.0, 88.0, 73.0, 51.0, 39.0, 36.0, 25.0, 16.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1058284044265747, -1.0793671607971191, -1.052905797958374, -1.0264445543289185, -0.9999832510948181, -0.9735219478607178, -0.9470607042312622, -0.9205994009971619, -0.8941380977630615, -0.8676767945289612, -0.8412154912948608, -0.8147542476654053, -0.7882929444313049, -0.7618316411972046, -0.735370397567749, -0.7089090943336487, -0.6824477910995483, -0.655986487865448, -0.6295251846313477, -0.6030639410018921, -0.5766026377677917, -0.5501413345336914, -0.5236800909042358, -0.4972187876701355, -0.47075748443603516, -0.4442961812019348, -0.41783490777015686, -0.3913736343383789, -0.36491233110427856, -0.3384510278701782, -0.31198975443840027, -0.2855284810066223, -0.25906723737716675, -0.2326059490442276, -0.20614466071128845, -0.1796833723783493, -0.15322208404541016, -0.126760795712471, -0.10029950737953186, -0.07383821904659271, -0.047376930713653564, -0.020915642380714417, 0.0055456459522247314, 0.03200693428516388, 0.05846822261810303, 0.08492951095104218, 0.11139079928398132, 0.13785208761692047, 0.16431337594985962, 0.19077466428279877, 0.21723595261573792, 0.24369724094867706, 0.2701585292816162, 0.29661983251571655, 0.3230811059474945, 0.34954237937927246, 0.3760036826133728, 0.40246498584747314, 0.4289262592792511, 0.45538753271102905, 0.4818488359451294, 0.5083101391792297, 0.5347714424133301, 0.5612326860427856, 0.587693989276886]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 5.0, 9.0, 6.0, 13.0, 17.0, 45.0, 76.0, 179.0, 503.0, 1873.0, 16802.0, 1000343.0, 25448.0, 2244.0, 585.0, 211.0, 87.0, 45.0, 26.0, 10.0, 7.0, 8.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3603515625, -0.34625244140625, -0.3321533203125, -0.31805419921875, -0.303955078125, -0.28985595703125, -0.2757568359375, -0.26165771484375, -0.24755859375, -0.23345947265625, -0.2193603515625, -0.20526123046875, -0.191162109375, -0.17706298828125, -0.1629638671875, -0.14886474609375, -0.134765625, -0.12066650390625, -0.1065673828125, -0.09246826171875, -0.078369140625, -0.06427001953125, -0.0501708984375, -0.03607177734375, -0.02197265625, -0.00787353515625, 0.0062255859375, 0.02032470703125, 0.034423828125, 0.04852294921875, 0.0626220703125, 0.07672119140625, 0.0908203125, 0.10491943359375, 0.1190185546875, 0.13311767578125, 0.147216796875, 0.16131591796875, 0.1754150390625, 0.18951416015625, 0.20361328125, 0.21771240234375, 0.2318115234375, 0.24591064453125, 0.260009765625, 0.27410888671875, 0.2882080078125, 0.30230712890625, 0.31640625, 0.33050537109375, 0.3446044921875, 0.35870361328125, 0.372802734375, 0.38690185546875, 0.4010009765625, 0.41510009765625, 0.42919921875, 0.44329833984375, 0.4573974609375, 0.47149658203125, 0.485595703125, 0.49969482421875, 0.5137939453125, 0.52789306640625, 0.5419921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 10.0, 13.0, 21.0, 35.0, 52.0, 120.0, 144.0, 201.0, 154.0, 99.0, 69.0, 47.0, 18.0, 11.0, 7.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2197265625, -1.192901611328125, -1.16607666015625, -1.139251708984375, -1.1124267578125, -1.085601806640625, -1.05877685546875, -1.031951904296875, -1.005126953125, -0.978302001953125, -0.95147705078125, -0.924652099609375, -0.8978271484375, -0.871002197265625, -0.84417724609375, -0.817352294921875, -0.79052734375, -0.763702392578125, -0.73687744140625, -0.710052490234375, -0.6832275390625, -0.656402587890625, -0.62957763671875, -0.602752685546875, -0.575927734375, -0.549102783203125, -0.52227783203125, -0.495452880859375, -0.4686279296875, -0.441802978515625, -0.41497802734375, -0.388153076171875, -0.361328125, -0.334503173828125, -0.30767822265625, -0.280853271484375, -0.2540283203125, -0.227203369140625, -0.20037841796875, -0.173553466796875, -0.146728515625, -0.119903564453125, -0.09307861328125, -0.066253662109375, -0.0394287109375, -0.012603759765625, 0.01422119140625, 0.041046142578125, 0.06787109375, 0.094696044921875, 0.12152099609375, 0.148345947265625, 0.1751708984375, 0.201995849609375, 0.22882080078125, 0.255645751953125, 0.282470703125, 0.309295654296875, 0.33612060546875, 0.362945556640625, 0.3897705078125, 0.416595458984375, 0.44342041015625, 0.470245361328125, 0.4970703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 9.0, 1.0, 9.0, 19.0, 20.0, 26.0, 49.0, 63.0, 98.0, 122.0, 195.0, 295.0, 483.0, 801.0, 1317.0, 2397.0, 4291.0, 8910.0, 22431.0, 63527.0, 246964.0, 523335.0, 110674.0, 34936.0, 13721.0, 6140.0, 3010.0, 1715.0, 1070.0, 651.0, 430.0, 298.0, 166.0, 133.0, 76.0, 39.0, 40.0, 27.0, 21.0, 15.0, 7.0, 11.0, 5.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.05096435546875, -0.04951763153076172, -0.04807090759277344, -0.046624183654785156, -0.045177459716796875, -0.043730735778808594, -0.04228401184082031, -0.04083728790283203, -0.03939056396484375, -0.03794384002685547, -0.03649711608886719, -0.035050392150878906, -0.033603668212890625, -0.032156944274902344, -0.030710220336914062, -0.02926349639892578, -0.0278167724609375, -0.02637004852294922, -0.024923324584960938, -0.023476600646972656, -0.022029876708984375, -0.020583152770996094, -0.019136428833007812, -0.01768970489501953, -0.01624298095703125, -0.014796257019042969, -0.013349533081054688, -0.011902809143066406, -0.010456085205078125, -0.009009361267089844, -0.0075626373291015625, -0.006115913391113281, -0.004669189453125, -0.0032224655151367188, -0.0017757415771484375, -0.00032901763916015625, 0.001117706298828125, 0.0025644302368164062, 0.0040111541748046875, 0.005457878112792969, 0.00690460205078125, 0.008351325988769531, 0.009798049926757812, 0.011244773864746094, 0.012691497802734375, 0.014138221740722656, 0.015584945678710938, 0.01703166961669922, 0.0184783935546875, 0.01992511749267578, 0.021371841430664062, 0.022818565368652344, 0.024265289306640625, 0.025712013244628906, 0.027158737182617188, 0.02860546112060547, 0.03005218505859375, 0.03149890899658203, 0.03294563293457031, 0.034392356872558594, 0.035839080810546875, 0.037285804748535156, 0.03873252868652344, 0.04017925262451172, 0.0416259765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 5.0, 3.0, 2.0, 4.0, 5.0, 9.0, 17.0, 21.0, 32.0, 48.0, 48.0, 75.0, 83.0, 88.0, 95.0, 86.0, 84.0, 71.0, 58.0, 44.0, 32.0, 21.0, 26.0, 15.0, 8.0, 7.0, 5.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.9560546875, -0.9299240112304688, -0.9037933349609375, -0.8776626586914062, -0.851531982421875, -0.8254013061523438, -0.7992706298828125, -0.7731399536132812, -0.74700927734375, -0.7208786010742188, -0.6947479248046875, -0.6686172485351562, -0.642486572265625, -0.6163558959960938, -0.5902252197265625, -0.5640945434570312, -0.5379638671875, -0.5118331909179688, -0.4857025146484375, -0.45957183837890625, -0.433441162109375, -0.40731048583984375, -0.3811798095703125, -0.35504913330078125, -0.32891845703125, -0.30278778076171875, -0.2766571044921875, -0.25052642822265625, -0.224395751953125, -0.19826507568359375, -0.1721343994140625, -0.14600372314453125, -0.119873046875, -0.09374237060546875, -0.0676116943359375, -0.04148101806640625, -0.015350341796875, 0.01078033447265625, 0.0369110107421875, 0.06304168701171875, 0.08917236328125, 0.11530303955078125, 0.1414337158203125, 0.16756439208984375, 0.193695068359375, 0.21982574462890625, 0.2459564208984375, 0.27208709716796875, 0.2982177734375, 0.32434844970703125, 0.3504791259765625, 0.37660980224609375, 0.402740478515625, 0.42887115478515625, 0.4550018310546875, 0.48113250732421875, 0.50726318359375, 0.5333938598632812, 0.5595245361328125, 0.5856552124023438, 0.611785888671875, 0.6379165649414062, 0.6640472412109375, 0.6901779174804688, 0.71630859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 10.0, 10.0, 10.0, 17.0, 23.0, 30.0, 57.0, 78.0, 138.0, 214.0, 324.0, 544.0, 986.0, 1760.0, 3564.0, 9684.0, 91166.0, 904114.0, 24715.0, 5640.0, 2415.0, 1382.0, 729.0, 362.0, 212.0, 139.0, 72.0, 43.0, 26.0, 15.0, 15.0, 14.0, 9.0, 8.0, 10.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.007595062255859375, -0.007344305515289307, -0.007093548774719238, -0.00684279203414917, -0.0065920352935791016, -0.006341278553009033, -0.006090521812438965, -0.0058397650718688965, -0.005589008331298828, -0.00533825159072876, -0.005087494850158691, -0.004836738109588623, -0.004585981369018555, -0.004335224628448486, -0.004084467887878418, -0.0038337111473083496, -0.0035829544067382812, -0.003332197666168213, -0.0030814409255981445, -0.002830684185028076, -0.002579927444458008, -0.0023291707038879395, -0.002078413963317871, -0.0018276572227478027, -0.0015769004821777344, -0.001326143741607666, -0.0010753870010375977, -0.0008246302604675293, -0.0005738735198974609, -0.0003231167793273926, -7.236003875732422e-05, 0.00017839670181274414, 0.0004291534423828125, 0.0006799101829528809, 0.0009306669235229492, 0.0011814236640930176, 0.001432180404663086, 0.0016829371452331543, 0.0019336938858032227, 0.002184450626373291, 0.0024352073669433594, 0.0026859641075134277, 0.002936720848083496, 0.0031874775886535645, 0.003438234329223633, 0.003688991069793701, 0.0039397478103637695, 0.004190504550933838, 0.004441261291503906, 0.004692018032073975, 0.004942774772644043, 0.005193531513214111, 0.00544428825378418, 0.005695044994354248, 0.005945801734924316, 0.006196558475494385, 0.006447315216064453, 0.0066980719566345215, 0.00694882869720459, 0.007199585437774658, 0.0074503421783447266, 0.007701098918914795, 0.007951855659484863, 0.008202612400054932, 0.008453369140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 0.0, 5.0, 4.0, 9.0, 3.0, 7.0, 8.0, 10.0, 22.0, 22.0, 44.0, 62.0, 100.0, 237.0, 197.0, 87.0, 61.0, 31.0, 24.0, 12.0, 13.0, 8.0, 7.0, 7.0, 4.0, 4.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1801719665527344e-05, -1.1443160474300385e-05, -1.1084601283073425e-05, -1.0726042091846466e-05, -1.0367482900619507e-05, -1.0008923709392548e-05, -9.650364518165588e-06, -9.291805326938629e-06, -8.93324613571167e-06, -8.57468694448471e-06, -8.216127753257751e-06, -7.857568562030792e-06, -7.499009370803833e-06, -7.140450179576874e-06, -6.7818909883499146e-06, -6.423331797122955e-06, -6.064772605895996e-06, -5.706213414669037e-06, -5.347654223442078e-06, -4.989095032215118e-06, -4.630535840988159e-06, -4.2719766497612e-06, -3.913417458534241e-06, -3.5548582673072815e-06, -3.1962990760803223e-06, -2.837739884853363e-06, -2.479180693626404e-06, -2.1206215023994446e-06, -1.7620623111724854e-06, -1.4035031199455261e-06, -1.044943928718567e-06, -6.863847374916077e-07, -3.2782554626464844e-07, 3.073364496231079e-08, 3.8929283618927e-07, 7.478520274162292e-07, 1.1064112186431885e-06, 1.4649704098701477e-06, 1.823529601097107e-06, 2.182088792324066e-06, 2.5406479835510254e-06, 2.8992071747779846e-06, 3.257766366004944e-06, 3.616325557231903e-06, 3.974884748458862e-06, 4.3334439396858215e-06, 4.692003130912781e-06, 5.05056232213974e-06, 5.409121513366699e-06, 5.7676807045936584e-06, 6.126239895820618e-06, 6.484799087047577e-06, 6.843358278274536e-06, 7.201917469501495e-06, 7.560476660728455e-06, 7.919035851955414e-06, 8.277595043182373e-06, 8.636154234409332e-06, 8.994713425636292e-06, 9.35327261686325e-06, 9.71183180809021e-06, 1.007039099931717e-05, 1.0428950190544128e-05, 1.0787509381771088e-05, 1.1146068572998047e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 3.0, 10.0, 11.0, 36.0, 114.0, 1782.0, 1038795.0, 7311.0, 392.0, 40.0, 18.0, 9.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0655517578125, -0.06390094757080078, -0.06225013732910156, -0.060599327087402344, -0.058948516845703125, -0.057297706604003906, -0.05564689636230469, -0.05399608612060547, -0.05234527587890625, -0.05069446563720703, -0.04904365539550781, -0.047392845153808594, -0.045742034912109375, -0.044091224670410156, -0.04244041442871094, -0.04078960418701172, -0.0391387939453125, -0.03748798370361328, -0.03583717346191406, -0.034186363220214844, -0.032535552978515625, -0.030884742736816406, -0.029233932495117188, -0.02758312225341797, -0.02593231201171875, -0.02428150177001953, -0.022630691528320312, -0.020979881286621094, -0.019329071044921875, -0.017678260803222656, -0.016027450561523438, -0.014376640319824219, -0.012725830078125, -0.011075019836425781, -0.009424209594726562, -0.007773399353027344, -0.006122589111328125, -0.004471778869628906, -0.0028209686279296875, -0.0011701583862304688, 0.00048065185546875, 0.0021314620971679688, 0.0037822723388671875, 0.005433082580566406, 0.007083892822265625, 0.008734703063964844, 0.010385513305664062, 0.012036323547363281, 0.0136871337890625, 0.015337944030761719, 0.016988754272460938, 0.018639564514160156, 0.020290374755859375, 0.021941184997558594, 0.023591995239257812, 0.02524280548095703, 0.02689361572265625, 0.02854442596435547, 0.030195236206054688, 0.031846046447753906, 0.033496856689453125, 0.035147666931152344, 0.03679847717285156, 0.03844928741455078, 0.04010009765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 11.0, 18.0, 50.0, 162.0, 432.0, 191.0, 58.0, 30.0, 15.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0034885406494140625, -0.003400474786758423, -0.003312408924102783, -0.0032243430614471436, -0.003136277198791504, -0.0030482113361358643, -0.0029601454734802246, -0.002872079610824585, -0.0027840137481689453, -0.0026959478855133057, -0.002607882022857666, -0.0025198161602020264, -0.0024317502975463867, -0.002343684434890747, -0.0022556185722351074, -0.0021675527095794678, -0.002079486846923828, -0.0019914209842681885, -0.0019033551216125488, -0.0018152892589569092, -0.0017272233963012695, -0.0016391575336456299, -0.0015510916709899902, -0.0014630258083343506, -0.001374959945678711, -0.0012868940830230713, -0.0011988282203674316, -0.001110762357711792, -0.0010226964950561523, -0.0009346306324005127, -0.000846564769744873, -0.0007584989070892334, -0.0006704330444335938, -0.0005823671817779541, -0.0004943013191223145, -0.0004062354564666748, -0.00031816959381103516, -0.0002301037311553955, -0.00014203786849975586, -5.397200584411621e-05, 3.409385681152344e-05, 0.00012215971946716309, 0.00021022558212280273, 0.0002982914447784424, 0.00038635730743408203, 0.0004744231700897217, 0.0005624890327453613, 0.000650554895401001, 0.0007386207580566406, 0.0008266866207122803, 0.0009147524833679199, 0.0010028183460235596, 0.0010908842086791992, 0.0011789500713348389, 0.0012670159339904785, 0.0013550817966461182, 0.0014431476593017578, 0.0015312135219573975, 0.0016192793846130371, 0.0017073452472686768, 0.0017954111099243164, 0.001883476972579956, 0.0019715428352355957, 0.0020596086978912354, 0.002147674560546875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 985.0, 27.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.77761459350586, -8.549973487854004, -8.322331428527832, -8.094690322875977, -7.867048740386963, -7.639407157897949, -7.411766052246094, -7.18412446975708, -6.956482887268066, -6.728841304779053, -6.501200199127197, -6.273558616638184, -6.04591703414917, -5.818275451660156, -5.590634346008301, -5.362992763519287, -5.135351657867432, -4.907710075378418, -4.6800689697265625, -4.452427387237549, -4.224785804748535, -3.9971444606781006, -3.769503116607666, -3.5418615341186523, -3.3142201900482178, -3.086578845977783, -2.8589372634887695, -2.631295919418335, -2.4036545753479004, -2.1760129928588867, -1.9483716487884521, -1.720730185508728, -1.493088722229004, -1.2654472589492798, -1.0378057956695557, -0.8101644515991211, -0.582522988319397, -0.35488152503967285, -0.12724018096923828, 0.10040128231048584, 0.32804274559020996, 0.5556842088699341, 0.7833256125450134, 1.0109670162200928, 1.238608479499817, 1.466249942779541, 1.6938912868499756, 1.9215327501296997, 2.149174213409424, 2.3768155574798584, 2.604457139968872, 2.8320984840393066, 3.0597400665283203, 3.287381410598755, 3.5150227546691895, 3.742664337158203, 3.9703056812286377, 4.197947025299072, 4.425588607788086, 4.653229713439941, 4.880871295928955, 5.108512878417969, 5.336153984069824, 5.563795566558838, 5.791437149047852]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 10.0, 16.0, 18.0, 44.0, 53.0, 113.0, 118.0, 177.0, 137.0, 118.0, 88.0, 55.0, 31.0, 10.0, 15.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0881621837615967, -1.0643454790115356, -1.0405287742614746, -1.0167120695114136, -0.9928953051567078, -0.9690786004066467, -0.9452618956565857, -0.9214451313018799, -0.8976284265518188, -0.8738117218017578, -0.8499950170516968, -0.826178252696991, -0.8023615479469299, -0.7785448431968689, -0.7547281384468079, -0.730911374092102, -0.707094669342041, -0.68327796459198, -0.659461259841919, -0.6356444954872131, -0.6118277907371521, -0.5880110859870911, -0.56419438123703, -0.5403776168823242, -0.516560971736908, -0.4927442669868469, -0.4689275324344635, -0.44511082768440247, -0.42129409313201904, -0.397477388381958, -0.373660683631897, -0.34984394907951355, -0.32602718472480774, -0.3022104799747467, -0.2783937454223633, -0.25457704067230225, -0.23076030611991882, -0.2069436013698578, -0.18312688171863556, -0.15931016206741333, -0.1354934424161911, -0.11167672276496887, -0.08786000311374664, -0.06404329091310501, -0.04022657126188278, -0.016409851610660553, 0.007406860589981079, 0.031223580241203308, 0.05504029989242554, 0.07885701954364777, 0.10267373919487, 0.12649044394493103, 0.15030717849731445, 0.1741238832473755, 0.19794060289859772, 0.22175732254981995, 0.24557404220104218, 0.2693907618522644, 0.29320746660232544, 0.31702420115470886, 0.3408409059047699, 0.3646576404571533, 0.38847434520721436, 0.4122910499572754, 0.4361077845096588]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 7.0, 5.0, 5.0, 1.0, 10.0, 14.0, 14.0, 17.0, 20.0, 32.0, 37.0, 57.0, 99.0, 228.0, 639.0, 2678.0, 18139.0, 664385.0, 344658.0, 14167.0, 2249.0, 612.0, 187.0, 84.0, 56.0, 32.0, 22.0, 17.0, 14.0, 13.0, 8.0, 12.0, 10.0, 10.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.5693359375, -1.5256805419921875, -1.482025146484375, -1.4383697509765625, -1.39471435546875, -1.3510589599609375, -1.307403564453125, -1.2637481689453125, -1.2200927734375, -1.1764373779296875, -1.132781982421875, -1.0891265869140625, -1.04547119140625, -1.0018157958984375, -0.958160400390625, -0.9145050048828125, -0.870849609375, -0.8271942138671875, -0.783538818359375, -0.7398834228515625, -0.69622802734375, -0.6525726318359375, -0.608917236328125, -0.5652618408203125, -0.5216064453125, -0.4779510498046875, -0.434295654296875, -0.3906402587890625, -0.34698486328125, -0.3033294677734375, -0.259674072265625, -0.2160186767578125, -0.17236328125, -0.1287078857421875, -0.085052490234375, -0.0413970947265625, 0.00225830078125, 0.0459136962890625, 0.089569091796875, 0.1332244873046875, 0.1768798828125, 0.2205352783203125, 0.264190673828125, 0.3078460693359375, 0.35150146484375, 0.3951568603515625, 0.438812255859375, 0.4824676513671875, 0.526123046875, 0.5697784423828125, 0.613433837890625, 0.6570892333984375, 0.70074462890625, 0.7444000244140625, 0.788055419921875, 0.8317108154296875, 0.8753662109375, 0.9190216064453125, 0.962677001953125, 1.0063323974609375, 1.04998779296875, 1.0936431884765625, 1.137298583984375, 1.1809539794921875, 1.224609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 3.0, 11.0, 14.0, 24.0, 42.0, 92.0, 123.0, 226.0, 172.0, 137.0, 77.0, 50.0, 20.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.55078125, -5.43231201171875, -5.3138427734375, -5.19537353515625, -5.076904296875, -4.95843505859375, -4.8399658203125, -4.72149658203125, -4.60302734375, -4.48455810546875, -4.3660888671875, -4.24761962890625, -4.129150390625, -4.01068115234375, -3.8922119140625, -3.77374267578125, -3.6552734375, -3.53680419921875, -3.4183349609375, -3.29986572265625, -3.181396484375, -3.06292724609375, -2.9444580078125, -2.82598876953125, -2.70751953125, -2.58905029296875, -2.4705810546875, -2.35211181640625, -2.233642578125, -2.11517333984375, -1.9967041015625, -1.87823486328125, -1.759765625, -1.64129638671875, -1.5228271484375, -1.40435791015625, -1.285888671875, -1.16741943359375, -1.0489501953125, -0.93048095703125, -0.81201171875, -0.69354248046875, -0.5750732421875, -0.45660400390625, -0.338134765625, -0.21966552734375, -0.1011962890625, 0.01727294921875, 0.1357421875, 0.25421142578125, 0.3726806640625, 0.49114990234375, 0.609619140625, 0.72808837890625, 0.8465576171875, 0.96502685546875, 1.08349609375, 1.20196533203125, 1.3204345703125, 1.43890380859375, 1.557373046875, 1.67584228515625, 1.7943115234375, 1.91278076171875, 2.03125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 8.0, 1.0, 6.0, 10.0, 13.0, 7.0, 18.0, 23.0, 33.0, 41.0, 43.0, 55.0, 60.0, 97.0, 42378.0, 1005330.0, 102.0, 78.0, 59.0, 41.0, 28.0, 41.0, 20.0, 17.0, 7.0, 14.0, 7.0, 6.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.88330078125, -7.5556640625, -7.22802734375, -6.900390625, -6.57275390625, -6.2451171875, -5.91748046875, -5.58984375, -5.26220703125, -4.9345703125, -4.60693359375, -4.279296875, -3.95166015625, -3.6240234375, -3.29638671875, -2.96875, -2.64111328125, -2.3134765625, -1.98583984375, -1.658203125, -1.33056640625, -1.0029296875, -0.67529296875, -0.34765625, -0.02001953125, 0.3076171875, 0.63525390625, 0.962890625, 1.29052734375, 1.6181640625, 1.94580078125, 2.2734375, 2.60107421875, 2.9287109375, 3.25634765625, 3.583984375, 3.91162109375, 4.2392578125, 4.56689453125, 4.89453125, 5.22216796875, 5.5498046875, 5.87744140625, 6.205078125, 6.53271484375, 6.8603515625, 7.18798828125, 7.515625, 7.84326171875, 8.1708984375, 8.49853515625, 8.826171875, 9.15380859375, 9.4814453125, 9.80908203125, 10.13671875, 10.46435546875, 10.7919921875, 11.11962890625, 11.447265625, 11.77490234375, 12.1025390625, 12.43017578125, 12.7578125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 7.0, 2.0, 5.0, 9.0, 14.0, 8.0, 15.0, 25.0, 32.0, 41.0, 43.0, 55.0, 57.0, 84.0, 95.0, 91.0, 84.0, 79.0, 61.0, 42.0, 28.0, 43.0, 20.0, 16.0, 7.0, 14.0, 8.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8193359375, -1.7469329833984375, -1.674530029296875, -1.6021270751953125, -1.52972412109375, -1.4573211669921875, -1.384918212890625, -1.3125152587890625, -1.2401123046875, -1.1677093505859375, -1.095306396484375, -1.0229034423828125, -0.95050048828125, -0.8780975341796875, -0.805694580078125, -0.7332916259765625, -0.660888671875, -0.5884857177734375, -0.516082763671875, -0.4436798095703125, -0.37127685546875, -0.2988739013671875, -0.226470947265625, -0.1540679931640625, -0.0816650390625, -0.0092620849609375, 0.063140869140625, 0.1355438232421875, 0.20794677734375, 0.2803497314453125, 0.352752685546875, 0.4251556396484375, 0.49755859375, 0.5699615478515625, 0.642364501953125, 0.7147674560546875, 0.78717041015625, 0.8595733642578125, 0.931976318359375, 1.0043792724609375, 1.0767822265625, 1.1491851806640625, 1.221588134765625, 1.2939910888671875, 1.36639404296875, 1.4387969970703125, 1.511199951171875, 1.5836029052734375, 1.656005859375, 1.7284088134765625, 1.800811767578125, 1.8732147216796875, 1.94561767578125, 2.0180206298828125, 2.090423583984375, 2.1628265380859375, 2.2352294921875, 2.3076324462890625, 2.380035400390625, 2.4524383544921875, 2.52484130859375, 2.5972442626953125, 2.669647216796875, 2.7420501708984375, 2.814453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 7.0, 13.0, 15.0, 20.0, 47.0, 90.0, 228.0, 627.0, 2049.0, 8533.0, 60130.0, 919256.0, 47497.0, 7298.0, 1790.0, 553.0, 180.0, 72.0, 34.0, 29.0, 17.0, 6.0, 7.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.059112548828125, -0.057034969329833984, -0.05495738983154297, -0.05287981033325195, -0.05080223083496094, -0.04872465133666992, -0.046647071838378906, -0.04456949234008789, -0.042491912841796875, -0.04041433334350586, -0.038336753845214844, -0.03625917434692383, -0.03418159484863281, -0.0321040153503418, -0.03002643585205078, -0.027948856353759766, -0.02587127685546875, -0.023793697357177734, -0.02171611785888672, -0.019638538360595703, -0.017560958862304688, -0.015483379364013672, -0.013405799865722656, -0.01132822036743164, -0.009250640869140625, -0.007173061370849609, -0.005095481872558594, -0.003017902374267578, -0.0009403228759765625, 0.0011372566223144531, 0.0032148361206054688, 0.005292415618896484, 0.0073699951171875, 0.009447574615478516, 0.011525154113769531, 0.013602733612060547, 0.015680313110351562, 0.017757892608642578, 0.019835472106933594, 0.02191305160522461, 0.023990631103515625, 0.02606821060180664, 0.028145790100097656, 0.030223369598388672, 0.03230094909667969, 0.0343785285949707, 0.03645610809326172, 0.038533687591552734, 0.04061126708984375, 0.042688846588134766, 0.04476642608642578, 0.0468440055847168, 0.04892158508300781, 0.05099916458129883, 0.053076744079589844, 0.05515432357788086, 0.057231903076171875, 0.05930948257446289, 0.061387062072753906, 0.06346464157104492, 0.06554222106933594, 0.06761980056762695, 0.06969738006591797, 0.07177495956420898, 0.0738525390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 5.0, 4.0, 5.0, 4.0, 4.0, 10.0, 10.0, 22.0, 13.0, 42.0, 47.0, 125.0, 359.0, 178.0, 66.0, 28.0, 21.0, 14.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.390146255493164e-05, -2.329796552658081e-05, -2.269446849822998e-05, -2.209097146987915e-05, -2.148747444152832e-05, -2.088397741317749e-05, -2.028048038482666e-05, -1.967698335647583e-05, -1.9073486328125e-05, -1.846998929977417e-05, -1.786649227142334e-05, -1.726299524307251e-05, -1.665949821472168e-05, -1.605600118637085e-05, -1.545250415802002e-05, -1.484900712966919e-05, -1.424551010131836e-05, -1.364201307296753e-05, -1.30385160446167e-05, -1.2435019016265869e-05, -1.1831521987915039e-05, -1.1228024959564209e-05, -1.0624527931213379e-05, -1.0021030902862549e-05, -9.417533874511719e-06, -8.814036846160889e-06, -8.210539817810059e-06, -7.6070427894592285e-06, -7.0035457611083984e-06, -6.400048732757568e-06, -5.796551704406738e-06, -5.193054676055908e-06, -4.589557647705078e-06, -3.986060619354248e-06, -3.382563591003418e-06, -2.779066562652588e-06, -2.175569534301758e-06, -1.5720725059509277e-06, -9.685754776000977e-07, -3.650784492492676e-07, 2.384185791015625e-07, 8.419156074523926e-07, 1.4454126358032227e-06, 2.0489096641540527e-06, 2.652406692504883e-06, 3.255903720855713e-06, 3.859400749206543e-06, 4.462897777557373e-06, 5.066394805908203e-06, 5.669891834259033e-06, 6.273388862609863e-06, 6.876885890960693e-06, 7.4803829193115234e-06, 8.083879947662354e-06, 8.687376976013184e-06, 9.290874004364014e-06, 9.894371032714844e-06, 1.0497868061065674e-05, 1.1101365089416504e-05, 1.1704862117767334e-05, 1.2308359146118164e-05, 1.2911856174468994e-05, 1.3515353202819824e-05, 1.4118850231170654e-05, 1.4722347259521484e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 7.0, 7.0, 6.0, 19.0, 24.0, 41.0, 114.0, 250.0, 661.0, 2018.0, 7885.0, 50026.0, 937396.0, 40433.0, 6830.0, 1742.0, 603.0, 249.0, 111.0, 58.0, 30.0, 21.0, 11.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06549072265625, -0.0633401870727539, -0.06118965148925781, -0.05903911590576172, -0.056888580322265625, -0.05473804473876953, -0.05258750915527344, -0.050436973571777344, -0.04828643798828125, -0.046135902404785156, -0.04398536682128906, -0.04183483123779297, -0.039684295654296875, -0.03753376007080078, -0.03538322448730469, -0.033232688903808594, -0.0310821533203125, -0.028931617736816406, -0.026781082153320312, -0.02463054656982422, -0.022480010986328125, -0.02032947540283203, -0.018178939819335938, -0.016028404235839844, -0.01387786865234375, -0.011727333068847656, -0.009576797485351562, -0.007426261901855469, -0.005275726318359375, -0.0031251907348632812, -0.0009746551513671875, 0.0011758804321289062, 0.003326416015625, 0.005476951599121094, 0.0076274871826171875, 0.009778022766113281, 0.011928558349609375, 0.014079093933105469, 0.016229629516601562, 0.018380165100097656, 0.02053070068359375, 0.022681236267089844, 0.024831771850585938, 0.02698230743408203, 0.029132843017578125, 0.03128337860107422, 0.03343391418457031, 0.035584449768066406, 0.0377349853515625, 0.039885520935058594, 0.04203605651855469, 0.04418659210205078, 0.046337127685546875, 0.04848766326904297, 0.05063819885253906, 0.052788734436035156, 0.05493927001953125, 0.057089805603027344, 0.05924034118652344, 0.06139087677001953, 0.06354141235351562, 0.06569194793701172, 0.06784248352050781, 0.0699930191040039, 0.0721435546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 5.0, 7.0, 12.0, 10.0, 14.0, 23.0, 15.0, 29.0, 52.0, 61.0, 84.0, 98.0, 98.0, 98.0, 79.0, 64.0, 42.0, 41.0, 34.0, 15.0, 13.0, 15.0, 11.0, 12.0, 8.0, 9.0, 3.0, 3.0, 5.0, 2.0, 3.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00933074951171875, -0.00901484489440918, -0.00869894027709961, -0.008383035659790039, -0.008067131042480469, -0.0077512264251708984, -0.007435321807861328, -0.007119417190551758, -0.0068035125732421875, -0.006487607955932617, -0.006171703338623047, -0.0058557987213134766, -0.005539894104003906, -0.005223989486694336, -0.004908084869384766, -0.004592180252075195, -0.004276275634765625, -0.003960371017456055, -0.0036444664001464844, -0.003328561782836914, -0.0030126571655273438, -0.0026967525482177734, -0.002380847930908203, -0.002064943313598633, -0.0017490386962890625, -0.0014331340789794922, -0.0011172294616699219, -0.0008013248443603516, -0.00048542022705078125, -0.00016951560974121094, 0.00014638900756835938, 0.0004622936248779297, 0.0007781982421875, 0.0010941028594970703, 0.0014100074768066406, 0.001725912094116211, 0.0020418167114257812, 0.0023577213287353516, 0.002673625946044922, 0.002989530563354492, 0.0033054351806640625, 0.003621339797973633, 0.003937244415283203, 0.0042531490325927734, 0.004569053649902344, 0.004884958267211914, 0.005200862884521484, 0.005516767501831055, 0.005832672119140625, 0.006148576736450195, 0.006464481353759766, 0.006780385971069336, 0.007096290588378906, 0.0074121952056884766, 0.007728099822998047, 0.008044004440307617, 0.008359909057617188, 0.008675813674926758, 0.008991718292236328, 0.009307622909545898, 0.009623527526855469, 0.009939432144165039, 0.01025533676147461, 0.01057124137878418, 0.01088714599609375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [90.0, 928.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3648928701877594, -0.05512690544128418, 0.25463905930519104, 0.564405083656311, 0.8741710186004639, 1.1839369535446167, 1.493703007698059, 1.8034688234329224, 2.113234758377075, 2.4230008125305176, 2.732766628265381, 3.0425326824188232, 3.3522987365722656, 3.662064552307129, 3.9718306064605713, 4.2815961837768555, 4.591362476348877, 4.90112829208374, 5.210894584655762, 5.520660400390625, 5.830426216125488, 6.140192031860352, 6.449958324432373, 6.759724140167236, 7.069490432739258, 7.379256248474121, 7.689022541046143, 7.998788356781006, 8.308554649353027, 8.61832046508789, 8.928086280822754, 9.237852096557617, 9.54761791229248, 9.857383728027344, 10.167149543762207, 10.47691535949707, 10.78668212890625, 11.096447944641113, 11.406213760375977, 11.71597957611084, 12.025745391845703, 12.335511207580566, 12.64527702331543, 12.95504379272461, 13.264809608459473, 13.574575424194336, 13.8843412399292, 14.194107055664062, 14.503873825073242, 14.813639640808105, 15.123405456542969, 15.433172225952148, 15.742938041687012, 16.052703857421875, 16.362468719482422, 16.6722354888916, 16.98200035095215, 17.291767120361328, 17.601531982421875, 17.911298751831055, 18.2210636138916, 18.53083038330078, 18.840595245361328, 19.150362014770508, 19.460128784179688]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 13.0, 25.0, 12.0, 24.0, 34.0, 37.0, 38.0, 46.0, 65.0, 63.0, 69.0, 74.0, 76.0, 79.0, 55.0, 58.0, 50.0, 29.0, 33.0, 36.0, 24.0, 15.0, 12.0, 11.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.687242031097412, -4.586300849914551, -4.485360145568848, -4.384418964385986, -4.283477783203125, -4.182537078857422, -4.0815958976745605, -3.980654716491699, -3.879713773727417, -3.7787728309631348, -3.6778316497802734, -3.576890707015991, -3.47594952583313, -3.3750085830688477, -3.2740674018859863, -3.173126459121704, -3.072185516357422, -2.9712445735931396, -2.8703033924102783, -2.769362449645996, -2.6684212684631348, -2.5674803256988525, -2.4665393829345703, -2.365598201751709, -2.2646570205688477, -2.1637160778045654, -2.062774896621704, -1.9618339538574219, -1.86089289188385, -1.7599518299102783, -1.6590107679367065, -1.5580697059631348, -1.457128882408142, -1.3561878204345703, -1.2552467584609985, -1.1543056964874268, -1.0533647537231445, -0.9524236917495728, -0.851482629776001, -0.750541627407074, -0.6496005654335022, -0.5486595034599304, -0.4477185010910034, -0.34677743911743164, -0.24583640694618225, -0.14489537477493286, -0.043954312801361084, 0.05698668956756592, 0.1579277515411377, 0.2588687837123871, 0.3598098158836365, 0.46075087785720825, 0.5616918802261353, 0.662632942199707, 0.7635740041732788, 0.8645150065422058, 0.9654560685157776, 1.0663970708847046, 1.1673381328582764, 1.2682791948318481, 1.36922025680542, 1.4701611995697021, 1.5711023807525635, 1.6720433235168457, 1.7729843854904175]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 4.0, 15.0, 16.0, 14.0, 27.0, 26.0, 37.0, 70.0, 84.0, 203.0, 1583.0, 4181192.0, 10321.0, 344.0, 103.0, 57.0, 48.0, 35.0, 30.0, 24.0, 17.0, 11.0, 8.0, 4.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0], "bins": [-2.923828125, -2.8598785400390625, -2.795928955078125, -2.7319793701171875, -2.66802978515625, -2.6040802001953125, -2.540130615234375, -2.4761810302734375, -2.4122314453125, -2.3482818603515625, -2.284332275390625, -2.2203826904296875, -2.15643310546875, -2.0924835205078125, -2.028533935546875, -1.9645843505859375, -1.900634765625, -1.8366851806640625, -1.772735595703125, -1.7087860107421875, -1.64483642578125, -1.5808868408203125, -1.516937255859375, -1.4529876708984375, -1.3890380859375, -1.3250885009765625, -1.261138916015625, -1.1971893310546875, -1.13323974609375, -1.0692901611328125, -1.005340576171875, -0.9413909912109375, -0.87744140625, -0.8134918212890625, -0.749542236328125, -0.6855926513671875, -0.62164306640625, -0.5576934814453125, -0.493743896484375, -0.4297943115234375, -0.3658447265625, -0.3018951416015625, -0.237945556640625, -0.1739959716796875, -0.11004638671875, -0.0460968017578125, 0.017852783203125, 0.0818023681640625, 0.145751953125, 0.2097015380859375, 0.273651123046875, 0.3376007080078125, 0.40155029296875, 0.4654998779296875, 0.529449462890625, 0.5933990478515625, 0.6573486328125, 0.7212982177734375, 0.785247802734375, 0.8491973876953125, 0.91314697265625, 0.9770965576171875, 1.041046142578125, 1.1049957275390625, 1.1689453125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 14.0, 18.0, 14.0, 24.0, 32.0, 35.0, 54.0, 59.0, 92.0, 106.0, 97.0, 109.0, 73.0, 63.0, 54.0, 41.0, 29.0, 25.0, 25.0, 12.0, 8.0, 10.0, 1.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.131103515625, -0.1282186508178711, -0.1253337860107422, -0.12244892120361328, -0.11956405639648438, -0.11667919158935547, -0.11379432678222656, -0.11090946197509766, -0.10802459716796875, -0.10513973236083984, -0.10225486755371094, -0.09937000274658203, -0.09648513793945312, -0.09360027313232422, -0.09071540832519531, -0.0878305435180664, -0.0849456787109375, -0.0820608139038086, -0.07917594909667969, -0.07629108428955078, -0.07340621948242188, -0.07052135467529297, -0.06763648986816406, -0.06475162506103516, -0.06186676025390625, -0.058981895446777344, -0.05609703063964844, -0.05321216583251953, -0.050327301025390625, -0.04744243621826172, -0.04455757141113281, -0.041672706604003906, -0.038787841796875, -0.035902976989746094, -0.03301811218261719, -0.03013324737548828, -0.027248382568359375, -0.02436351776123047, -0.021478652954101562, -0.018593788146972656, -0.01570892333984375, -0.012824058532714844, -0.009939193725585938, -0.007054328918457031, -0.004169464111328125, -0.0012845993041992188, 0.0016002655029296875, 0.004485130310058594, 0.0073699951171875, 0.010254859924316406, 0.013139724731445312, 0.01602458953857422, 0.018909454345703125, 0.02179431915283203, 0.024679183959960938, 0.027564048767089844, 0.03044891357421875, 0.033333778381347656, 0.03621864318847656, 0.03910350799560547, 0.041988372802734375, 0.04487323760986328, 0.04775810241699219, 0.050642967224121094, 0.05352783203125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 13.0, 12.0, 33.0, 58.0, 333.0, 4193654.0, 152.0, 16.0, 4.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.125, -17.76544189453125, -17.4058837890625, -17.04632568359375, -16.686767578125, -16.32720947265625, -15.9676513671875, -15.60809326171875, -15.24853515625, -14.88897705078125, -14.5294189453125, -14.16986083984375, -13.810302734375, -13.45074462890625, -13.0911865234375, -12.73162841796875, -12.3720703125, -12.01251220703125, -11.6529541015625, -11.29339599609375, -10.933837890625, -10.57427978515625, -10.2147216796875, -9.85516357421875, -9.49560546875, -9.13604736328125, -8.7764892578125, -8.41693115234375, -8.057373046875, -7.69781494140625, -7.3382568359375, -6.97869873046875, -6.619140625, -6.25958251953125, -5.9000244140625, -5.54046630859375, -5.180908203125, -4.82135009765625, -4.4617919921875, -4.10223388671875, -3.74267578125, -3.38311767578125, -3.0235595703125, -2.66400146484375, -2.304443359375, -1.94488525390625, -1.5853271484375, -1.22576904296875, -0.8662109375, -0.50665283203125, -0.1470947265625, 0.21246337890625, 0.572021484375, 0.93157958984375, 1.2911376953125, 1.65069580078125, 2.01025390625, 2.36981201171875, 2.7293701171875, 3.08892822265625, 3.448486328125, 3.80804443359375, 4.1676025390625, 4.52716064453125, 4.88671875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 10.0, 13.0, 31.0, 50.0, 217.0, 3467.0, 243.0, 28.0, 6.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.328857421875, -0.3228273391723633, -0.31679725646972656, -0.31076717376708984, -0.3047370910644531, -0.2987070083618164, -0.2926769256591797, -0.28664684295654297, -0.28061676025390625, -0.27458667755126953, -0.2685565948486328, -0.2625265121459961, -0.2564964294433594, -0.25046634674072266, -0.24443626403808594, -0.23840618133544922, -0.2323760986328125, -0.22634601593017578, -0.22031593322753906, -0.21428585052490234, -0.20825576782226562, -0.2022256851196289, -0.1961956024169922, -0.19016551971435547, -0.18413543701171875, -0.17810535430908203, -0.1720752716064453, -0.1660451889038086, -0.16001510620117188, -0.15398502349853516, -0.14795494079589844, -0.14192485809326172, -0.135894775390625, -0.12986469268798828, -0.12383460998535156, -0.11780452728271484, -0.11177444458007812, -0.1057443618774414, -0.09971427917480469, -0.09368419647216797, -0.08765411376953125, -0.08162403106689453, -0.07559394836425781, -0.0695638656616211, -0.06353378295898438, -0.057503700256347656, -0.05147361755371094, -0.04544353485107422, -0.0394134521484375, -0.03338336944580078, -0.027353286743164062, -0.021323204040527344, -0.015293121337890625, -0.009263038635253906, -0.0032329559326171875, 0.0027971267700195312, 0.00882720947265625, 0.014857292175292969, 0.020887374877929688, 0.026917457580566406, 0.032947540283203125, 0.038977622985839844, 0.04500770568847656, 0.05103778839111328, 0.05706787109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 12.0, 23.0, 73.0, 167.0, 573.0, 138.0, 15.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23265860974788666, -0.21074682474136353, -0.1888350397348404, -0.16692325472831726, -0.14501148462295532, -0.12309969216585159, -0.10118791460990906, -0.07927612960338593, -0.05736434459686279, -0.03545255959033966, -0.013540778309106827, 0.008371002972126007, 0.03028278797864914, 0.05219457298517227, 0.07410635054111481, 0.09601813554763794, 0.11792992055416107, 0.1398417055606842, 0.16175349056720734, 0.18366527557373047, 0.2055770456790924, 0.22748884558677673, 0.24940061569213867, 0.271312415599823, 0.29322418570518494, 0.3151359558105469, 0.3370477557182312, 0.35895952582359314, 0.38087132573127747, 0.4027830958366394, 0.42469489574432373, 0.44660666584968567, 0.4685184359550476, 0.49043020606040955, 0.5123419761657715, 0.5342537760734558, 0.5561655759811401, 0.5780773758888245, 0.599989116191864, 0.6219009160995483, 0.6438127160072327, 0.665724515914917, 0.6876362562179565, 0.7095480561256409, 0.7314598560333252, 0.7533716559410095, 0.7752833962440491, 0.7971951961517334, 0.819106936454773, 0.8410187363624573, 0.8629304766654968, 0.8848422765731812, 0.9067540764808655, 0.9286658763885498, 0.9505776166915894, 0.9724894165992737, 0.994401216506958, 1.0163129568099976, 1.0382248163223267, 1.0601365566253662, 1.0820482969284058, 1.1039601564407349, 1.1258718967437744, 1.1477837562561035, 1.169695496559143]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 14.0, 21.0, 12.0, 15.0, 16.0, 26.0, 35.0, 33.0, 54.0, 47.0, 49.0, 50.0, 58.0, 58.0, 50.0, 59.0, 44.0, 48.0, 48.0, 40.0, 38.0, 39.0, 23.0, 16.0, 21.0, 17.0, 18.0, 6.0, 13.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10183397680521011, -0.09831398725509644, -0.09479399025440216, -0.09127400070428848, -0.0877540111541748, -0.08423401415348053, -0.08071402460336685, -0.07719403505325317, -0.0736740380525589, -0.07015404850244522, -0.06663405150175095, -0.06311406195163727, -0.05959407240152359, -0.056074079126119614, -0.05255408585071564, -0.04903409630060196, -0.04551410675048828, -0.041994113475084305, -0.03847412392497063, -0.03495413064956665, -0.03143414109945297, -0.027914147824048996, -0.02439415454864502, -0.020874163135886192, -0.017354171723127365, -0.013834180310368538, -0.010314187966287136, -0.006794195622205734, -0.003274204209446907, 0.00024578720331192017, 0.0037657804787158966, 0.007285771891474724, 0.010805770754814148, 0.014325762167572975, 0.017845753580331802, 0.02136574685573578, 0.024885738268494606, 0.028405729681253433, 0.03192572295665741, 0.03544571250677109, 0.038965705782175064, 0.04248569905757904, 0.04600568860769272, 0.049525681883096695, 0.05304567515850067, 0.05656566470861435, 0.060085657984018326, 0.0636056512594223, 0.06712564080953598, 0.07064563035964966, 0.07416562736034393, 0.07768561691045761, 0.08120560646057129, 0.08472560346126556, 0.08824559301137924, 0.09176558256149292, 0.0952855795621872, 0.09880556911230087, 0.10232556611299515, 0.10584555566310883, 0.1093655452132225, 0.11288553476333618, 0.11640553176403046, 0.11992552131414413, 0.12344551086425781]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 9.0, 8.0, 12.0, 22.0, 33.0, 51.0, 91.0, 126.0, 247.0, 538.0, 1359.0, 4317.0, 24539.0, 788804.0, 210826.0, 12827.0, 2755.0, 1014.0, 467.0, 209.0, 113.0, 68.0, 37.0, 22.0, 20.0, 6.0, 10.0, 8.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05682373046875, -0.0551447868347168, -0.053465843200683594, -0.05178689956665039, -0.05010795593261719, -0.048429012298583984, -0.04675006866455078, -0.04507112503051758, -0.043392181396484375, -0.04171323776245117, -0.04003429412841797, -0.038355350494384766, -0.03667640686035156, -0.03499746322631836, -0.033318519592285156, -0.03163957595825195, -0.02996063232421875, -0.028281688690185547, -0.026602745056152344, -0.02492380142211914, -0.023244857788085938, -0.021565914154052734, -0.01988697052001953, -0.018208026885986328, -0.016529083251953125, -0.014850139617919922, -0.013171195983886719, -0.011492252349853516, -0.009813308715820312, -0.00813436508178711, -0.006455421447753906, -0.004776477813720703, -0.0030975341796875, -0.0014185905456542969, 0.00026035308837890625, 0.0019392967224121094, 0.0036182403564453125, 0.005297183990478516, 0.006976127624511719, 0.008655071258544922, 0.010334014892578125, 0.012012958526611328, 0.013691902160644531, 0.015370845794677734, 0.017049789428710938, 0.01872873306274414, 0.020407676696777344, 0.022086620330810547, 0.02376556396484375, 0.025444507598876953, 0.027123451232910156, 0.02880239486694336, 0.030481338500976562, 0.032160282135009766, 0.03383922576904297, 0.03551816940307617, 0.037197113037109375, 0.03887605667114258, 0.04055500030517578, 0.042233943939208984, 0.04391288757324219, 0.04559183120727539, 0.047270774841308594, 0.0489497184753418, 0.050628662109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 3.0, 5.0, 12.0, 18.0, 22.0, 26.0, 41.0, 45.0, 72.0, 82.0, 99.0, 103.0, 124.0, 71.0, 60.0, 55.0, 48.0, 26.0, 23.0, 17.0, 19.0, 4.0, 8.0, 5.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10528564453125, -0.10175323486328125, -0.0982208251953125, -0.09468841552734375, -0.091156005859375, -0.08762359619140625, -0.0840911865234375, -0.08055877685546875, -0.0770263671875, -0.07349395751953125, -0.0699615478515625, -0.06642913818359375, -0.062896728515625, -0.05936431884765625, -0.0558319091796875, -0.05229949951171875, -0.04876708984375, -0.04523468017578125, -0.0417022705078125, -0.03816986083984375, -0.034637451171875, -0.03110504150390625, -0.0275726318359375, -0.02404022216796875, -0.0205078125, -0.01697540283203125, -0.0134429931640625, -0.00991058349609375, -0.006378173828125, -0.00284576416015625, 0.0006866455078125, 0.00421905517578125, 0.00775146484375, 0.01128387451171875, 0.0148162841796875, 0.01834869384765625, 0.021881103515625, 0.02541351318359375, 0.0289459228515625, 0.03247833251953125, 0.0360107421875, 0.03954315185546875, 0.0430755615234375, 0.04660797119140625, 0.050140380859375, 0.05367279052734375, 0.0572052001953125, 0.06073760986328125, 0.06427001953125, 0.06780242919921875, 0.0713348388671875, 0.07486724853515625, 0.078399658203125, 0.08193206787109375, 0.0854644775390625, 0.08899688720703125, 0.092529296875, 0.09606170654296875, 0.0995941162109375, 0.10312652587890625, 0.106658935546875, 0.11019134521484375, 0.1137237548828125, 0.11725616455078125, 0.12078857421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 6.0, 7.0, 8.0, 12.0, 17.0, 23.0, 27.0, 40.0, 73.0, 108.0, 151.0, 239.0, 347.0, 614.0, 939.0, 1814.0, 3185.0, 6321.0, 13138.0, 29921.0, 79249.0, 281449.0, 441380.0, 114846.0, 40151.0, 17177.0, 8018.0, 4019.0, 2112.0, 1275.0, 694.0, 400.0, 255.0, 157.0, 111.0, 85.0, 60.0, 43.0, 25.0, 11.0, 12.0, 13.0, 7.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01125335693359375, -0.010903477668762207, -0.010553598403930664, -0.010203719139099121, -0.009853839874267578, -0.009503960609436035, -0.009154081344604492, -0.00880420207977295, -0.008454322814941406, -0.008104443550109863, -0.00775456428527832, -0.007404685020446777, -0.007054805755615234, -0.006704926490783691, -0.0063550472259521484, -0.0060051679611206055, -0.0056552886962890625, -0.0053054094314575195, -0.0049555301666259766, -0.004605650901794434, -0.004255771636962891, -0.0039058923721313477, -0.0035560131072998047, -0.0032061338424682617, -0.0028562545776367188, -0.0025063753128051758, -0.002156496047973633, -0.0018066167831420898, -0.0014567375183105469, -0.001106858253479004, -0.0007569789886474609, -0.00040709972381591797, -5.7220458984375e-05, 0.00029265880584716797, 0.0006425380706787109, 0.000992417335510254, 0.0013422966003417969, 0.0016921758651733398, 0.002042055130004883, 0.0023919343948364258, 0.0027418136596679688, 0.0030916929244995117, 0.0034415721893310547, 0.0037914514541625977, 0.004141330718994141, 0.004491209983825684, 0.0048410892486572266, 0.0051909685134887695, 0.0055408477783203125, 0.0058907270431518555, 0.0062406063079833984, 0.006590485572814941, 0.006940364837646484, 0.007290244102478027, 0.00764012336730957, 0.007990002632141113, 0.008339881896972656, 0.0086897611618042, 0.009039640426635742, 0.009389519691467285, 0.009739398956298828, 0.010089278221130371, 0.010439157485961914, 0.010789036750793457, 0.011138916015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 7.0, 12.0, 6.0, 9.0, 13.0, 29.0, 30.0, 49.0, 47.0, 56.0, 74.0, 65.0, 77.0, 80.0, 82.0, 56.0, 69.0, 48.0, 43.0, 32.0, 24.0, 27.0, 11.0, 18.0, 10.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1475830078125, -0.14194488525390625, -0.1363067626953125, -0.13066864013671875, -0.125030517578125, -0.11939239501953125, -0.1137542724609375, -0.10811614990234375, -0.10247802734375, -0.09683990478515625, -0.0912017822265625, -0.08556365966796875, -0.079925537109375, -0.07428741455078125, -0.0686492919921875, -0.06301116943359375, -0.057373046875, -0.05173492431640625, -0.0460968017578125, -0.04045867919921875, -0.034820556640625, -0.02918243408203125, -0.0235443115234375, -0.01790618896484375, -0.01226806640625, -0.00662994384765625, -0.0009918212890625, 0.00464630126953125, 0.010284423828125, 0.01592254638671875, 0.0215606689453125, 0.02719879150390625, 0.0328369140625, 0.03847503662109375, 0.0441131591796875, 0.04975128173828125, 0.055389404296875, 0.06102752685546875, 0.0666656494140625, 0.07230377197265625, 0.07794189453125, 0.08358001708984375, 0.0892181396484375, 0.09485626220703125, 0.100494384765625, 0.10613250732421875, 0.1117706298828125, 0.11740875244140625, 0.123046875, 0.12868499755859375, 0.1343231201171875, 0.13996124267578125, 0.145599365234375, 0.15123748779296875, 0.1568756103515625, 0.16251373291015625, 0.16815185546875, 0.17378997802734375, 0.1794281005859375, 0.18506622314453125, 0.190704345703125, 0.19634246826171875, 0.2019805908203125, 0.20761871337890625, 0.2132568359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 7.0, 9.0, 10.0, 16.0, 13.0, 5.0, 23.0, 43.0, 51.0, 108.0, 126.0, 223.0, 368.0, 692.0, 1331.0, 2547.0, 5487.0, 13558.0, 39243.0, 231131.0, 664213.0, 56537.0, 18098.0, 7359.0, 3383.0, 1706.0, 900.0, 544.0, 301.0, 177.0, 115.0, 70.0, 46.0, 22.0, 13.0, 16.0, 13.0, 13.0, 8.0, 7.0, 6.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0029144287109375, -0.002826482057571411, -0.0027385354042053223, -0.0026505887508392334, -0.0025626420974731445, -0.0024746954441070557, -0.002386748790740967, -0.002298802137374878, -0.002210855484008789, -0.0021229088306427, -0.0020349621772766113, -0.0019470155239105225, -0.0018590688705444336, -0.0017711222171783447, -0.0016831755638122559, -0.001595228910446167, -0.0015072822570800781, -0.0014193356037139893, -0.0013313889503479004, -0.0012434422969818115, -0.0011554956436157227, -0.0010675489902496338, -0.000979602336883545, -0.0008916556835174561, -0.0008037090301513672, -0.0007157623767852783, -0.0006278157234191895, -0.0005398690700531006, -0.0004519224166870117, -0.00036397576332092285, -0.000276029109954834, -0.00018808245658874512, -0.00010013580322265625, -1.2189149856567383e-05, 7.575750350952148e-05, 0.00016370415687561035, 0.0002516508102416992, 0.0003395974636077881, 0.00042754411697387695, 0.0005154907703399658, 0.0006034374237060547, 0.0006913840770721436, 0.0007793307304382324, 0.0008672773838043213, 0.0009552240371704102, 0.001043170690536499, 0.0011311173439025879, 0.0012190639972686768, 0.0013070106506347656, 0.0013949573040008545, 0.0014829039573669434, 0.0015708506107330322, 0.001658797264099121, 0.00174674391746521, 0.0018346905708312988, 0.0019226372241973877, 0.0020105838775634766, 0.0020985305309295654, 0.0021864771842956543, 0.002274423837661743, 0.002362370491027832, 0.002450317144393921, 0.0025382637977600098, 0.0026262104511260986, 0.0027141571044921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 0.0, 6.0, 3.0, 9.0, 4.0, 20.0, 17.0, 28.0, 27.0, 32.0, 115.0, 199.0, 273.0, 97.0, 55.0, 37.0, 18.0, 18.0, 12.0, 5.0, 5.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.079673767089844e-06, -5.877576768398285e-06, -5.675479769706726e-06, -5.473382771015167e-06, -5.271285772323608e-06, -5.0691887736320496e-06, -4.867091774940491e-06, -4.664994776248932e-06, -4.462897777557373e-06, -4.260800778865814e-06, -4.058703780174255e-06, -3.8566067814826965e-06, -3.6545097827911377e-06, -3.452412784099579e-06, -3.25031578540802e-06, -3.048218786716461e-06, -2.8461217880249023e-06, -2.6440247893333435e-06, -2.4419277906417847e-06, -2.239830791950226e-06, -2.037733793258667e-06, -1.8356367945671082e-06, -1.6335397958755493e-06, -1.4314427971839905e-06, -1.2293457984924316e-06, -1.0272487998008728e-06, -8.25151801109314e-07, -6.230548024177551e-07, -4.209578037261963e-07, -2.1886080503463745e-07, -1.6763806343078613e-08, 1.8533319234848022e-07, 3.8743019104003906e-07, 5.895271897315979e-07, 7.916241884231567e-07, 9.937211871147156e-07, 1.1958181858062744e-06, 1.3979151844978333e-06, 1.600012183189392e-06, 1.802109181880951e-06, 2.0042061805725098e-06, 2.2063031792640686e-06, 2.4084001779556274e-06, 2.6104971766471863e-06, 2.812594175338745e-06, 3.014691174030304e-06, 3.216788172721863e-06, 3.4188851714134216e-06, 3.6209821701049805e-06, 3.823079168796539e-06, 4.025176167488098e-06, 4.227273166179657e-06, 4.429370164871216e-06, 4.631467163562775e-06, 4.8335641622543335e-06, 5.035661160945892e-06, 5.237758159637451e-06, 5.43985515832901e-06, 5.641952157020569e-06, 5.844049155712128e-06, 6.0461461544036865e-06, 6.248243153095245e-06, 6.450340151786804e-06, 6.652437150478363e-06, 6.854534149169922e-06]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 4.0, 4.0, 5.0, 2.0, 11.0, 15.0, 12.0, 15.0, 13.0, 23.0, 34.0, 74.0, 309.0, 1994.0, 27163.0, 988309.0, 28024.0, 2012.0, 310.0, 72.0, 41.0, 18.0, 14.0, 19.0, 8.0, 8.0, 8.0, 6.0, 3.0, 6.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00936126708984375, -0.009032845497131348, -0.008704423904418945, -0.008376002311706543, -0.00804758071899414, -0.007719159126281738, -0.007390737533569336, -0.007062315940856934, -0.006733894348144531, -0.006405472755432129, -0.0060770511627197266, -0.005748629570007324, -0.005420207977294922, -0.0050917863845825195, -0.004763364791870117, -0.004434943199157715, -0.0041065216064453125, -0.00377810001373291, -0.003449678421020508, -0.0031212568283081055, -0.002792835235595703, -0.0024644136428833008, -0.0021359920501708984, -0.001807570457458496, -0.0014791488647460938, -0.0011507272720336914, -0.0008223056793212891, -0.0004938840866088867, -0.00016546249389648438, 0.00016295909881591797, 0.0004913806915283203, 0.0008198022842407227, 0.001148223876953125, 0.0014766454696655273, 0.0018050670623779297, 0.002133488655090332, 0.0024619102478027344, 0.0027903318405151367, 0.003118753433227539, 0.0034471750259399414, 0.0037755966186523438, 0.004104018211364746, 0.0044324398040771484, 0.004760861396789551, 0.005089282989501953, 0.0054177045822143555, 0.005746126174926758, 0.00607454776763916, 0.0064029693603515625, 0.006731390953063965, 0.007059812545776367, 0.0073882341384887695, 0.007716655731201172, 0.008045077323913574, 0.008373498916625977, 0.008701920509338379, 0.009030342102050781, 0.009358763694763184, 0.009687185287475586, 0.010015606880187988, 0.01034402847290039, 0.010672450065612793, 0.011000871658325195, 0.011329293251037598, 0.01165771484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 2.0, 4.0, 4.0, 10.0, 11.0, 10.0, 20.0, 12.0, 17.0, 22.0, 37.0, 38.0, 36.0, 81.0, 146.0, 180.0, 95.0, 58.0, 42.0, 26.0, 33.0, 22.0, 14.0, 9.0, 12.0, 14.0, 10.0, 4.0, 4.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006313323974609375, -0.0006097406148910522, -0.000588148832321167, -0.0005665570497512817, -0.0005449652671813965, -0.0005233734846115112, -0.000501781702041626, -0.0004801899194717407, -0.00045859813690185547, -0.0004370063543319702, -0.00041541457176208496, -0.0003938227891921997, -0.00037223100662231445, -0.0003506392240524292, -0.00032904744148254395, -0.0003074556589126587, -0.00028586387634277344, -0.0002642720937728882, -0.00024268031120300293, -0.00022108852863311768, -0.00019949674606323242, -0.00017790496349334717, -0.00015631318092346191, -0.00013472139835357666, -0.0001131296157836914, -9.153783321380615e-05, -6.99460506439209e-05, -4.8354268074035645e-05, -2.676248550415039e-05, -5.170702934265137e-06, 1.6421079635620117e-05, 3.801286220550537e-05, 5.9604644775390625e-05, 8.119642734527588e-05, 0.00010278820991516113, 0.0001243799924850464, 0.00014597177505493164, 0.0001675635576248169, 0.00018915534019470215, 0.0002107471227645874, 0.00023233890533447266, 0.0002539306879043579, 0.00027552247047424316, 0.0002971142530441284, 0.00031870603561401367, 0.0003402978181838989, 0.0003618896007537842, 0.00038348138332366943, 0.0004050731658935547, 0.00042666494846343994, 0.0004482567310333252, 0.00046984851360321045, 0.0004914402961730957, 0.000513032078742981, 0.0005346238613128662, 0.0005562156438827515, 0.0005778074264526367, 0.000599399209022522, 0.0006209909915924072, 0.0006425827741622925, 0.0006641745567321777, 0.000685766339302063, 0.0007073581218719482, 0.0007289499044418335, 0.0007505416870117188]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [14.0, 1004.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1524183303117752, -0.060393884778022766, 0.031630560755729675, 0.12365500628948212, 0.21567945182323456, 0.3077039122581482, 0.39972835779190063, 0.4917528033256531, 0.5837772488594055, 0.675801694393158, 0.7678261399269104, 0.8598505854606628, 0.9518750309944153, 1.0438995361328125, 1.1359238624572754, 1.2279484272003174, 1.3199727535247803, 1.4119971990585327, 1.5040216445922852, 1.5960460901260376, 1.68807053565979, 1.7800949811935425, 1.872119426727295, 1.9641438722610474, 2.0561683177948, 2.148192882537842, 2.2402172088623047, 2.3322415351867676, 2.4242660999298096, 2.5162906646728516, 2.6083149909973145, 2.7003393173217773, 2.7923641204833984, 2.8843884468078613, 2.9764130115509033, 3.0684375762939453, 3.160461902618408, 3.252486228942871, 3.344510793685913, 3.436535358428955, 3.528559684753418, 3.620584011077881, 3.712608575820923, 3.804633140563965, 3.8966574668884277, 3.9886817932128906, 4.080706596374512, 4.172730922698975, 4.2647552490234375, 4.3567795753479, 4.448803901672363, 4.540828704833984, 4.632853031158447, 4.72487735748291, 4.816902160644531, 4.908926486968994, 5.000950813293457, 5.09297513961792, 5.184999465942383, 5.277024269104004, 5.369048595428467, 5.46107292175293, 5.553097724914551, 5.645122051239014, 5.737146377563477]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 16.0, 31.0, 38.0, 61.0, 86.0, 100.0, 130.0, 106.0, 104.0, 96.0, 78.0, 42.0, 33.0, 30.0, 14.0, 12.0, 5.0, 7.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07409506291151047, -0.06984714418649673, -0.065599225461483, -0.06135131046175957, -0.057103391736745834, -0.0528554730117321, -0.04860755801200867, -0.044359639286994934, -0.0401117205619812, -0.03586380183696747, -0.031615883111953735, -0.0273679681122303, -0.023120049387216568, -0.018872130662202835, -0.014624213799834251, -0.010376296937465668, -0.006128378212451935, -0.0018804604187607765, 0.0023674573749303818, 0.00661537516862154, 0.010863292962312698, 0.015111211687326431, 0.019359128549695015, 0.0236070454120636, 0.02785496413707733, 0.032102882862091064, 0.0363508015871048, 0.04059871658682823, 0.044846635311841965, 0.0490945540368557, 0.05334246903657913, 0.057590387761592865, 0.061838313937187195, 0.06608623266220093, 0.07033415138721466, 0.0745820701122284, 0.07882998883724213, 0.08307790756225586, 0.087325818836689, 0.09157373756170273, 0.09582165628671646, 0.1000695750117302, 0.10431749373674393, 0.10856541246175766, 0.1128133237361908, 0.11706124246120453, 0.12130916118621826, 0.125557079911232, 0.12980499863624573, 0.13405291736125946, 0.1383008360862732, 0.14254875481128693, 0.14679667353630066, 0.1510445922613144, 0.15529251098632812, 0.15954041481018066, 0.1637883484363556, 0.16803626716136932, 0.17228418588638306, 0.1765321046113968, 0.18078002333641052, 0.18502794206142426, 0.189275860786438, 0.19352376461029053, 0.19777168333530426]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 12.0, 5.0, 15.0, 10.0, 19.0, 22.0, 31.0, 48.0, 98.0, 242.0, 670.0, 2650.0, 15164.0, 208644.0, 782151.0, 32547.0, 4522.0, 1043.0, 340.0, 144.0, 58.0, 30.0, 19.0, 20.0, 9.0, 8.0, 10.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37744140625, -0.3657112121582031, -0.35398101806640625, -0.3422508239746094, -0.3305206298828125, -0.3187904357910156, -0.30706024169921875, -0.2953300476074219, -0.283599853515625, -0.2718696594238281, -0.26013946533203125, -0.24840927124023438, -0.2366790771484375, -0.22494888305664062, -0.21321868896484375, -0.20148849487304688, -0.18975830078125, -0.17802810668945312, -0.16629791259765625, -0.15456771850585938, -0.1428375244140625, -0.13110733032226562, -0.11937713623046875, -0.10764694213867188, -0.095916748046875, -0.08418655395507812, -0.07245635986328125, -0.060726165771484375, -0.0489959716796875, -0.037265777587890625, -0.02553558349609375, -0.013805389404296875, -0.0020751953125, 0.009654998779296875, 0.02138519287109375, 0.033115386962890625, 0.0448455810546875, 0.056575775146484375, 0.06830596923828125, 0.08003616333007812, 0.091766357421875, 0.10349655151367188, 0.11522674560546875, 0.12695693969726562, 0.1386871337890625, 0.15041732788085938, 0.16214752197265625, 0.17387771606445312, 0.18560791015625, 0.19733810424804688, 0.20906829833984375, 0.22079849243164062, 0.2325286865234375, 0.24425888061523438, 0.25598907470703125, 0.2677192687988281, 0.279449462890625, 0.2911796569824219, 0.30290985107421875, 0.3146400451660156, 0.3263702392578125, 0.3381004333496094, 0.34983062744140625, 0.3615608215332031, 0.373291015625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 20.0, 24.0, 35.0, 57.0, 86.0, 105.0, 159.0, 145.0, 114.0, 81.0, 54.0, 39.0, 31.0, 15.0, 10.0, 10.0, 5.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.362548828125, -0.3425407409667969, -0.32253265380859375, -0.3025245666503906, -0.2825164794921875, -0.2625083923339844, -0.24250030517578125, -0.22249221801757812, -0.202484130859375, -0.18247604370117188, -0.16246795654296875, -0.14245986938476562, -0.1224517822265625, -0.10244369506835938, -0.08243560791015625, -0.062427520751953125, -0.04241943359375, -0.022411346435546875, -0.00240325927734375, 0.017604827880859375, 0.0376129150390625, 0.057621002197265625, 0.07762908935546875, 0.09763717651367188, 0.117645263671875, 0.13765335083007812, 0.15766143798828125, 0.17766952514648438, 0.1976776123046875, 0.21768569946289062, 0.23769378662109375, 0.2577018737792969, 0.2777099609375, 0.2977180480957031, 0.31772613525390625, 0.3377342224121094, 0.3577423095703125, 0.3777503967285156, 0.39775848388671875, 0.4177665710449219, 0.437774658203125, 0.4577827453613281, 0.47779083251953125, 0.4977989196777344, 0.5178070068359375, 0.5378150939941406, 0.5578231811523438, 0.5778312683105469, 0.59783935546875, 0.6178474426269531, 0.6378555297851562, 0.6578636169433594, 0.6778717041015625, 0.6978797912597656, 0.7178878784179688, 0.7378959655761719, 0.757904052734375, 0.7779121398925781, 0.7979202270507812, 0.8179283142089844, 0.8379364013671875, 0.8579444885253906, 0.8779525756835938, 0.8979606628417969, 0.91796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 3.0, 3.0, 4.0, 4.0, 8.0, 10.0, 10.0, 5.0, 12.0, 23.0, 21.0, 29.0, 30.0, 32.0, 32.0, 46.0, 41.0, 47.0, 43.0, 413.0, 1034530.0, 12754.0, 67.0, 48.0, 41.0, 39.0, 46.0, 26.0, 28.0, 23.0, 20.0, 29.0, 17.0, 18.0, 10.0, 9.0, 13.0, 7.0, 5.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.0712890625, -1.035247802734375, -0.99920654296875, -0.963165283203125, -0.9271240234375, -0.891082763671875, -0.85504150390625, -0.819000244140625, -0.782958984375, -0.746917724609375, -0.71087646484375, -0.674835205078125, -0.6387939453125, -0.602752685546875, -0.56671142578125, -0.530670166015625, -0.49462890625, -0.458587646484375, -0.42254638671875, -0.386505126953125, -0.3504638671875, -0.314422607421875, -0.27838134765625, -0.242340087890625, -0.206298828125, -0.170257568359375, -0.13421630859375, -0.098175048828125, -0.0621337890625, -0.026092529296875, 0.00994873046875, 0.045989990234375, 0.08203125, 0.118072509765625, 0.15411376953125, 0.190155029296875, 0.2261962890625, 0.262237548828125, 0.29827880859375, 0.334320068359375, 0.370361328125, 0.406402587890625, 0.44244384765625, 0.478485107421875, 0.5145263671875, 0.550567626953125, 0.58660888671875, 0.622650146484375, 0.65869140625, 0.694732666015625, 0.73077392578125, 0.766815185546875, 0.8028564453125, 0.838897705078125, 0.87493896484375, 0.910980224609375, 0.947021484375, 0.983062744140625, 1.01910400390625, 1.055145263671875, 1.0911865234375, 1.127227783203125, 1.16326904296875, 1.199310302734375, 1.2353515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 9.0, 10.0, 3.0, 16.0, 21.0, 21.0, 33.0, 29.0, 36.0, 32.0, 48.0, 46.0, 42.0, 46.0, 50.0, 50.0, 67.0, 50.0, 42.0, 39.0, 37.0, 51.0, 26.0, 25.0, 19.0, 25.0, 24.0, 19.0, 15.0, 9.0, 11.0, 11.0, 8.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.282958984375, -0.2733650207519531, -0.26377105712890625, -0.2541770935058594, -0.2445831298828125, -0.23498916625976562, -0.22539520263671875, -0.21580123901367188, -0.206207275390625, -0.19661331176757812, -0.18701934814453125, -0.17742538452148438, -0.1678314208984375, -0.15823745727539062, -0.14864349365234375, -0.13904953002929688, -0.12945556640625, -0.11986160278320312, -0.11026763916015625, -0.10067367553710938, -0.0910797119140625, -0.08148574829101562, -0.07189178466796875, -0.062297821044921875, -0.052703857421875, -0.043109893798828125, -0.03351593017578125, -0.023921966552734375, -0.0143280029296875, -0.004734039306640625, 0.00485992431640625, 0.014453887939453125, 0.0240478515625, 0.033641815185546875, 0.04323577880859375, 0.052829742431640625, 0.0624237060546875, 0.07201766967773438, 0.08161163330078125, 0.09120559692382812, 0.100799560546875, 0.11039352416992188, 0.11998748779296875, 0.12958145141601562, 0.1391754150390625, 0.14876937866210938, 0.15836334228515625, 0.16795730590820312, 0.17755126953125, 0.18714523315429688, 0.19673919677734375, 0.20633316040039062, 0.2159271240234375, 0.22552108764648438, 0.23511505126953125, 0.24470901489257812, 0.254302978515625, 0.2638969421386719, 0.27349090576171875, 0.2830848693847656, 0.2926788330078125, 0.3022727966308594, 0.31186676025390625, 0.3214607238769531, 0.3310546875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 5.0, 4.0, 8.0, 8.0, 5.0, 14.0, 23.0, 39.0, 69.0, 135.0, 231.0, 463.0, 966.0, 2518.0, 6988.0, 28169.0, 958501.0, 37365.0, 8182.0, 2669.0, 1103.0, 502.0, 239.0, 150.0, 75.0, 44.0, 27.0, 14.0, 10.0, 5.0, 6.0, 8.0, 4.0, 0.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0113372802734375, -0.010856151580810547, -0.010375022888183594, -0.00989389419555664, -0.009412765502929688, -0.008931636810302734, -0.008450508117675781, -0.007969379425048828, -0.007488250732421875, -0.007007122039794922, -0.006525993347167969, -0.006044864654541016, -0.0055637359619140625, -0.005082607269287109, -0.004601478576660156, -0.004120349884033203, -0.00363922119140625, -0.003158092498779297, -0.0026769638061523438, -0.0021958351135253906, -0.0017147064208984375, -0.0012335777282714844, -0.0007524490356445312, -0.0002713203430175781, 0.000209808349609375, 0.0006909370422363281, 0.0011720657348632812, 0.0016531944274902344, 0.0021343231201171875, 0.0026154518127441406, 0.0030965805053710938, 0.003577709197998047, 0.004058837890625, 0.004539966583251953, 0.005021095275878906, 0.005502223968505859, 0.0059833526611328125, 0.006464481353759766, 0.006945610046386719, 0.007426738739013672, 0.007907867431640625, 0.008388996124267578, 0.008870124816894531, 0.009351253509521484, 0.009832382202148438, 0.01031351089477539, 0.010794639587402344, 0.011275768280029297, 0.01175689697265625, 0.012238025665283203, 0.012719154357910156, 0.01320028305053711, 0.013681411743164062, 0.014162540435791016, 0.014643669128417969, 0.015124797821044922, 0.015605926513671875, 0.016087055206298828, 0.01656818389892578, 0.017049312591552734, 0.017530441284179688, 0.01801156997680664, 0.018492698669433594, 0.018973827362060547, 0.0194549560546875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 16.0, 8.0, 17.0, 10.0, 21.0, 31.0, 91.0, 243.0, 287.0, 129.0, 42.0, 30.0, 17.0, 11.0, 8.0, 12.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.874301910400391e-06, -3.750436007976532e-06, -3.6265701055526733e-06, -3.5027042031288147e-06, -3.378838300704956e-06, -3.2549723982810974e-06, -3.1311064958572388e-06, -3.00724059343338e-06, -2.8833746910095215e-06, -2.759508788585663e-06, -2.635642886161804e-06, -2.5117769837379456e-06, -2.387911081314087e-06, -2.2640451788902283e-06, -2.1401792764663696e-06, -2.016313374042511e-06, -1.8924474716186523e-06, -1.7685815691947937e-06, -1.644715666770935e-06, -1.5208497643470764e-06, -1.3969838619232178e-06, -1.2731179594993591e-06, -1.1492520570755005e-06, -1.0253861546516418e-06, -9.015202522277832e-07, -7.776543498039246e-07, -6.537884473800659e-07, -5.299225449562073e-07, -4.0605664253234863e-07, -2.8219074010849e-07, -1.5832483768463135e-07, -3.4458935260772705e-08, 8.940696716308594e-08, 2.1327286958694458e-07, 3.371387720108032e-07, 4.6100467443466187e-07, 5.848705768585205e-07, 7.087364792823792e-07, 8.326023817062378e-07, 9.564682841300964e-07, 1.080334186553955e-06, 1.2042000889778137e-06, 1.3280659914016724e-06, 1.451931893825531e-06, 1.5757977962493896e-06, 1.6996636986732483e-06, 1.823529601097107e-06, 1.9473955035209656e-06, 2.0712614059448242e-06, 2.195127308368683e-06, 2.3189932107925415e-06, 2.4428591132164e-06, 2.566725015640259e-06, 2.6905909180641174e-06, 2.814456820487976e-06, 2.9383227229118347e-06, 3.0621886253356934e-06, 3.186054527759552e-06, 3.3099204301834106e-06, 3.4337863326072693e-06, 3.557652235031128e-06, 3.6815181374549866e-06, 3.8053840398788452e-06, 3.929249942302704e-06, 4.0531158447265625e-06]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 11.0, 9.0, 8.0, 6.0, 12.0, 32.0, 24.0, 48.0, 67.0, 119.0, 160.0, 214.0, 273.0, 386.0, 579.0, 905.0, 1347.0, 1925.0, 3059.0, 5358.0, 10521.0, 28127.0, 863028.0, 94977.0, 17488.0, 7819.0, 4270.0, 2672.0, 1658.0, 1019.0, 665.0, 525.0, 377.0, 278.0, 174.0, 110.0, 70.0, 62.0, 53.0, 36.0, 21.0, 17.0, 16.0, 11.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.006542205810546875, -0.0063364505767822266, -0.006130695343017578, -0.00592494010925293, -0.005719184875488281, -0.005513429641723633, -0.005307674407958984, -0.005101919174194336, -0.0048961639404296875, -0.004690408706665039, -0.004484653472900391, -0.004278898239135742, -0.004073143005371094, -0.0038673877716064453, -0.003661632537841797, -0.0034558773040771484, -0.0032501220703125, -0.0030443668365478516, -0.002838611602783203, -0.0026328563690185547, -0.0024271011352539062, -0.002221345901489258, -0.0020155906677246094, -0.001809835433959961, -0.0016040802001953125, -0.001398324966430664, -0.0011925697326660156, -0.0009868144989013672, -0.0007810592651367188, -0.0005753040313720703, -0.0003695487976074219, -0.00016379356384277344, 4.1961669921875e-05, 0.00024771690368652344, 0.0004534721374511719, 0.0006592273712158203, 0.0008649826049804688, 0.0010707378387451172, 0.0012764930725097656, 0.001482248306274414, 0.0016880035400390625, 0.001893758773803711, 0.0020995140075683594, 0.002305269241333008, 0.0025110244750976562, 0.0027167797088623047, 0.002922534942626953, 0.0031282901763916016, 0.00333404541015625, 0.0035398006439208984, 0.003745555877685547, 0.003951311111450195, 0.004157066345214844, 0.004362821578979492, 0.004568576812744141, 0.004774332046508789, 0.0049800872802734375, 0.005185842514038086, 0.005391597747802734, 0.005597352981567383, 0.005803108215332031, 0.00600886344909668, 0.006214618682861328, 0.0064203739166259766, 0.006626129150390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 1.0, 2.0, 19.0, 11.0, 15.0, 27.0, 42.0, 117.0, 416.0, 163.0, 69.0, 30.0, 23.0, 14.0, 4.0, 8.0, 7.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00421142578125, -0.004096478223800659, -0.003981530666351318, -0.0038665831089019775, -0.0037516355514526367, -0.003636687994003296, -0.003521740436553955, -0.0034067928791046143, -0.0032918453216552734, -0.0031768977642059326, -0.003061950206756592, -0.002947002649307251, -0.00283205509185791, -0.0027171075344085693, -0.0026021599769592285, -0.0024872124195098877, -0.002372264862060547, -0.002257317304611206, -0.0021423697471618652, -0.0020274221897125244, -0.0019124746322631836, -0.0017975270748138428, -0.001682579517364502, -0.0015676319599151611, -0.0014526844024658203, -0.0013377368450164795, -0.0012227892875671387, -0.0011078417301177979, -0.000992894172668457, -0.0008779466152191162, -0.0007629990577697754, -0.0006480515003204346, -0.0005331039428710938, -0.00041815638542175293, -0.0003032088279724121, -0.0001882612705230713, -7.331371307373047e-05, 4.163384437561035e-05, 0.00015658140182495117, 0.000271528959274292, 0.0003864765167236328, 0.0005014240741729736, 0.0006163716316223145, 0.0007313191890716553, 0.0008462667465209961, 0.0009612143039703369, 0.0010761618614196777, 0.0011911094188690186, 0.0013060569763183594, 0.0014210045337677002, 0.001535952091217041, 0.0016508996486663818, 0.0017658472061157227, 0.0018807947635650635, 0.0019957423210144043, 0.002110689878463745, 0.002225637435913086, 0.0023405849933624268, 0.0024555325508117676, 0.0025704801082611084, 0.0026854276657104492, 0.00280037522315979, 0.002915322780609131, 0.0030302703380584717, 0.0031452178955078125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1023.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13193899393081665, 0.2849171459674835, 0.7017732858657837, 1.1186294555664062, 1.5354855060577393, 1.9523417949676514, 2.3691978454589844, 2.7860541343688965, 3.2029101848602295, 3.6197662353515625, 4.036622524261475, 4.453478813171387, 4.870334625244141, 5.287190914154053, 5.704047203063965, 6.120903015136719, 6.537759304046631, 6.954615592956543, 7.371471405029297, 7.788327693939209, 8.205183982849121, 8.622039794921875, 9.038896560668945, 9.4557523727417, 9.872608184814453, 10.289463996887207, 10.706320762634277, 11.123176574707031, 11.540032386779785, 11.956889152526855, 12.37374496459961, 12.79060173034668, 13.207457542419434, 13.624313354492188, 14.041170120239258, 14.458025932312012, 14.874881744384766, 15.291738510131836, 15.70859432220459, 16.125450134277344, 16.542306900024414, 16.959163665771484, 17.376018524169922, 17.792875289916992, 18.209732055664062, 18.6265869140625, 19.04344367980957, 19.46030044555664, 19.877155303955078, 20.29401206970215, 20.710866928100586, 21.127723693847656, 21.544580459594727, 21.961435317993164, 22.378292083740234, 22.795148849487305, 23.212005615234375, 23.628862380981445, 24.045717239379883, 24.462574005126953, 24.879430770874023, 25.29628562927246, 25.71314239501953, 26.1299991607666, 26.54685401916504]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 7.0, 9.0, 9.0, 15.0, 20.0, 22.0, 19.0, 29.0, 28.0, 44.0, 30.0, 44.0, 40.0, 52.0, 44.0, 50.0, 58.0, 55.0, 47.0, 44.0, 51.0, 42.0, 49.0, 25.0, 29.0, 24.0, 32.0, 18.0, 21.0, 10.0, 11.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3570899963378906, -0.34023866057395935, -0.3233873248100281, -0.3065359592437744, -0.28968462347984314, -0.27283328771591187, -0.2559819519519806, -0.23913061618804932, -0.22227926552295685, -0.20542792975902557, -0.1885765790939331, -0.17172524333000183, -0.15487390756607056, -0.1380225569009781, -0.12117122113704681, -0.10431987792253494, -0.08746853470802307, -0.0706171914935112, -0.05376585200428963, -0.036914512515068054, -0.020063169300556183, -0.0032118260860443115, 0.013639509677886963, 0.030490852892398834, 0.047342196106910706, 0.06419353932142258, 0.08104488253593445, 0.09789621829986572, 0.1147475615143776, 0.13159890472888947, 0.14845024049282074, 0.1653015911579132, 0.18215292692184448, 0.19900426268577576, 0.21585561335086823, 0.2327069491147995, 0.24955829977989197, 0.26640963554382324, 0.2832609713077545, 0.3001123070716858, 0.31696367263793945, 0.3338150084018707, 0.350666344165802, 0.36751770973205566, 0.38436904549598694, 0.4012203812599182, 0.4180717170238495, 0.43492305278778076, 0.45177438855171204, 0.4686257243156433, 0.4854770600795746, 0.5023283958435059, 0.5191797614097595, 0.5360311269760132, 0.5528824329376221, 0.5697337985038757, 0.5865851044654846, 0.6034364700317383, 0.6202877759933472, 0.6371391415596008, 0.6539904475212097, 0.6708418130874634, 0.6876931190490723, 0.7045444846153259, 0.7213958501815796]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 6.0, 2.0, 4.0, 12.0, 14.0, 14.0, 15.0, 28.0, 23.0, 28.0, 21.0, 25.0, 31.0, 35.0, 62.0, 160.0, 1356.0, 39520.0, 4106973.0, 44100.0, 1386.0, 124.0, 52.0, 39.0, 25.0, 31.0, 32.0, 32.0, 20.0, 29.0, 13.0, 18.0, 9.0, 9.0, 6.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2783203125, -0.2694892883300781, -0.26065826416015625, -0.2518272399902344, -0.2429962158203125, -0.23416519165039062, -0.22533416748046875, -0.21650314331054688, -0.207672119140625, -0.19884109497070312, -0.19001007080078125, -0.18117904663085938, -0.1723480224609375, -0.16351699829101562, -0.15468597412109375, -0.14585494995117188, -0.13702392578125, -0.12819290161132812, -0.11936187744140625, -0.11053085327148438, -0.1016998291015625, -0.09286880493164062, -0.08403778076171875, -0.07520675659179688, -0.066375732421875, -0.057544708251953125, -0.04871368408203125, -0.039882659912109375, -0.0310516357421875, -0.022220611572265625, -0.01338958740234375, -0.004558563232421875, 0.0042724609375, 0.013103485107421875, 0.02193450927734375, 0.030765533447265625, 0.0395965576171875, 0.048427581787109375, 0.05725860595703125, 0.06608963012695312, 0.074920654296875, 0.08375167846679688, 0.09258270263671875, 0.10141372680664062, 0.1102447509765625, 0.11907577514648438, 0.12790679931640625, 0.13673782348632812, 0.14556884765625, 0.15439987182617188, 0.16323089599609375, 0.17206192016601562, 0.1808929443359375, 0.18972396850585938, 0.19855499267578125, 0.20738601684570312, 0.216217041015625, 0.22504806518554688, 0.23387908935546875, 0.24271011352539062, 0.2515411376953125, 0.2603721618652344, 0.26920318603515625, 0.2780342102050781, 0.286865234375]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 6.0, 3.0, 7.0, 12.0, 9.0, 12.0, 12.0, 17.0, 18.0, 22.0, 32.0, 22.0, 27.0, 29.0, 41.0, 38.0, 59.0, 50.0, 63.0, 40.0, 53.0, 48.0, 54.0, 33.0, 35.0, 27.0, 25.0, 33.0, 24.0, 26.0, 29.0, 19.0, 11.0, 17.0, 7.0, 7.0, 6.0, 3.0, 3.0, 7.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006786346435546875, -0.006571173667907715, -0.006356000900268555, -0.0061408281326293945, -0.005925655364990234, -0.005710482597351074, -0.005495309829711914, -0.005280137062072754, -0.005064964294433594, -0.004849791526794434, -0.0046346187591552734, -0.004419445991516113, -0.004204273223876953, -0.003989100456237793, -0.003773927688598633, -0.0035587549209594727, -0.0033435821533203125, -0.0031284093856811523, -0.002913236618041992, -0.002698063850402832, -0.002482891082763672, -0.0022677183151245117, -0.0020525455474853516, -0.0018373727798461914, -0.0016222000122070312, -0.001407027244567871, -0.001191854476928711, -0.0009766817092895508, -0.0007615089416503906, -0.0005463361740112305, -0.0003311634063720703, -0.00011599063873291016, 9.918212890625e-05, 0.00031435489654541016, 0.0005295276641845703, 0.0007447004318237305, 0.0009598731994628906, 0.0011750459671020508, 0.001390218734741211, 0.001605391502380371, 0.0018205642700195312, 0.0020357370376586914, 0.0022509098052978516, 0.0024660825729370117, 0.002681255340576172, 0.002896428108215332, 0.003111600875854492, 0.0033267736434936523, 0.0035419464111328125, 0.0037571191787719727, 0.003972291946411133, 0.004187464714050293, 0.004402637481689453, 0.004617810249328613, 0.0048329830169677734, 0.005048155784606934, 0.005263328552246094, 0.005478501319885254, 0.005693674087524414, 0.005908846855163574, 0.006124019622802734, 0.0063391923904418945, 0.006554365158081055, 0.006769537925720215, 0.006984710693359375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 4.0, 6.0, 10.0, 19.0, 20.0, 34.0, 38.0, 80.0, 144.0, 189.0, 309.0, 1973.0, 4189897.0, 693.0, 271.0, 216.0, 124.0, 85.0, 51.0, 42.0, 20.0, 22.0, 9.0, 12.0, 10.0, 6.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56396484375, -0.5459976196289062, -0.5280303955078125, -0.5100631713867188, -0.492095947265625, -0.47412872314453125, -0.4561614990234375, -0.43819427490234375, -0.42022705078125, -0.40225982666015625, -0.3842926025390625, -0.36632537841796875, -0.348358154296875, -0.33039093017578125, -0.3124237060546875, -0.29445648193359375, -0.2764892578125, -0.25852203369140625, -0.2405548095703125, -0.22258758544921875, -0.204620361328125, -0.18665313720703125, -0.1686859130859375, -0.15071868896484375, -0.13275146484375, -0.11478424072265625, -0.0968170166015625, -0.07884979248046875, -0.060882568359375, -0.04291534423828125, -0.0249481201171875, -0.00698089599609375, 0.010986328125, 0.02895355224609375, 0.0469207763671875, 0.06488800048828125, 0.082855224609375, 0.10082244873046875, 0.1187896728515625, 0.13675689697265625, 0.15472412109375, 0.17269134521484375, 0.1906585693359375, 0.20862579345703125, 0.226593017578125, 0.24456024169921875, 0.2625274658203125, 0.28049468994140625, 0.2984619140625, 0.31642913818359375, 0.3343963623046875, 0.35236358642578125, 0.370330810546875, 0.38829803466796875, 0.4062652587890625, 0.42423248291015625, 0.44219970703125, 0.46016693115234375, 0.4781341552734375, 0.49610137939453125, 0.514068603515625, 0.5320358276367188, 0.5500030517578125, 0.5679702758789062, 0.5859375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.0, 705.0, 3328.0, 28.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2003173828125, -0.1958904266357422, -0.19146347045898438, -0.18703651428222656, -0.18260955810546875, -0.17818260192871094, -0.17375564575195312, -0.1693286895751953, -0.1649017333984375, -0.1604747772216797, -0.15604782104492188, -0.15162086486816406, -0.14719390869140625, -0.14276695251464844, -0.13833999633789062, -0.1339130401611328, -0.129486083984375, -0.1250591278076172, -0.12063217163085938, -0.11620521545410156, -0.11177825927734375, -0.10735130310058594, -0.10292434692382812, -0.09849739074707031, -0.0940704345703125, -0.08964347839355469, -0.08521652221679688, -0.08078956604003906, -0.07636260986328125, -0.07193565368652344, -0.06750869750976562, -0.06308174133300781, -0.05865478515625, -0.05422782897949219, -0.049800872802734375, -0.04537391662597656, -0.04094696044921875, -0.03652000427246094, -0.032093048095703125, -0.027666091918945312, -0.0232391357421875, -0.018812179565429688, -0.014385223388671875, -0.009958267211914062, -0.00553131103515625, -0.0011043548583984375, 0.003322601318359375, 0.0077495574951171875, 0.012176513671875, 0.016603469848632812, 0.021030426025390625, 0.025457382202148438, 0.02988433837890625, 0.03431129455566406, 0.038738250732421875, 0.04316520690917969, 0.0475921630859375, 0.05201911926269531, 0.056446075439453125, 0.06087303161621094, 0.06529998779296875, 0.06972694396972656, 0.07415390014648438, 0.07858085632324219, 0.0830078125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 2.0, 9.0, 29.0, 38.0, 99.0, 391.0, 297.0, 76.0, 41.0, 13.0, 10.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32934054732322693, -0.3190300166606903, -0.3087194561958313, -0.2984089255332947, -0.28809839487075806, -0.27778783440589905, -0.2674773037433624, -0.2571667432785034, -0.2468562126159668, -0.23654566705226898, -0.22623512148857117, -0.21592459082603455, -0.20561404526233673, -0.19530349969863892, -0.1849929690361023, -0.17468242347240448, -0.16437187790870667, -0.15406133234500885, -0.14375078678131104, -0.13344025611877441, -0.1231297105550766, -0.11281916499137878, -0.10250862687826157, -0.09219808876514435, -0.08188754320144653, -0.07157699763774872, -0.0612664595246315, -0.050955917686223984, -0.04064537584781647, -0.03033483400940895, -0.020024292171001434, -0.009713754057884216, 0.0005967617034912109, 0.010907303541898727, 0.021217845380306244, 0.03152838721871376, 0.04183892905712128, 0.05214947089552879, 0.06246001273393631, 0.07277055084705353, 0.08308109641075134, 0.09339164197444916, 0.10370218008756638, 0.1140127182006836, 0.12432326376438141, 0.13463380932807922, 0.14494433999061584, 0.15525488555431366, 0.16556543111801147, 0.1758759766817093, 0.1861865222454071, 0.19649705290794373, 0.20680759847164154, 0.21711814403533936, 0.22742867469787598, 0.2377392202615738, 0.2480497658252716, 0.2583602964878082, 0.26867085695266724, 0.27898138761520386, 0.2892919182777405, 0.2996024787425995, 0.3099130094051361, 0.3202235698699951, 0.33053410053253174]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 10.0, 9.0, 10.0, 20.0, 30.0, 37.0, 53.0, 52.0, 58.0, 73.0, 65.0, 69.0, 96.0, 72.0, 65.0, 60.0, 54.0, 46.0, 33.0, 35.0, 12.0, 15.0, 10.0, 3.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.09889980405569077, -0.09609703719615936, -0.09329426288604736, -0.09049149602651596, -0.08768872171640396, -0.08488595485687256, -0.08208318054676056, -0.07928041368722916, -0.07647763937711716, -0.07367487251758575, -0.07087209820747375, -0.06806933134794235, -0.06526655703783035, -0.06246378645300865, -0.05966101586818695, -0.05685824900865555, -0.05405547842383385, -0.051252707839012146, -0.048449937254190445, -0.045647166669368744, -0.04284439608454704, -0.04004162549972534, -0.03723885864019394, -0.03443608433008194, -0.03163331747055054, -0.028830546885728836, -0.026027776300907135, -0.023225005716085434, -0.020422235131263733, -0.017619464546442032, -0.01481669582426548, -0.012013925239443779, -0.009211152791976929, -0.006408382207155228, -0.003605612087994814, -0.0008028419688344002, 0.001999928615987301, 0.004802699200809002, 0.007605468854308128, 0.01040823943912983, 0.01321101002395153, 0.01601378060877323, 0.018816551193594933, 0.021619319915771484, 0.024422090500593185, 0.027224861085414886, 0.030027631670236588, 0.03283040225505829, 0.03563317283987999, 0.03843594342470169, 0.04123871400952339, 0.04404148459434509, 0.046844255179166794, 0.049647025763988495, 0.0524497926235199, 0.0552525669336319, 0.0580553337931633, 0.060858104377985, 0.0636608749628067, 0.0664636418223381, 0.0692664161324501, 0.0720691829919815, 0.0748719573020935, 0.07767472416162491, 0.08047749847173691]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 6.0, 8.0, 13.0, 15.0, 26.0, 35.0, 50.0, 94.0, 148.0, 286.0, 1108.0, 20053.0, 1015400.0, 9781.0, 856.0, 285.0, 131.0, 90.0, 46.0, 37.0, 21.0, 26.0, 10.0, 6.0, 8.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.0745849609375, -0.07253694534301758, -0.07048892974853516, -0.06844091415405273, -0.06639289855957031, -0.06434488296508789, -0.06229686737060547, -0.06024885177612305, -0.058200836181640625, -0.0561528205871582, -0.05410480499267578, -0.05205678939819336, -0.05000877380371094, -0.047960758209228516, -0.045912742614746094, -0.04386472702026367, -0.04181671142578125, -0.03976869583129883, -0.037720680236816406, -0.035672664642333984, -0.03362464904785156, -0.03157663345336914, -0.02952861785888672, -0.027480602264404297, -0.025432586669921875, -0.023384571075439453, -0.02133655548095703, -0.01928853988647461, -0.017240524291992188, -0.015192508697509766, -0.013144493103027344, -0.011096477508544922, -0.0090484619140625, -0.007000446319580078, -0.004952430725097656, -0.0029044151306152344, -0.0008563995361328125, 0.0011916160583496094, 0.0032396316528320312, 0.005287647247314453, 0.007335662841796875, 0.009383678436279297, 0.011431694030761719, 0.01347970962524414, 0.015527725219726562, 0.017575740814208984, 0.019623756408691406, 0.021671772003173828, 0.02371978759765625, 0.025767803192138672, 0.027815818786621094, 0.029863834381103516, 0.03191184997558594, 0.03395986557006836, 0.03600788116455078, 0.0380558967590332, 0.040103912353515625, 0.04215192794799805, 0.04419994354248047, 0.04624795913696289, 0.04829597473144531, 0.050343990325927734, 0.052392005920410156, 0.05444002151489258, 0.056488037109375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 13.0, 49.0, 180.0, 348.0, 247.0, 122.0, 38.0, 8.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1639404296875, -0.15677452087402344, -0.14960861206054688, -0.1424427032470703, -0.13527679443359375, -0.1281108856201172, -0.12094497680664062, -0.11377906799316406, -0.1066131591796875, -0.09944725036621094, -0.09228134155273438, -0.08511543273925781, -0.07794952392578125, -0.07078361511230469, -0.06361770629882812, -0.05645179748535156, -0.049285888671875, -0.04211997985839844, -0.034954071044921875, -0.027788162231445312, -0.02062225341796875, -0.013456344604492188, -0.006290435791015625, 0.0008754730224609375, 0.0080413818359375, 0.015207290649414062, 0.022373199462890625, 0.029539108276367188, 0.03670501708984375, 0.04387092590332031, 0.051036834716796875, 0.05820274353027344, 0.06536865234375, 0.07253456115722656, 0.07970046997070312, 0.08686637878417969, 0.09403228759765625, 0.10119819641113281, 0.10836410522460938, 0.11553001403808594, 0.1226959228515625, 0.12986183166503906, 0.13702774047851562, 0.1441936492919922, 0.15135955810546875, 0.1585254669189453, 0.16569137573242188, 0.17285728454589844, 0.180023193359375, 0.18718910217285156, 0.19435501098632812, 0.2015209197998047, 0.20868682861328125, 0.2158527374267578, 0.22301864624023438, 0.23018455505371094, 0.2373504638671875, 0.24451637268066406, 0.2516822814941406, 0.2588481903076172, 0.26601409912109375, 0.2731800079345703, 0.2803459167480469, 0.28751182556152344, 0.294677734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 13.0, 14.0, 22.0, 21.0, 39.0, 46.0, 49.0, 99.0, 117.0, 157.0, 241.0, 299.0, 428.0, 655.0, 1016.0, 1682.0, 3102.0, 7150.0, 21456.0, 102976.0, 714981.0, 148683.0, 27656.0, 8664.0, 3661.0, 1843.0, 1085.0, 712.0, 479.0, 324.0, 242.0, 151.0, 144.0, 93.0, 62.0, 32.0, 53.0, 20.0, 23.0, 11.0, 14.0, 6.0, 9.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.01406097412109375, -0.013629555702209473, -0.013198137283325195, -0.012766718864440918, -0.01233530044555664, -0.011903882026672363, -0.011472463607788086, -0.011041045188903809, -0.010609626770019531, -0.010178208351135254, -0.009746789932250977, -0.0093153715133667, -0.008883953094482422, -0.008452534675598145, -0.008021116256713867, -0.00758969783782959, -0.0071582794189453125, -0.006726861000061035, -0.006295442581176758, -0.0058640241622924805, -0.005432605743408203, -0.005001187324523926, -0.0045697689056396484, -0.004138350486755371, -0.0037069320678710938, -0.0032755136489868164, -0.002844095230102539, -0.0024126768112182617, -0.0019812583923339844, -0.001549839973449707, -0.0011184215545654297, -0.0006870031356811523, -0.000255584716796875, 0.00017583370208740234, 0.0006072521209716797, 0.001038670539855957, 0.0014700889587402344, 0.0019015073776245117, 0.002332925796508789, 0.0027643442153930664, 0.0031957626342773438, 0.003627181053161621, 0.0040585994720458984, 0.004490017890930176, 0.004921436309814453, 0.0053528547286987305, 0.005784273147583008, 0.006215691566467285, 0.0066471099853515625, 0.00707852840423584, 0.007509946823120117, 0.007941365242004395, 0.008372783660888672, 0.00880420207977295, 0.009235620498657227, 0.009667038917541504, 0.010098457336425781, 0.010529875755310059, 0.010961294174194336, 0.011392712593078613, 0.01182413101196289, 0.012255549430847168, 0.012686967849731445, 0.013118386268615723, 0.0135498046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 9.0, 7.0, 13.0, 17.0, 21.0, 38.0, 70.0, 91.0, 153.0, 152.0, 122.0, 104.0, 82.0, 53.0, 19.0, 14.0, 16.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2445068359375, -0.2372150421142578, -0.22992324829101562, -0.22263145446777344, -0.21533966064453125, -0.20804786682128906, -0.20075607299804688, -0.1934642791748047, -0.1861724853515625, -0.1788806915283203, -0.17158889770507812, -0.16429710388183594, -0.15700531005859375, -0.14971351623535156, -0.14242172241210938, -0.1351299285888672, -0.127838134765625, -0.12054634094238281, -0.11325454711914062, -0.10596275329589844, -0.09867095947265625, -0.09137916564941406, -0.08408737182617188, -0.07679557800292969, -0.0695037841796875, -0.06221199035644531, -0.054920196533203125, -0.04762840270996094, -0.04033660888671875, -0.03304481506347656, -0.025753021240234375, -0.018461227416992188, -0.01116943359375, -0.0038776397705078125, 0.003414154052734375, 0.010705947875976562, 0.01799774169921875, 0.025289535522460938, 0.032581329345703125, 0.03987312316894531, 0.0471649169921875, 0.05445671081542969, 0.061748504638671875, 0.06904029846191406, 0.07633209228515625, 0.08362388610839844, 0.09091567993164062, 0.09820747375488281, 0.105499267578125, 0.11279106140136719, 0.12008285522460938, 0.12737464904785156, 0.13466644287109375, 0.14195823669433594, 0.14925003051757812, 0.1565418243408203, 0.1638336181640625, 0.1711254119873047, 0.17841720581054688, 0.18570899963378906, 0.19300079345703125, 0.20029258728027344, 0.20758438110351562, 0.2148761749267578, 0.22216796875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 3.0, 6.0, 9.0, 13.0, 21.0, 49.0, 65.0, 105.0, 184.0, 319.0, 563.0, 1033.0, 1957.0, 3757.0, 9472.0, 986230.0, 34087.0, 5536.0, 2441.0, 1164.0, 646.0, 335.0, 213.0, 110.0, 70.0, 37.0, 39.0, 25.0, 11.0, 10.0, 5.0, 7.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0108642578125, -0.01054227352142334, -0.01022028923034668, -0.00989830493927002, -0.00957632064819336, -0.0092543363571167, -0.008932352066040039, -0.008610367774963379, -0.008288383483886719, -0.007966399192810059, -0.0076444149017333984, -0.007322430610656738, -0.007000446319580078, -0.006678462028503418, -0.006356477737426758, -0.006034493446350098, -0.0057125091552734375, -0.005390524864196777, -0.005068540573120117, -0.004746556282043457, -0.004424571990966797, -0.004102587699890137, -0.0037806034088134766, -0.0034586191177368164, -0.0031366348266601562, -0.002814650535583496, -0.002492666244506836, -0.0021706819534301758, -0.0018486976623535156, -0.0015267133712768555, -0.0012047290802001953, -0.0008827447891235352, -0.000560760498046875, -0.00023877620697021484, 8.320808410644531e-05, 0.00040519237518310547, 0.0007271766662597656, 0.0010491609573364258, 0.001371145248413086, 0.001693129539489746, 0.0020151138305664062, 0.0023370981216430664, 0.0026590824127197266, 0.0029810667037963867, 0.003303050994873047, 0.003625035285949707, 0.003947019577026367, 0.004269003868103027, 0.0045909881591796875, 0.004912972450256348, 0.005234956741333008, 0.005556941032409668, 0.005878925323486328, 0.006200909614562988, 0.0065228939056396484, 0.006844878196716309, 0.007166862487792969, 0.007488846778869629, 0.007810831069946289, 0.00813281536102295, 0.00845479965209961, 0.00877678394317627, 0.00909876823425293, 0.00942075252532959, 0.00974273681640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 9.0, 13.0, 62.0, 325.0, 480.0, 64.0, 16.0, 10.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3709068298339844e-05, -1.3329088687896729e-05, -1.2949109077453613e-05, -1.2569129467010498e-05, -1.2189149856567383e-05, -1.1809170246124268e-05, -1.1429190635681152e-05, -1.1049211025238037e-05, -1.0669231414794922e-05, -1.0289251804351807e-05, -9.909272193908691e-06, -9.529292583465576e-06, -9.149312973022461e-06, -8.769333362579346e-06, -8.38935375213623e-06, -8.009374141693115e-06, -7.62939453125e-06, -7.249414920806885e-06, -6.8694353103637695e-06, -6.489455699920654e-06, -6.109476089477539e-06, -5.729496479034424e-06, -5.349516868591309e-06, -4.969537258148193e-06, -4.589557647705078e-06, -4.209578037261963e-06, -3.829598426818848e-06, -3.4496188163757324e-06, -3.069639205932617e-06, -2.689659595489502e-06, -2.3096799850463867e-06, -1.9297003746032715e-06, -1.5497207641601562e-06, -1.169741153717041e-06, -7.897615432739258e-07, -4.0978193283081055e-07, -2.9802322387695312e-08, 3.501772880554199e-07, 7.301568984985352e-07, 1.1101365089416504e-06, 1.4901161193847656e-06, 1.8700957298278809e-06, 2.250075340270996e-06, 2.6300549507141113e-06, 3.0100345611572266e-06, 3.390014171600342e-06, 3.769993782043457e-06, 4.149973392486572e-06, 4.5299530029296875e-06, 4.909932613372803e-06, 5.289912223815918e-06, 5.669891834259033e-06, 6.0498714447021484e-06, 6.429851055145264e-06, 6.809830665588379e-06, 7.189810276031494e-06, 7.569789886474609e-06, 7.949769496917725e-06, 8.32974910736084e-06, 8.709728717803955e-06, 9.08970832824707e-06, 9.469687938690186e-06, 9.8496675491333e-06, 1.0229647159576416e-05, 1.0609626770019531e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 9.0, 6.0, 15.0, 21.0, 31.0, 49.0, 76.0, 122.0, 160.0, 264.0, 424.0, 639.0, 1104.0, 2091.0, 4767.0, 17915.0, 999543.0, 12701.0, 4031.0, 1886.0, 983.0, 600.0, 404.0, 240.0, 154.0, 107.0, 66.0, 51.0, 32.0, 19.0, 10.0, 14.0, 7.0, 5.0, 4.0, 0.0, 0.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01424407958984375, -0.013759732246398926, -0.013275384902954102, -0.012791037559509277, -0.012306690216064453, -0.011822342872619629, -0.011337995529174805, -0.01085364818572998, -0.010369300842285156, -0.009884953498840332, -0.009400606155395508, -0.008916258811950684, -0.00843191146850586, -0.007947564125061035, -0.007463216781616211, -0.006978869438171387, -0.0064945220947265625, -0.006010174751281738, -0.005525827407836914, -0.00504148006439209, -0.004557132720947266, -0.004072785377502441, -0.003588438034057617, -0.003104090690612793, -0.0026197433471679688, -0.0021353960037231445, -0.0016510486602783203, -0.001166701316833496, -0.0006823539733886719, -0.00019800662994384766, 0.00028634071350097656, 0.0007706880569458008, 0.001255035400390625, 0.0017393827438354492, 0.0022237300872802734, 0.0027080774307250977, 0.003192424774169922, 0.003676772117614746, 0.00416111946105957, 0.0046454668045043945, 0.005129814147949219, 0.005614161491394043, 0.006098508834838867, 0.006582856178283691, 0.007067203521728516, 0.00755155086517334, 0.008035898208618164, 0.008520245552062988, 0.009004592895507812, 0.009488940238952637, 0.009973287582397461, 0.010457634925842285, 0.01094198226928711, 0.011426329612731934, 0.011910676956176758, 0.012395024299621582, 0.012879371643066406, 0.01336371898651123, 0.013848066329956055, 0.014332413673400879, 0.014816761016845703, 0.015301108360290527, 0.01578545570373535, 0.016269803047180176, 0.016754150390625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 8.0, 0.0, 3.0, 10.0, 23.0, 583.0, 309.0, 27.0, 10.0, 6.0, 4.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032100677490234375, -0.00309908390045166, -0.002988100051879883, -0.0028771162033081055, -0.002766132354736328, -0.0026551485061645508, -0.0025441646575927734, -0.002433180809020996, -0.0023221969604492188, -0.0022112131118774414, -0.002100229263305664, -0.0019892454147338867, -0.0018782615661621094, -0.001767277717590332, -0.0016562938690185547, -0.0015453100204467773, -0.001434326171875, -0.0013233423233032227, -0.0012123584747314453, -0.001101374626159668, -0.0009903907775878906, -0.0008794069290161133, -0.0007684230804443359, -0.0006574392318725586, -0.0005464553833007812, -0.0004354715347290039, -0.00032448768615722656, -0.00021350383758544922, -0.00010251998901367188, 8.463859558105469e-06, 0.00011944770812988281, 0.00023043155670166016, 0.0003414154052734375, 0.00045239925384521484, 0.0005633831024169922, 0.0006743669509887695, 0.0007853507995605469, 0.0008963346481323242, 0.0010073184967041016, 0.001118302345275879, 0.0012292861938476562, 0.0013402700424194336, 0.001451253890991211, 0.0015622377395629883, 0.0016732215881347656, 0.001784205436706543, 0.0018951892852783203, 0.0020061731338500977, 0.002117156982421875, 0.0022281408309936523, 0.0023391246795654297, 0.002450108528137207, 0.0025610923767089844, 0.0026720762252807617, 0.002783060073852539, 0.0028940439224243164, 0.0030050277709960938, 0.003116011619567871, 0.0032269954681396484, 0.0033379793167114258, 0.003448963165283203, 0.0035599470138549805, 0.003670930862426758, 0.003781914710998535, 0.0038928985595703125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 6.0, 11.0, 28.0, 62.0, 399.0, 377.0, 75.0, 33.0, 15.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11156415194272995, -0.10500485450029373, -0.09844556450843811, -0.09188626706600189, -0.08532697707414627, -0.07876767963171005, -0.07220838963985443, -0.06564909219741821, -0.05908979848027229, -0.05253050476312637, -0.045971211045980453, -0.039411917328834534, -0.032852619886398315, -0.026293326169252396, -0.019734032452106476, -0.013174738734960556, -0.006615445017814636, -5.615083500742912e-05, 0.006503143347799778, 0.013062437996268272, 0.019621731713414192, 0.02618102729320526, 0.03274032101035118, 0.0392996147274971, 0.04585890844464302, 0.05241820216178894, 0.05897749587893486, 0.06553678959608078, 0.072096087038517, 0.07865537703037262, 0.08521467447280884, 0.09177397191524506, 0.09833325445652008, 0.1048925518989563, 0.11145184189081192, 0.11801113933324814, 0.12457042932510376, 0.13112972676753998, 0.1376890242099762, 0.14424830675125122, 0.15080760419368744, 0.15736690163612366, 0.16392619907855988, 0.1704854816198349, 0.17704477906227112, 0.18360407650470734, 0.19016337394714355, 0.19672265648841858, 0.203281968832016, 0.2098412662744522, 0.21640056371688843, 0.22295984625816345, 0.22951914370059967, 0.2360784411430359, 0.2426377385854721, 0.24919703602790833, 0.25575631856918335, 0.2623156011104584, 0.2688749134540558, 0.2754341959953308, 0.2819935083389282, 0.28855279088020325, 0.29511207342147827, 0.3016713857650757, 0.3082306683063507]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 35.0, 107.0, 211.0, 276.0, 211.0, 115.0, 34.0, 14.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14007048308849335, -0.134372279047966, -0.12867406010627747, -0.12297585606575012, -0.11727764457464218, -0.11157943308353424, -0.1058812290430069, -0.10018301755189896, -0.09448480606079102, -0.08878659456968307, -0.08308838307857513, -0.07739017903804779, -0.07169196754693985, -0.06599375605583191, -0.06029554829001427, -0.054597340524196625, -0.048899129033088684, -0.04320091754198074, -0.0375027097761631, -0.03180450201034546, -0.02610629051923752, -0.020408080890774727, -0.014709871262311935, -0.009011663496494293, -0.0033134520053863525, 0.002384757623076439, 0.00808296725153923, 0.013781176880002022, 0.019479386508464813, 0.025177596136927605, 0.030875805765390396, 0.03657401353120804, 0.04227223992347717, 0.047970451414585114, 0.053668659180402756, 0.0593668669462204, 0.06506507843732834, 0.07076328992843628, 0.07646149396896362, 0.08215970546007156, 0.0878579169511795, 0.09355612844228745, 0.09925433993339539, 0.10495254397392273, 0.11065075546503067, 0.11634896695613861, 0.12204717099666595, 0.1277453899383545, 0.13344359397888184, 0.13914179801940918, 0.14484001696109772, 0.15053822100162506, 0.1562364399433136, 0.16193464398384094, 0.1676328480243683, 0.17333105206489563, 0.17902927100658417, 0.1847274750471115, 0.19042569398880005, 0.1961238980293274, 0.20182210206985474, 0.20752032101154327, 0.21321852505207062, 0.21891674399375916, 0.2246149480342865]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 6.0, 7.0, 5.0, 11.0, 12.0, 12.0, 13.0, 25.0, 16.0, 20.0, 26.0, 37.0, 41.0, 57.0, 94.0, 187.0, 604.0, 125562.0, 920077.0, 1110.0, 190.0, 101.0, 49.0, 46.0, 41.0, 33.0, 30.0, 22.0, 27.0, 13.0, 10.0, 12.0, 8.0, 5.0, 11.0, 6.0, 10.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.81787109375, -0.79388427734375, -0.7698974609375, -0.74591064453125, -0.721923828125, -0.69793701171875, -0.6739501953125, -0.64996337890625, -0.6259765625, -0.60198974609375, -0.5780029296875, -0.55401611328125, -0.530029296875, -0.50604248046875, -0.4820556640625, -0.45806884765625, -0.43408203125, -0.41009521484375, -0.3861083984375, -0.36212158203125, -0.338134765625, -0.31414794921875, -0.2901611328125, -0.26617431640625, -0.2421875, -0.21820068359375, -0.1942138671875, -0.17022705078125, -0.146240234375, -0.12225341796875, -0.0982666015625, -0.07427978515625, -0.05029296875, -0.02630615234375, -0.0023193359375, 0.02166748046875, 0.045654296875, 0.06964111328125, 0.0936279296875, 0.11761474609375, 0.1416015625, 0.16558837890625, 0.1895751953125, 0.21356201171875, 0.237548828125, 0.26153564453125, 0.2855224609375, 0.30950927734375, 0.33349609375, 0.35748291015625, 0.3814697265625, 0.40545654296875, 0.429443359375, 0.45343017578125, 0.4774169921875, 0.50140380859375, 0.525390625, 0.54937744140625, 0.5733642578125, 0.59735107421875, 0.621337890625, 0.64532470703125, 0.6693115234375, 0.69329833984375, 0.71728515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 14.0, 134.0, 506.0, 305.0, 48.0, 8.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061767578125, -0.05730628967285156, -0.052845001220703125, -0.04838371276855469, -0.04392242431640625, -0.03946113586425781, -0.034999847412109375, -0.030538558959960938, -0.0260772705078125, -0.021615982055664062, -0.017154693603515625, -0.012693405151367188, -0.00823211669921875, -0.0037708282470703125, 0.000690460205078125, 0.0051517486572265625, 0.009613037109375, 0.014074325561523438, 0.018535614013671875, 0.022996902465820312, 0.02745819091796875, 0.03191947937011719, 0.036380767822265625, 0.04084205627441406, 0.0453033447265625, 0.04976463317871094, 0.054225921630859375, 0.05868721008300781, 0.06314849853515625, 0.06760978698730469, 0.07207107543945312, 0.07653236389160156, 0.08099365234375, 0.08545494079589844, 0.08991622924804688, 0.09437751770019531, 0.09883880615234375, 0.10330009460449219, 0.10776138305664062, 0.11222267150878906, 0.1166839599609375, 0.12114524841308594, 0.12560653686523438, 0.1300678253173828, 0.13452911376953125, 0.1389904022216797, 0.14345169067382812, 0.14791297912597656, 0.152374267578125, 0.15683555603027344, 0.16129684448242188, 0.1657581329345703, 0.17021942138671875, 0.1746807098388672, 0.17914199829101562, 0.18360328674316406, 0.1880645751953125, 0.19252586364746094, 0.19698715209960938, 0.2014484405517578, 0.20590972900390625, 0.2103710174560547, 0.21483230590820312, 0.21929359436035156, 0.2237548828125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 5.0, 5.0, 6.0, 13.0, 26.0, 34.0, 66.0, 79.0, 138.0, 258.0, 435.0, 792.0, 1407.0, 2854.0, 5442.0, 11834.0, 26719.0, 73438.0, 443200.0, 365391.0, 68632.0, 25469.0, 11076.0, 5366.0, 2686.0, 1410.0, 742.0, 426.0, 234.0, 124.0, 77.0, 67.0, 32.0, 22.0, 19.0, 10.0, 5.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0372314453125, -0.03594636917114258, -0.034661293029785156, -0.033376216888427734, -0.03209114074707031, -0.03080606460571289, -0.02952098846435547, -0.028235912322998047, -0.026950836181640625, -0.025665760040283203, -0.02438068389892578, -0.02309560775756836, -0.021810531616210938, -0.020525455474853516, -0.019240379333496094, -0.017955303192138672, -0.01667022705078125, -0.015385150909423828, -0.014100074768066406, -0.012814998626708984, -0.011529922485351562, -0.01024484634399414, -0.008959770202636719, -0.007674694061279297, -0.006389617919921875, -0.005104541778564453, -0.0038194656372070312, -0.0025343894958496094, -0.0012493133544921875, 3.5762786865234375e-05, 0.0013208389282226562, 0.002605915069580078, 0.0038909912109375, 0.005176067352294922, 0.006461143493652344, 0.007746219635009766, 0.009031295776367188, 0.01031637191772461, 0.011601448059082031, 0.012886524200439453, 0.014171600341796875, 0.015456676483154297, 0.01674175262451172, 0.01802682876586914, 0.019311904907226562, 0.020596981048583984, 0.021882057189941406, 0.023167133331298828, 0.02445220947265625, 0.025737285614013672, 0.027022361755371094, 0.028307437896728516, 0.029592514038085938, 0.03087759017944336, 0.03216266632080078, 0.0334477424621582, 0.034732818603515625, 0.03601789474487305, 0.03730297088623047, 0.03858804702758789, 0.03987312316894531, 0.041158199310302734, 0.042443275451660156, 0.04372835159301758, 0.045013427734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 7.0, 8.0, 7.0, 16.0, 17.0, 23.0, 23.0, 34.0, 50.0, 43.0, 50.0, 49.0, 76.0, 89.0, 90.0, 78.0, 63.0, 44.0, 46.0, 37.0, 22.0, 21.0, 24.0, 23.0, 6.0, 13.0, 12.0, 9.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0251617431640625, -0.024518728256225586, -0.023875713348388672, -0.023232698440551758, -0.022589683532714844, -0.02194666862487793, -0.021303653717041016, -0.0206606388092041, -0.020017623901367188, -0.019374608993530273, -0.01873159408569336, -0.018088579177856445, -0.01744556427001953, -0.016802549362182617, -0.016159534454345703, -0.015516519546508789, -0.014873504638671875, -0.014230489730834961, -0.013587474822998047, -0.012944459915161133, -0.012301445007324219, -0.011658430099487305, -0.01101541519165039, -0.010372400283813477, -0.009729385375976562, -0.009086370468139648, -0.008443355560302734, -0.00780034065246582, -0.007157325744628906, -0.006514310836791992, -0.005871295928955078, -0.005228281021118164, -0.00458526611328125, -0.003942251205444336, -0.003299236297607422, -0.002656221389770508, -0.0020132064819335938, -0.0013701915740966797, -0.0007271766662597656, -8.416175842285156e-05, 0.0005588531494140625, 0.0012018680572509766, 0.0018448829650878906, 0.0024878978729248047, 0.0031309127807617188, 0.003773927688598633, 0.004416942596435547, 0.005059957504272461, 0.005702972412109375, 0.006345987319946289, 0.006989002227783203, 0.007632017135620117, 0.008275032043457031, 0.008918046951293945, 0.00956106185913086, 0.010204076766967773, 0.010847091674804688, 0.011490106582641602, 0.012133121490478516, 0.01277613639831543, 0.013419151306152344, 0.014062166213989258, 0.014705181121826172, 0.015348196029663086, 0.0159912109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 11.0, 7.0, 14.0, 8.0, 19.0, 19.0, 37.0, 53.0, 72.0, 104.0, 167.0, 258.0, 462.0, 907.0, 1835.0, 4611.0, 16156.0, 412406.0, 585749.0, 16703.0, 4688.0, 1941.0, 900.0, 536.0, 287.0, 210.0, 106.0, 87.0, 60.0, 37.0, 29.0, 14.0, 24.0, 11.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0037860870361328125, -0.003677964210510254, -0.0035698413848876953, -0.0034617185592651367, -0.003353595733642578, -0.0032454729080200195, -0.003137350082397461, -0.0030292272567749023, -0.0029211044311523438, -0.002812981605529785, -0.0027048587799072266, -0.002596735954284668, -0.0024886131286621094, -0.0023804903030395508, -0.002272367477416992, -0.0021642446517944336, -0.002056121826171875, -0.0019479990005493164, -0.0018398761749267578, -0.0017317533493041992, -0.0016236305236816406, -0.001515507698059082, -0.0014073848724365234, -0.0012992620468139648, -0.0011911392211914062, -0.0010830163955688477, -0.0009748935699462891, -0.0008667707443237305, -0.0007586479187011719, -0.0006505250930786133, -0.0005424022674560547, -0.0004342794418334961, -0.0003261566162109375, -0.0002180337905883789, -0.00010991096496582031, -1.7881393432617188e-06, 0.00010633468627929688, 0.00021445751190185547, 0.00032258033752441406, 0.00043070316314697266, 0.0005388259887695312, 0.0006469488143920898, 0.0007550716400146484, 0.000863194465637207, 0.0009713172912597656, 0.0010794401168823242, 0.0011875629425048828, 0.0012956857681274414, 0.00140380859375, 0.0015119314193725586, 0.0016200542449951172, 0.0017281770706176758, 0.0018362998962402344, 0.001944422721862793, 0.0020525455474853516, 0.00216066837310791, 0.0022687911987304688, 0.0023769140243530273, 0.002485036849975586, 0.0025931596755981445, 0.002701282501220703, 0.0028094053268432617, 0.0029175281524658203, 0.003025650978088379, 0.0031337738037109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 5.0, 8.0, 0.0, 18.0, 29.0, 0.0, 104.0, 0.0, 197.0, 282.0, 0.0, 209.0, 102.0, 0.0, 28.0, 0.0, 13.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-07, -9.164214134216309e-07, -8.791685104370117e-07, -8.419156074523926e-07, -8.046627044677734e-07, -7.674098014831543e-07, -7.301568984985352e-07, -6.92903995513916e-07, -6.556510925292969e-07, -6.183981895446777e-07, -5.811452865600586e-07, -5.438923835754395e-07, -5.066394805908203e-07, -4.6938657760620117e-07, -4.3213367462158203e-07, -3.948807716369629e-07, -3.5762786865234375e-07, -3.203749656677246e-07, -2.8312206268310547e-07, -2.4586915969848633e-07, -2.086162567138672e-07, -1.7136335372924805e-07, -1.341104507446289e-07, -9.685754776000977e-08, -5.960464477539063e-08, -2.2351741790771484e-08, 1.4901161193847656e-08, 5.21540641784668e-08, 8.940696716308594e-08, 1.2665987014770508e-07, 1.6391277313232422e-07, 2.0116567611694336e-07, 2.384185791015625e-07, 2.7567148208618164e-07, 3.129243850708008e-07, 3.501772880554199e-07, 3.8743019104003906e-07, 4.246830940246582e-07, 4.6193599700927734e-07, 4.991888999938965e-07, 5.364418029785156e-07, 5.736947059631348e-07, 6.109476089477539e-07, 6.48200511932373e-07, 6.854534149169922e-07, 7.227063179016113e-07, 7.599592208862305e-07, 7.972121238708496e-07, 8.344650268554688e-07, 8.717179298400879e-07, 9.08970832824707e-07, 9.462237358093262e-07, 9.834766387939453e-07, 1.0207295417785645e-06, 1.0579824447631836e-06, 1.0952353477478027e-06, 1.1324882507324219e-06, 1.169741153717041e-06, 1.2069940567016602e-06, 1.2442469596862793e-06, 1.2814998626708984e-06, 1.3187527656555176e-06, 1.3560056686401367e-06, 1.3932585716247559e-06, 1.430511474609375e-06]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 7.0, 13.0, 13.0, 10.0, 19.0, 31.0, 38.0, 45.0, 62.0, 97.0, 116.0, 148.0, 234.0, 325.0, 460.0, 672.0, 971.0, 1468.0, 2395.0, 4247.0, 8831.0, 23347.0, 150284.0, 777710.0, 48191.0, 13882.0, 5967.0, 3195.0, 1975.0, 1149.0, 798.0, 532.0, 377.0, 247.0, 200.0, 130.0, 97.0, 70.0, 43.0, 44.0, 38.0, 22.0, 13.0, 11.0, 8.0, 5.0, 4.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0016031265258789062, -0.0015534162521362305, -0.0015037059783935547, -0.001453995704650879, -0.0014042854309082031, -0.0013545751571655273, -0.0013048648834228516, -0.0012551546096801758, -0.0012054443359375, -0.0011557340621948242, -0.0011060237884521484, -0.0010563135147094727, -0.0010066032409667969, -0.0009568929672241211, -0.0009071826934814453, -0.0008574724197387695, -0.0008077621459960938, -0.000758051872253418, -0.0007083415985107422, -0.0006586313247680664, -0.0006089210510253906, -0.0005592107772827148, -0.0005095005035400391, -0.0004597902297973633, -0.0004100799560546875, -0.0003603696823120117, -0.00031065940856933594, -0.00026094913482666016, -0.00021123886108398438, -0.0001615285873413086, -0.00011181831359863281, -6.210803985595703e-05, -1.239776611328125e-05, 3.731250762939453e-05, 8.702278137207031e-05, 0.0001367330551147461, 0.00018644332885742188, 0.00023615360260009766, 0.00028586387634277344, 0.0003355741500854492, 0.000385284423828125, 0.0004349946975708008, 0.00048470497131347656, 0.0005344152450561523, 0.0005841255187988281, 0.0006338357925415039, 0.0006835460662841797, 0.0007332563400268555, 0.0007829666137695312, 0.000832676887512207, 0.0008823871612548828, 0.0009320974349975586, 0.0009818077087402344, 0.0010315179824829102, 0.001081228256225586, 0.0011309385299682617, 0.0011806488037109375, 0.0012303590774536133, 0.001280069351196289, 0.0013297796249389648, 0.0013794898986816406, 0.0014292001724243164, 0.0014789104461669922, 0.001528620719909668, 0.0015783309936523438]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 5.0, 12.0, 22.0, 31.0, 57.0, 132.0, 289.0, 216.0, 72.0, 48.0, 23.0, 21.0, 13.0, 9.0, 6.0, 6.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0011377334594726562, -0.0011068060994148254, -0.0010758787393569946, -0.0010449513792991638, -0.001014024019241333, -0.0009830966591835022, -0.0009521692991256714, -0.0009212419390678406, -0.0008903145790100098, -0.000859387218952179, -0.0008284598588943481, -0.0007975324988365173, -0.0007666051387786865, -0.0007356777787208557, -0.0007047504186630249, -0.0006738230586051941, -0.0006428956985473633, -0.0006119683384895325, -0.0005810409784317017, -0.0005501136183738708, -0.00051918625831604, -0.00048825889825820923, -0.0004573315382003784, -0.0004264041781425476, -0.0003954768180847168, -0.000364549458026886, -0.0003336220979690552, -0.00030269473791122437, -0.00027176737785339355, -0.00024084001779556274, -0.00020991265773773193, -0.00017898529767990112, -0.0001480579376220703, -0.0001171305775642395, -8.620321750640869e-05, -5.527585744857788e-05, -2.434849739074707e-05, 6.57886266708374e-06, 3.750622272491455e-05, 6.843358278274536e-05, 9.936094284057617e-05, 0.00013028830289840698, 0.0001612156629562378, 0.0001921430230140686, 0.00022307038307189941, 0.0002539977431297302, 0.00028492510318756104, 0.00031585246324539185, 0.00034677982330322266, 0.00037770718336105347, 0.0004086345434188843, 0.0004395619034767151, 0.0004704892635345459, 0.0005014166235923767, 0.0005323439836502075, 0.0005632713437080383, 0.0005941987037658691, 0.0006251260638237, 0.0006560534238815308, 0.0006869807839393616, 0.0007179081439971924, 0.0007488355040550232, 0.000779762864112854, 0.0008106902241706848, 0.0008416175842285156]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 13.0, 79.0, 770.0, 126.0, 21.0, 6.0, 1.0, 2.0], "bins": [-0.6291822791099548, -0.6184458136558533, -0.6077094078063965, -0.5969729423522949, -0.5862364768981934, -0.5755000710487366, -0.564763605594635, -0.5540271401405334, -0.5432907342910767, -0.5325542688369751, -0.5218178629875183, -0.5110813975334167, -0.5003449320793152, -0.4896085262298584, -0.47887206077575684, -0.46813562512397766, -0.4573991596698761, -0.4466627240180969, -0.43592625856399536, -0.4251898229122162, -0.414453387260437, -0.40371692180633545, -0.3929804861545563, -0.3822440505027771, -0.37150758504867554, -0.36077114939689636, -0.3500346839427948, -0.3392982482910156, -0.32856181263923645, -0.3178253769874573, -0.3070889115333557, -0.29635247588157654, -0.285616010427475, -0.2748795747756958, -0.26414310932159424, -0.25340667366981506, -0.2426702380180359, -0.23193378746509552, -0.22119733691215515, -0.21046090126037598, -0.1997244507074356, -0.18898800015449524, -0.17825156450271606, -0.1675151139497757, -0.15677866339683533, -0.14604222774505615, -0.13530577719211578, -0.12456933408975601, -0.11383289098739624, -0.10309644788503647, -0.0923600047826767, -0.08162355422973633, -0.07088711112737656, -0.060150668025016785, -0.049414217472076416, -0.038677774369716644, -0.02794133499264717, -0.01720489002764225, -0.006468445062637329, 0.004268001765012741, 0.015004444867372513, 0.025740887969732285, 0.03647733852267265, 0.047213781625032425, 0.0579502247273922]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 15.0, 59.0, 160.0, 226.0, 237.0, 200.0, 85.0, 30.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05867072194814682, -0.05419128015637398, -0.049711838364601135, -0.045232392847537994, -0.04075295478105545, -0.03627350926399231, -0.03179406747221947, -0.027314625680446625, -0.022835183888673782, -0.01835574209690094, -0.013876299373805523, -0.009396856650710106, -0.0049174148589372635, -0.0004379730671644211, 0.0040414705872535706, 0.008520912379026413, 0.013000354170799255, 0.017479795962572098, 0.02195923775434494, 0.026438681408762932, 0.030918123200535774, 0.035397566854953766, 0.03987700864672661, 0.04435645043849945, 0.04883589223027229, 0.053315334022045135, 0.05779477581381798, 0.06227421760559082, 0.06675366312265396, 0.0712331011891365, 0.07571254670619965, 0.08019198477268219, 0.08467142283916473, 0.08915086835622787, 0.09363030642271042, 0.09810975193977356, 0.1025891900062561, 0.10706863552331924, 0.11154808104038239, 0.11602751910686493, 0.12050695717334747, 0.12498640269041061, 0.12946584820747375, 0.1339452862739563, 0.13842472434043884, 0.1429041624069214, 0.14738361537456512, 0.15186305344104767, 0.1563425064086914, 0.16082194447517395, 0.1653013974428177, 0.16978083550930023, 0.17426027357578278, 0.17873971164226532, 0.18321916460990906, 0.1876986026763916, 0.19217804074287415, 0.1966574788093567, 0.20113693177700043, 0.20561636984348297, 0.21009580790996552, 0.21457524597644806, 0.2190546989440918, 0.22353413701057434, 0.22801357507705688]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 7.0, 7.0, 9.0, 7.0, 14.0, 27.0, 27.0, 43.0, 57.0, 74.0, 104.0, 192.0, 282.0, 409.0, 648.0, 1127.0, 1848.0, 3100.0, 6000.0, 11643.0, 24682.0, 58471.0, 176108.0, 3310821.0, 433074.0, 93200.0, 37244.0, 16788.0, 8230.0, 4289.0, 2337.0, 1342.0, 759.0, 482.0, 287.0, 192.0, 116.0, 78.0, 56.0, 32.0, 28.0, 12.0, 16.0, 6.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0209503173828125, -0.020346879959106445, -0.01974344253540039, -0.019140005111694336, -0.01853656768798828, -0.017933130264282227, -0.017329692840576172, -0.016726255416870117, -0.016122817993164062, -0.015519380569458008, -0.014915943145751953, -0.014312505722045898, -0.013709068298339844, -0.013105630874633789, -0.012502193450927734, -0.01189875602722168, -0.011295318603515625, -0.01069188117980957, -0.010088443756103516, -0.009485006332397461, -0.008881568908691406, -0.008278131484985352, -0.007674694061279297, -0.007071256637573242, -0.0064678192138671875, -0.005864381790161133, -0.005260944366455078, -0.0046575069427490234, -0.004054069519042969, -0.003450632095336914, -0.0028471946716308594, -0.0022437572479248047, -0.00164031982421875, -0.0010368824005126953, -0.0004334449768066406, 0.00016999244689941406, 0.0007734298706054688, 0.0013768672943115234, 0.001980304718017578, 0.002583742141723633, 0.0031871795654296875, 0.003790616989135742, 0.004394054412841797, 0.0049974918365478516, 0.005600929260253906, 0.006204366683959961, 0.006807804107666016, 0.00741124153137207, 0.008014678955078125, 0.00861811637878418, 0.009221553802490234, 0.009824991226196289, 0.010428428649902344, 0.011031866073608398, 0.011635303497314453, 0.012238740921020508, 0.012842178344726562, 0.013445615768432617, 0.014049053192138672, 0.014652490615844727, 0.015255928039550781, 0.015859365463256836, 0.01646280288696289, 0.017066240310668945, 0.017669677734375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 6.0, 11.0, 7.0, 13.0, 13.0, 18.0, 17.0, 30.0, 34.0, 37.0, 26.0, 44.0, 39.0, 49.0, 53.0, 66.0, 66.0, 53.0, 57.0, 42.0, 42.0, 38.0, 43.0, 26.0, 33.0, 23.0, 25.0, 16.0, 18.0, 7.0, 12.0, 10.0, 3.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0027446746826171875, -0.0026648640632629395, -0.0025850534439086914, -0.0025052428245544434, -0.0024254322052001953, -0.0023456215858459473, -0.0022658109664916992, -0.002186000347137451, -0.002106189727783203, -0.002026379108428955, -0.001946568489074707, -0.001866757869720459, -0.001786947250366211, -0.0017071366310119629, -0.0016273260116577148, -0.0015475153923034668, -0.0014677047729492188, -0.0013878941535949707, -0.0013080835342407227, -0.0012282729148864746, -0.0011484622955322266, -0.0010686516761779785, -0.0009888410568237305, -0.0009090304374694824, -0.0008292198181152344, -0.0007494091987609863, -0.0006695985794067383, -0.0005897879600524902, -0.0005099773406982422, -0.00043016672134399414, -0.0003503561019897461, -0.00027054548263549805, -0.00019073486328125, -0.00011092424392700195, -3.1113624572753906e-05, 4.869699478149414e-05, 0.0001285076141357422, 0.00020831823348999023, 0.0002881288528442383, 0.00036793947219848633, 0.0004477500915527344, 0.0005275607109069824, 0.0006073713302612305, 0.0006871819496154785, 0.0007669925689697266, 0.0008468031883239746, 0.0009266138076782227, 0.0010064244270324707, 0.0010862350463867188, 0.0011660456657409668, 0.0012458562850952148, 0.0013256669044494629, 0.001405477523803711, 0.001485288143157959, 0.001565098762512207, 0.001644909381866455, 0.0017247200012207031, 0.0018045306205749512, 0.0018843412399291992, 0.0019641518592834473, 0.0020439624786376953, 0.0021237730979919434, 0.0022035837173461914, 0.0022833943367004395, 0.0023632049560546875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 16.0, 26.0, 33.0, 50.0, 103.0, 128.0, 242.0, 1627.0, 4190515.0, 896.0, 239.0, 155.0, 98.0, 56.0, 43.0, 23.0, 18.0, 14.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0645751953125, -0.05938148498535156, -0.054187774658203125, -0.04899406433105469, -0.04380035400390625, -0.03860664367675781, -0.033412933349609375, -0.028219223022460938, -0.0230255126953125, -0.017831802368164062, -0.012638092041015625, -0.0074443817138671875, -0.00225067138671875, 0.0029430389404296875, 0.008136749267578125, 0.013330459594726562, 0.018524169921875, 0.023717880249023438, 0.028911590576171875, 0.03410530090332031, 0.03929901123046875, 0.04449272155761719, 0.049686431884765625, 0.05488014221191406, 0.0600738525390625, 0.06526756286621094, 0.07046127319335938, 0.07565498352050781, 0.08084869384765625, 0.08604240417480469, 0.09123611450195312, 0.09642982482910156, 0.10162353515625, 0.10681724548339844, 0.11201095581054688, 0.11720466613769531, 0.12239837646484375, 0.1275920867919922, 0.13278579711914062, 0.13797950744628906, 0.1431732177734375, 0.14836692810058594, 0.15356063842773438, 0.1587543487548828, 0.16394805908203125, 0.1691417694091797, 0.17433547973632812, 0.17952919006347656, 0.184722900390625, 0.18991661071777344, 0.19511032104492188, 0.2003040313720703, 0.20549774169921875, 0.2106914520263672, 0.21588516235351562, 0.22107887268066406, 0.2262725830078125, 0.23146629333496094, 0.23666000366210938, 0.2418537139892578, 0.24704742431640625, 0.2522411346435547, 0.2574348449707031, 0.26262855529785156, 0.267822265625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 25.0, 132.0, 734.0, 2765.0, 365.0, 59.0, 9.0], "bins": [-0.043792724609375, -0.04306569695472717, -0.042338669300079346, -0.04161164164543152, -0.04088461399078369, -0.040157586336135864, -0.03943055868148804, -0.03870353102684021, -0.03797650337219238, -0.037249475717544556, -0.03652244806289673, -0.0357954204082489, -0.035068392753601074, -0.03434136509895325, -0.03361433744430542, -0.03288730978965759, -0.032160282135009766, -0.03143325448036194, -0.03070622682571411, -0.029979199171066284, -0.029252171516418457, -0.02852514386177063, -0.027798116207122803, -0.027071088552474976, -0.02634406089782715, -0.02561703324317932, -0.024890005588531494, -0.024162977933883667, -0.02343595027923584, -0.022708922624588013, -0.021981894969940186, -0.02125486731529236, -0.02052783966064453, -0.019800812005996704, -0.019073784351348877, -0.01834675669670105, -0.017619729042053223, -0.016892701387405396, -0.01616567373275757, -0.015438646078109741, -0.014711618423461914, -0.013984590768814087, -0.01325756311416626, -0.012530535459518433, -0.011803507804870605, -0.011076480150222778, -0.010349452495574951, -0.009622424840927124, -0.008895397186279297, -0.00816836953163147, -0.007441341876983643, -0.006714314222335815, -0.005987286567687988, -0.005260258913040161, -0.004533231258392334, -0.003806203603744507, -0.0030791759490966797, -0.0023521482944488525, -0.0016251206398010254, -0.0008980929851531982, -0.0001710653305053711, 0.0005559623241424561, 0.0012829899787902832, 0.0020100176334381104, 0.0027370452880859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 11.0, 14.0, 14.0, 34.0, 34.0, 53.0, 122.0, 258.0, 184.0, 95.0, 57.0, 38.0, 33.0, 16.0, 12.0, 11.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02638382278382778, -0.02539873868227005, -0.024413656443357468, -0.023428572341799736, -0.022443488240242004, -0.021458406001329422, -0.02047332189977169, -0.01948823779821396, -0.018503155559301376, -0.017518071457743645, -0.016532989218831062, -0.01554790511727333, -0.014562821947038174, -0.013577738776803017, -0.012592654675245285, -0.011607571505010128, -0.010622488334774971, -0.009637405164539814, -0.008652321994304657, -0.007667237892746925, -0.006682154722511768, -0.005697071552276611, -0.004711987916380167, -0.0037269042804837227, -0.0027418211102485657, -0.001756737707182765, -0.0007716543041169643, 0.00021342909894883633, 0.001198512502014637, 0.002183595672249794, 0.0031686793081462383, 0.004153762944042683, 0.005138847976922989, 0.006123931147158146, 0.00710901478305459, 0.008094098418951035, 0.009079181589186192, 0.010064264759421349, 0.01104934886097908, 0.012034432031214237, 0.013019515201449394, 0.014004598371684551, 0.014989681541919708, 0.01597476564347744, 0.01695984974503517, 0.017944931983947754, 0.018930016085505486, 0.019915100187063217, 0.0209001824259758, 0.02188526652753353, 0.022870348766446114, 0.023855432868003845, 0.024840515106916428, 0.02582559920847416, 0.02681068331003189, 0.027795765548944473, 0.028780849650502205, 0.029765933752059937, 0.03075101599097252, 0.0317360982298851, 0.03272118419408798, 0.033706266433000565, 0.03469134867191315, 0.03567643463611603, 0.03666151687502861]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 7.0, 16.0, 7.0, 19.0, 22.0, 26.0, 40.0, 41.0, 52.0, 50.0, 70.0, 66.0, 76.0, 65.0, 55.0, 71.0, 46.0, 50.0, 51.0, 41.0, 27.0, 24.0, 17.0, 18.0, 9.0, 8.0, 4.0, 7.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.009588564746081829, -0.009191269986331463, -0.008793975226581097, -0.00839668046683073, -0.007999385707080364, -0.007602090947329998, -0.007204796653240919, -0.006807501893490553, -0.006410207133740187, -0.0060129123739898205, -0.005615617614239454, -0.005218323320150375, -0.004821028560400009, -0.004423733800649643, -0.004026439040899277, -0.0036291442811489105, -0.0032318495213985443, -0.002834554761648178, -0.002437260001897812, -0.0020399654749780893, -0.0016426707152277231, -0.001245375955477357, -0.0008480814285576344, -0.00045078666880726814, -5.349190905690193e-05, 0.00034380279248580337, 0.0007410974940285087, 0.001138392137363553, 0.0015356868971139193, 0.0019329816568642855, 0.002330276183784008, 0.0027275709435343742, 0.003124864771962166, 0.003522159531712532, 0.003919454291462898, 0.0043167490512132645, 0.004714043810963631, 0.005111338570713997, 0.005508632864803076, 0.005905927624553442, 0.006303222384303808, 0.006700517144054174, 0.007097811903804541, 0.0074951061978936195, 0.007892400957643986, 0.008289695717394352, 0.008686990477144718, 0.009084285236895084, 0.00948157999664545, 0.009878874756395817, 0.010276169516146183, 0.01067346427589655, 0.011070759035646915, 0.011468053795397282, 0.011865347623825073, 0.01226264238357544, 0.012659937143325806, 0.013057231903076172, 0.013454526662826538, 0.013851821422576904, 0.01424911618232727, 0.014646410942077637, 0.015043705701828003, 0.01544100046157837, 0.015838295221328735]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 0.0, 5.0, 2.0, 3.0, 8.0, 7.0, 11.0, 14.0, 30.0, 36.0, 52.0, 85.0, 141.0, 290.0, 625.0, 1764.0, 6192.0, 34531.0, 681227.0, 292280.0, 23938.0, 4723.0, 1405.0, 543.0, 249.0, 143.0, 75.0, 52.0, 37.0, 20.0, 18.0, 12.0, 10.0, 8.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003681182861328125, -0.0035580992698669434, -0.0034350156784057617, -0.00331193208694458, -0.0031888484954833984, -0.003065764904022217, -0.002942681312561035, -0.0028195977210998535, -0.002696514129638672, -0.0025734305381774902, -0.0024503469467163086, -0.002327263355255127, -0.0022041797637939453, -0.0020810961723327637, -0.001958012580871582, -0.0018349289894104004, -0.0017118453979492188, -0.0015887618064880371, -0.0014656782150268555, -0.0013425946235656738, -0.0012195110321044922, -0.0010964274406433105, -0.0009733438491821289, -0.0008502602577209473, -0.0007271766662597656, -0.000604093074798584, -0.00048100948333740234, -0.0003579258918762207, -0.00023484230041503906, -0.00011175870895385742, 1.1324882507324219e-05, 0.00013440847396850586, 0.0002574920654296875, 0.00038057565689086914, 0.0005036592483520508, 0.0006267428398132324, 0.0007498264312744141, 0.0008729100227355957, 0.0009959936141967773, 0.001119077205657959, 0.0012421607971191406, 0.0013652443885803223, 0.001488327980041504, 0.0016114115715026855, 0.0017344951629638672, 0.0018575787544250488, 0.0019806623458862305, 0.002103745937347412, 0.0022268295288085938, 0.0023499131202697754, 0.002472996711730957, 0.0025960803031921387, 0.0027191638946533203, 0.002842247486114502, 0.0029653310775756836, 0.0030884146690368652, 0.003211498260498047, 0.0033345818519592285, 0.00345766544342041, 0.003580749034881592, 0.0037038326263427734, 0.003826916217803955, 0.003949999809265137, 0.004073083400726318, 0.0041961669921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 12.0, 18.0, 21.0, 39.0, 78.0, 88.0, 119.0, 182.0, 139.0, 86.0, 83.0, 57.0, 29.0, 23.0, 8.0, 8.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0097808837890625, -0.009284496307373047, -0.008788108825683594, -0.00829172134399414, -0.0077953338623046875, -0.007298946380615234, -0.006802558898925781, -0.006306171417236328, -0.005809783935546875, -0.005313396453857422, -0.004817008972167969, -0.004320621490478516, -0.0038242340087890625, -0.0033278465270996094, -0.0028314590454101562, -0.002335071563720703, -0.00183868408203125, -0.0013422966003417969, -0.0008459091186523438, -0.0003495216369628906, 0.0001468658447265625, 0.0006432533264160156, 0.0011396408081054688, 0.0016360282897949219, 0.002132415771484375, 0.002628803253173828, 0.0031251907348632812, 0.0036215782165527344, 0.0041179656982421875, 0.004614353179931641, 0.005110740661621094, 0.005607128143310547, 0.006103515625, 0.006599903106689453, 0.007096290588378906, 0.007592678070068359, 0.008089065551757812, 0.008585453033447266, 0.009081840515136719, 0.009578227996826172, 0.010074615478515625, 0.010571002960205078, 0.011067390441894531, 0.011563777923583984, 0.012060165405273438, 0.01255655288696289, 0.013052940368652344, 0.013549327850341797, 0.01404571533203125, 0.014542102813720703, 0.015038490295410156, 0.01553487777709961, 0.016031265258789062, 0.016527652740478516, 0.01702404022216797, 0.017520427703857422, 0.018016815185546875, 0.018513202667236328, 0.01900959014892578, 0.019505977630615234, 0.020002365112304688, 0.02049875259399414, 0.020995140075683594, 0.021491527557373047, 0.0219879150390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 9.0, 9.0, 8.0, 15.0, 22.0, 39.0, 54.0, 74.0, 118.0, 164.0, 305.0, 444.0, 815.0, 1393.0, 2368.0, 4506.0, 8779.0, 18668.0, 43707.0, 117609.0, 473455.0, 244105.0, 74379.0, 29451.0, 13513.0, 6575.0, 3428.0, 1823.0, 1055.0, 588.0, 394.0, 223.0, 169.0, 102.0, 67.0, 31.0, 24.0, 23.0, 13.0, 8.0, 10.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0012083053588867188, -0.00116632878780365, -0.001124352216720581, -0.0010823756456375122, -0.0010403990745544434, -0.0009984225034713745, -0.0009564459323883057, -0.0009144693613052368, -0.000872492790222168, -0.0008305162191390991, -0.0007885396480560303, -0.0007465630769729614, -0.0007045865058898926, -0.0006626099348068237, -0.0006206333637237549, -0.000578656792640686, -0.0005366802215576172, -0.0004947036504745483, -0.0004527270793914795, -0.00041075050830841064, -0.0003687739372253418, -0.00032679736614227295, -0.0002848207950592041, -0.00024284422397613525, -0.0002008676528930664, -0.00015889108180999756, -0.00011691451072692871, -7.493793964385986e-05, -3.2961368560791016e-05, 9.015202522277832e-06, 5.099177360534668e-05, 9.296834468841553e-05, 0.00013494491577148438, 0.00017692148685455322, 0.00021889805793762207, 0.0002608746290206909, 0.00030285120010375977, 0.0003448277711868286, 0.00038680434226989746, 0.0004287809133529663, 0.00047075748443603516, 0.000512734055519104, 0.0005547106266021729, 0.0005966871976852417, 0.0006386637687683105, 0.0006806403398513794, 0.0007226169109344482, 0.0007645934820175171, 0.0008065700531005859, 0.0008485466241836548, 0.0008905231952667236, 0.0009324997663497925, 0.0009744763374328613, 0.0010164529085159302, 0.001058429479598999, 0.0011004060506820679, 0.0011423826217651367, 0.0011843591928482056, 0.0012263357639312744, 0.0012683123350143433, 0.0013102889060974121, 0.001352265477180481, 0.0013942420482635498, 0.0014362186193466187, 0.0014781951904296875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 11.0, 5.0, 4.0, 12.0, 13.0, 25.0, 25.0, 35.0, 45.0, 50.0, 46.0, 70.0, 68.0, 67.0, 65.0, 62.0, 62.0, 50.0, 47.0, 39.0, 36.0, 31.0, 23.0, 18.0, 20.0, 17.0, 9.0, 7.0, 4.0, 6.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.018035888671875, -0.017414331436157227, -0.016792774200439453, -0.01617121696472168, -0.015549659729003906, -0.014928102493286133, -0.01430654525756836, -0.013684988021850586, -0.013063430786132812, -0.012441873550415039, -0.011820316314697266, -0.011198759078979492, -0.010577201843261719, -0.009955644607543945, -0.009334087371826172, -0.008712530136108398, -0.008090972900390625, -0.0074694156646728516, -0.006847858428955078, -0.006226301193237305, -0.005604743957519531, -0.004983186721801758, -0.004361629486083984, -0.003740072250366211, -0.0031185150146484375, -0.002496957778930664, -0.0018754005432128906, -0.0012538433074951172, -0.0006322860717773438, -1.0728836059570312e-05, 0.0006108283996582031, 0.0012323856353759766, 0.00185394287109375, 0.0024755001068115234, 0.003097057342529297, 0.0037186145782470703, 0.004340171813964844, 0.004961729049682617, 0.005583286285400391, 0.006204843521118164, 0.0068264007568359375, 0.007447957992553711, 0.008069515228271484, 0.008691072463989258, 0.009312629699707031, 0.009934186935424805, 0.010555744171142578, 0.011177301406860352, 0.011798858642578125, 0.012420415878295898, 0.013041973114013672, 0.013663530349731445, 0.014285087585449219, 0.014906644821166992, 0.015528202056884766, 0.01614975929260254, 0.016771316528320312, 0.017392873764038086, 0.01801443099975586, 0.018635988235473633, 0.019257545471191406, 0.01987910270690918, 0.020500659942626953, 0.021122217178344727, 0.0217437744140625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 1.0, 5.0, 5.0, 7.0, 9.0, 19.0, 19.0, 21.0, 37.0, 49.0, 73.0, 133.0, 204.0, 351.0, 588.0, 959.0, 1773.0, 3806.0, 9194.0, 29049.0, 154987.0, 736781.0, 76924.0, 19841.0, 7127.0, 3159.0, 1497.0, 798.0, 437.0, 248.0, 160.0, 88.0, 62.0, 34.0, 26.0, 15.0, 15.0, 10.0, 6.0, 4.0, 6.0, 5.0, 2.0, 4.0, 2.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005335807800292969, -0.0005159825086593628, -0.0004983842372894287, -0.00048078596591949463, -0.00046318769454956055, -0.00044558942317962646, -0.0004279911518096924, -0.0004103928804397583, -0.0003927946090698242, -0.00037519633769989014, -0.00035759806632995605, -0.00033999979496002197, -0.0003224015235900879, -0.0003048032522201538, -0.0002872049808502197, -0.00026960670948028564, -0.00025200843811035156, -0.00023441016674041748, -0.0002168118953704834, -0.00019921362400054932, -0.00018161535263061523, -0.00016401708126068115, -0.00014641880989074707, -0.000128820538520813, -0.0001112222671508789, -9.362399578094482e-05, -7.602572441101074e-05, -5.842745304107666e-05, -4.082918167114258e-05, -2.3230910301208496e-05, -5.632638931274414e-06, 1.1965632438659668e-05, 2.956390380859375e-05, 4.716217517852783e-05, 6.476044654846191e-05, 8.2358717918396e-05, 9.995698928833008e-05, 0.00011755526065826416, 0.00013515353202819824, 0.00015275180339813232, 0.0001703500747680664, 0.0001879483461380005, 0.00020554661750793457, 0.00022314488887786865, 0.00024074316024780273, 0.0002583414316177368, 0.0002759397029876709, 0.000293537974357605, 0.00031113624572753906, 0.00032873451709747314, 0.0003463327884674072, 0.0003639310598373413, 0.0003815293312072754, 0.00039912760257720947, 0.00041672587394714355, 0.00043432414531707764, 0.0004519224166870117, 0.0004695206880569458, 0.0004871189594268799, 0.000504717230796814, 0.000522315502166748, 0.0005399137735366821, 0.0005575120449066162, 0.0005751103162765503, 0.0005927085876464844]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 7.0, 0.0, 11.0, 0.0, 0.0, 11.0, 0.0, 27.0, 0.0, 31.0, 0.0, 51.0, 0.0, 117.0, 0.0, 0.0, 166.0, 0.0, 166.0, 0.0, 149.0, 0.0, 103.0, 0.0, 77.0, 0.0, 0.0, 33.0, 0.0, 21.0, 0.0, 16.0, 0.0, 11.0, 0.0, 10.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.5367431640625e-07, -9.266659617424011e-07, -8.996576070785522e-07, -8.726492524147034e-07, -8.456408977508545e-07, -8.186325430870056e-07, -7.916241884231567e-07, -7.646158337593079e-07, -7.37607479095459e-07, -7.105991244316101e-07, -6.835907697677612e-07, -6.565824151039124e-07, -6.295740604400635e-07, -6.025657057762146e-07, -5.755573511123657e-07, -5.485489964485168e-07, -5.21540641784668e-07, -4.945322871208191e-07, -4.675239324569702e-07, -4.4051557779312134e-07, -4.1350722312927246e-07, -3.864988684654236e-07, -3.594905138015747e-07, -3.3248215913772583e-07, -3.0547380447387695e-07, -2.784654498100281e-07, -2.514570951461792e-07, -2.2444874048233032e-07, -1.9744038581848145e-07, -1.7043203115463257e-07, -1.434236764907837e-07, -1.1641532182693481e-07, -8.940696716308594e-08, -6.239861249923706e-08, -3.5390257835388184e-08, -8.381903171539307e-09, 1.862645149230957e-08, 4.563480615615845e-08, 7.264316082000732e-08, 9.96515154838562e-08, 1.2665987014770508e-07, 1.5366822481155396e-07, 1.8067657947540283e-07, 2.076849341392517e-07, 2.3469328880310059e-07, 2.6170164346694946e-07, 2.8870999813079834e-07, 3.157183527946472e-07, 3.427267074584961e-07, 3.6973506212234497e-07, 3.9674341678619385e-07, 4.237517714500427e-07, 4.507601261138916e-07, 4.777684807777405e-07, 5.047768354415894e-07, 5.317851901054382e-07, 5.587935447692871e-07, 5.85801899433136e-07, 6.128102540969849e-07, 6.398186087608337e-07, 6.668269634246826e-07, 6.938353180885315e-07, 7.208436727523804e-07, 7.478520274162292e-07, 7.748603820800781e-07]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 2.0, 6.0, 6.0, 8.0, 18.0, 34.0, 41.0, 75.0, 93.0, 120.0, 181.0, 251.0, 422.0, 600.0, 962.0, 1506.0, 2388.0, 3647.0, 6554.0, 12364.0, 28031.0, 89489.0, 695900.0, 135841.0, 36170.0, 14901.0, 7387.0, 4256.0, 2576.0, 1635.0, 1046.0, 682.0, 424.0, 305.0, 194.0, 137.0, 96.0, 69.0, 43.0, 33.0, 20.0, 10.0, 16.0, 5.0, 5.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005345344543457031, -0.0005181506276130676, -0.0005017668008804321, -0.00048538297414779663, -0.00046899914741516113, -0.00045261532068252563, -0.00043623149394989014, -0.00041984766721725464, -0.00040346384048461914, -0.00038708001375198364, -0.00037069618701934814, -0.00035431236028671265, -0.00033792853355407715, -0.00032154470682144165, -0.00030516088008880615, -0.00028877705335617065, -0.00027239322662353516, -0.00025600939989089966, -0.00023962557315826416, -0.00022324174642562866, -0.00020685791969299316, -0.00019047409296035767, -0.00017409026622772217, -0.00015770643949508667, -0.00014132261276245117, -0.00012493878602981567, -0.00010855495929718018, -9.217113256454468e-05, -7.578730583190918e-05, -5.940347909927368e-05, -4.3019652366638184e-05, -2.6635825634002686e-05, -1.0251998901367188e-05, 6.1318278312683105e-06, 2.251565456390381e-05, 3.889948129653931e-05, 5.5283308029174805e-05, 7.16671347618103e-05, 8.80509614944458e-05, 0.0001044347882270813, 0.0001208186149597168, 0.0001372024416923523, 0.0001535862684249878, 0.0001699700951576233, 0.0001863539218902588, 0.0002027377486228943, 0.00021912157535552979, 0.00023550540208816528, 0.0002518892288208008, 0.0002682730555534363, 0.0002846568822860718, 0.0003010407090187073, 0.0003174245357513428, 0.00033380836248397827, 0.00035019218921661377, 0.00036657601594924927, 0.00038295984268188477, 0.00039934366941452026, 0.00041572749614715576, 0.00043211132287979126, 0.00044849514961242676, 0.00046487897634506226, 0.00048126280307769775, 0.0004976466298103333, 0.0005140304565429688]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 3.0, 7.0, 10.0, 5.0, 9.0, 10.0, 18.0, 19.0, 31.0, 32.0, 57.0, 90.0, 130.0, 210.0, 100.0, 69.0, 59.0, 31.0, 26.0, 15.0, 16.0, 8.0, 10.0, 6.0, 3.0, 4.0, 0.0, 7.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001468658447265625, -0.00014146976172924042, -0.00013607367873191833, -0.00013067759573459625, -0.00012528151273727417, -0.00011988542973995209, -0.00011448934674263, -0.00010909326374530792, -0.00010369718074798584, -9.830109775066376e-05, -9.290501475334167e-05, -8.750893175601959e-05, -8.211284875869751e-05, -7.671676576137543e-05, -7.132068276405334e-05, -6.592459976673126e-05, -6.052851676940918e-05, -5.51324337720871e-05, -4.9736350774765015e-05, -4.434026777744293e-05, -3.894418478012085e-05, -3.354810178279877e-05, -2.8152018785476685e-05, -2.2755935788154602e-05, -1.735985279083252e-05, -1.1963769793510437e-05, -6.5676867961883545e-06, -1.171603798866272e-06, 4.2244791984558105e-06, 9.620562195777893e-06, 1.5016645193099976e-05, 2.0412728190422058e-05, 2.580881118774414e-05, 3.120489418506622e-05, 3.6600977182388306e-05, 4.199706017971039e-05, 4.739314317703247e-05, 5.278922617435455e-05, 5.8185309171676636e-05, 6.358139216899872e-05, 6.89774751663208e-05, 7.437355816364288e-05, 7.976964116096497e-05, 8.516572415828705e-05, 9.056180715560913e-05, 9.595789015293121e-05, 0.0001013539731502533, 0.00010675005614757538, 0.00011214613914489746, 0.00011754222214221954, 0.00012293830513954163, 0.0001283343881368637, 0.0001337304711341858, 0.00013912655413150787, 0.00014452263712882996, 0.00014991872012615204, 0.00015531480312347412, 0.0001607108861207962, 0.00016610696911811829, 0.00017150305211544037, 0.00017689913511276245, 0.00018229521811008453, 0.00018769130110740662, 0.0001930873841047287, 0.00019848346710205078]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 7.0, 6.0, 9.0, 11.0, 15.0, 23.0, 24.0, 51.0, 63.0, 116.0, 248.0, 165.0, 79.0, 59.0, 26.0, 25.0, 15.0, 15.0, 11.0, 7.0, 6.0, 7.0, 2.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01152532547712326, -0.011193783953785896, -0.010862241499125957, -0.010530699044466019, -0.010199157521128654, -0.00986761599779129, -0.009536073543131351, -0.009204531088471413, -0.008872989565134048, -0.008541448041796684, -0.008209905587136745, -0.007878363132476807, -0.0075468216091394424, -0.007215279620140791, -0.0068837376311421394, -0.006552195642143488, -0.006220653653144836, -0.005889111664146185, -0.005557569675147533, -0.005226027686148882, -0.00489448569715023, -0.004562943708151579, -0.004231401719152927, -0.003899859730154276, -0.0035683177411556244, -0.003236775752156973, -0.0029052337631583214, -0.00257369177415967, -0.0022421497851610184, -0.0019106077961623669, -0.0015790658071637154, -0.0012475238181650639, -0.0009159818291664124, -0.0005844398401677608, -0.00025289785116910934, 7.864413782954216e-05, 0.00041018612682819366, 0.0007417281158268452, 0.0010732701048254967, 0.0014048120938241482, 0.0017363540828227997, 0.002067896071821451, 0.0023994380608201027, 0.002730980049818754, 0.0030625220388174057, 0.003394064027816057, 0.0037256060168147087, 0.00405714800581336, 0.004388689994812012, 0.004720231983810663, 0.005051773972809315, 0.005383315961807966, 0.005714857950806618, 0.006046399939805269, 0.006377941928803921, 0.006709483917802572, 0.007041025906801224, 0.007372567895799875, 0.007704109884798527, 0.008035652339458466, 0.00836719386279583, 0.008698735386133194, 0.009030277840793133, 0.009361820295453072, 0.009693361818790436]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 12.0, 17.0, 23.0, 41.0, 62.0, 86.0, 98.0, 117.0, 119.0, 102.0, 91.0, 86.0, 55.0, 38.0, 24.0, 12.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007988784462213516, -0.007580973673611879, -0.0071731628850102425, -0.006765352562069893, -0.006357541773468256, -0.005949730984866619, -0.005541920196264982, -0.005134109407663345, -0.004726299084722996, -0.004318488296121359, -0.003910677507519722, -0.0035028669517487288, -0.0030950563959777355, -0.0026872456073760986, -0.0022794348187744617, -0.0018716242630034685, -0.001463813241571188, -0.001056002569384873, -0.0006481918389908969, -0.00024038110859692097, 0.0001674295635893941, 0.0005752402357757092, 0.000983051024377346, 0.0013908615801483393, 0.0017986723687499762, 0.002206483157351613, 0.0026142937131226063, 0.003022104501724243, 0.00342991529032588, 0.0038377258460968733, 0.0042455364018678665, 0.004653347190469503, 0.00506115797907114, 0.005468968767672777, 0.005876779556274414, 0.006284589879214764, 0.0066924006678164005, 0.007100211456418037, 0.007508022245019674, 0.007915833033621311, 0.00832364335656166, 0.00873145367950201, 0.009139264933764935, 0.009547075256705284, 0.009954886510968208, 0.010362696833908558, 0.010770507156848907, 0.011178318411111832, 0.011586129665374756, 0.011993939988315105, 0.01240175124257803, 0.01280956156551838, 0.013217372819781303, 0.013625183142721653, 0.014032993465662003, 0.014440804719924927, 0.014848615042865276, 0.015256425365805626, 0.01566423662006855, 0.016072047874331474, 0.01647985726594925, 0.016887668520212173, 0.017295479774475098, 0.017703289166092873, 0.018111100420355797]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 7.0, 8.0, 11.0, 5.0, 4.0, 8.0, 9.0, 17.0, 14.0, 20.0, 20.0, 20.0, 29.0, 33.0, 44.0, 70.0, 164.0, 580.0, 2774.0, 33461.0, 925468.0, 79419.0, 4985.0, 807.0, 254.0, 71.0, 43.0, 35.0, 30.0, 27.0, 18.0, 13.0, 14.0, 17.0, 14.0, 9.0, 6.0, 12.0, 7.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.047637939453125, -0.04633760452270508, -0.045037269592285156, -0.043736934661865234, -0.04243659973144531, -0.04113626480102539, -0.03983592987060547, -0.03853559494018555, -0.037235260009765625, -0.0359349250793457, -0.03463459014892578, -0.03333425521850586, -0.03203392028808594, -0.030733585357666016, -0.029433250427246094, -0.028132915496826172, -0.02683258056640625, -0.025532245635986328, -0.024231910705566406, -0.022931575775146484, -0.021631240844726562, -0.02033090591430664, -0.01903057098388672, -0.017730236053466797, -0.016429901123046875, -0.015129566192626953, -0.013829231262207031, -0.01252889633178711, -0.011228561401367188, -0.009928226470947266, -0.008627891540527344, -0.007327556610107422, -0.0060272216796875, -0.004726886749267578, -0.0034265518188476562, -0.0021262168884277344, -0.0008258819580078125, 0.0004744529724121094, 0.0017747879028320312, 0.003075122833251953, 0.004375457763671875, 0.005675792694091797, 0.006976127624511719, 0.00827646255493164, 0.009576797485351562, 0.010877132415771484, 0.012177467346191406, 0.013477802276611328, 0.01477813720703125, 0.016078472137451172, 0.017378807067871094, 0.018679141998291016, 0.019979476928710938, 0.02127981185913086, 0.02258014678955078, 0.023880481719970703, 0.025180816650390625, 0.026481151580810547, 0.02778148651123047, 0.02908182144165039, 0.030382156372070312, 0.031682491302490234, 0.032982826232910156, 0.03428316116333008, 0.03558349609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 16.0, 36.0, 68.0, 121.0, 195.0, 251.0, 138.0, 92.0, 47.0, 26.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002166748046875, -0.0019745826721191406, -0.0017824172973632812, -0.0015902519226074219, -0.0013980865478515625, -0.0012059211730957031, -0.0010137557983398438, -0.0008215904235839844, -0.000629425048828125, -0.0004372596740722656, -0.00024509429931640625, -5.2928924560546875e-05, 0.0001392364501953125, 0.0003314018249511719, 0.0005235671997070312, 0.0007157325744628906, 0.00090789794921875, 0.0011000633239746094, 0.0012922286987304688, 0.0014843940734863281, 0.0016765594482421875, 0.0018687248229980469, 0.0020608901977539062, 0.0022530555725097656, 0.002445220947265625, 0.0026373863220214844, 0.0028295516967773438, 0.003021717071533203, 0.0032138824462890625, 0.003406047821044922, 0.0035982131958007812, 0.0037903785705566406, 0.0039825439453125, 0.004174709320068359, 0.004366874694824219, 0.004559040069580078, 0.0047512054443359375, 0.004943370819091797, 0.005135536193847656, 0.005327701568603516, 0.005519866943359375, 0.005712032318115234, 0.005904197692871094, 0.006096363067626953, 0.0062885284423828125, 0.006480693817138672, 0.006672859191894531, 0.006865024566650391, 0.00705718994140625, 0.007249355316162109, 0.007441520690917969, 0.007633686065673828, 0.007825851440429688, 0.008018016815185547, 0.008210182189941406, 0.008402347564697266, 0.008594512939453125, 0.008786678314208984, 0.008978843688964844, 0.009171009063720703, 0.009363174438476562, 0.009555339813232422, 0.009747505187988281, 0.00993967056274414, 0.0101318359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 7.0, 4.0, 12.0, 16.0, 23.0, 25.0, 41.0, 68.0, 94.0, 156.0, 210.0, 316.0, 486.0, 763.0, 1287.0, 1969.0, 3272.0, 5341.0, 8947.0, 15721.0, 28656.0, 56378.0, 135122.0, 484243.0, 166566.0, 64439.0, 31631.0, 17485.0, 10002.0, 5778.0, 3556.0, 2195.0, 1269.0, 845.0, 522.0, 355.0, 253.0, 160.0, 106.0, 67.0, 57.0, 41.0, 25.0, 10.0, 16.0, 9.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.004161834716796875, -0.004037916660308838, -0.003913998603820801, -0.0037900805473327637, -0.0036661624908447266, -0.0035422444343566895, -0.0034183263778686523, -0.0032944083213806152, -0.003170490264892578, -0.003046572208404541, -0.002922654151916504, -0.002798736095428467, -0.0026748180389404297, -0.0025508999824523926, -0.0024269819259643555, -0.0023030638694763184, -0.0021791458129882812, -0.002055227756500244, -0.001931309700012207, -0.00180739164352417, -0.0016834735870361328, -0.0015595555305480957, -0.0014356374740600586, -0.0013117194175720215, -0.0011878013610839844, -0.0010638833045959473, -0.0009399652481079102, -0.000816047191619873, -0.0006921291351318359, -0.0005682110786437988, -0.0004442930221557617, -0.0003203749656677246, -0.0001964569091796875, -7.253885269165039e-05, 5.137920379638672e-05, 0.00017529726028442383, 0.00029921531677246094, 0.00042313337326049805, 0.0005470514297485352, 0.0006709694862365723, 0.0007948875427246094, 0.0009188055992126465, 0.0010427236557006836, 0.0011666417121887207, 0.0012905597686767578, 0.001414477825164795, 0.001538395881652832, 0.0016623139381408691, 0.0017862319946289062, 0.0019101500511169434, 0.0020340681076049805, 0.0021579861640930176, 0.0022819042205810547, 0.002405822277069092, 0.002529740333557129, 0.002653658390045166, 0.002777576446533203, 0.0029014945030212402, 0.0030254125595092773, 0.0031493306159973145, 0.0032732486724853516, 0.0033971667289733887, 0.0035210847854614258, 0.003645002841949463, 0.0037689208984375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 8.0, 12.0, 14.0, 18.0, 11.0, 20.0, 18.0, 23.0, 36.0, 32.0, 29.0, 37.0, 38.0, 46.0, 60.0, 77.0, 68.0, 70.0, 55.0, 38.0, 46.0, 42.0, 31.0, 22.0, 19.0, 19.0, 13.0, 18.0, 18.0, 18.0, 12.0, 6.0, 6.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0026416778564453125, -0.0025619566440582275, -0.0024822354316711426, -0.0024025142192840576, -0.0023227930068969727, -0.0022430717945098877, -0.0021633505821228027, -0.0020836293697357178, -0.002003908157348633, -0.0019241869449615479, -0.0018444657325744629, -0.001764744520187378, -0.001685023307800293, -0.001605302095413208, -0.001525580883026123, -0.001445859670639038, -0.0013661384582519531, -0.0012864172458648682, -0.0012066960334777832, -0.0011269748210906982, -0.0010472536087036133, -0.0009675323963165283, -0.0008878111839294434, -0.0008080899715423584, -0.0007283687591552734, -0.0006486475467681885, -0.0005689263343811035, -0.0004892051219940186, -0.0004094839096069336, -0.00032976269721984863, -0.00025004148483276367, -0.0001703202724456787, -9.059906005859375e-05, -1.0877847671508789e-05, 6.884336471557617e-05, 0.00014856457710266113, 0.0002282857894897461, 0.00030800700187683105, 0.000387728214263916, 0.000467449426651001, 0.0005471706390380859, 0.0006268918514251709, 0.0007066130638122559, 0.0007863342761993408, 0.0008660554885864258, 0.0009457767009735107, 0.0010254979133605957, 0.0011052191257476807, 0.0011849403381347656, 0.0012646615505218506, 0.0013443827629089355, 0.0014241039752960205, 0.0015038251876831055, 0.0015835464000701904, 0.0016632676124572754, 0.0017429888248443604, 0.0018227100372314453, 0.0019024312496185303, 0.0019821524620056152, 0.0020618736743927, 0.002141594886779785, 0.00222131609916687, 0.002301037311553955, 0.00238075852394104, 0.002460479736328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 11.0, 15.0, 21.0, 25.0, 33.0, 59.0, 90.0, 104.0, 203.0, 327.0, 599.0, 1145.0, 2883.0, 7856.0, 28234.0, 239023.0, 699372.0, 49219.0, 11948.0, 4031.0, 1587.0, 741.0, 420.0, 193.0, 149.0, 77.0, 47.0, 47.0, 20.0, 15.0, 12.0, 12.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00022876262664794922, -0.00022186525166034698, -0.00021496787667274475, -0.00020807050168514252, -0.00020117312669754028, -0.00019427575170993805, -0.00018737837672233582, -0.00018048100173473358, -0.00017358362674713135, -0.00016668625175952911, -0.00015978887677192688, -0.00015289150178432465, -0.0001459941267967224, -0.00013909675180912018, -0.00013219937682151794, -0.0001253020018339157, -0.00011840462684631348, -0.00011150725185871124, -0.00010460987687110901, -9.771250188350677e-05, -9.081512689590454e-05, -8.391775190830231e-05, -7.702037692070007e-05, -7.012300193309784e-05, -6.32256269454956e-05, -5.632825195789337e-05, -4.943087697029114e-05, -4.2533501982688904e-05, -3.563612699508667e-05, -2.8738752007484436e-05, -2.1841377019882202e-05, -1.4944002032279968e-05, -8.046627044677734e-06, -1.1492520570755005e-06, 5.748122930526733e-06, 1.2645497918128967e-05, 1.95428729057312e-05, 2.6440247893333435e-05, 3.333762288093567e-05, 4.02349978685379e-05, 4.713237285614014e-05, 5.402974784374237e-05, 6.0927122831344604e-05, 6.782449781894684e-05, 7.472187280654907e-05, 8.16192477941513e-05, 8.851662278175354e-05, 9.541399776935577e-05, 0.00010231137275695801, 0.00010920874774456024, 0.00011610612273216248, 0.0001230034977197647, 0.00012990087270736694, 0.00013679824769496918, 0.0001436956226825714, 0.00015059299767017365, 0.00015749037265777588, 0.0001643877476453781, 0.00017128512263298035, 0.00017818249762058258, 0.00018507987260818481, 0.00019197724759578705, 0.00019887462258338928, 0.00020577199757099152, 0.00021266937255859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 232.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 321.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 242.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 19.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0], "bins": [-2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07, 1.862645149230957e-07, 1.9371509552001953e-07, 2.0116567611694336e-07, 2.086162567138672e-07, 2.1606683731079102e-07, 2.2351741790771484e-07, 2.3096799850463867e-07, 2.384185791015625e-07]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 11.0, 10.0, 19.0, 27.0, 29.0, 56.0, 49.0, 69.0, 102.0, 154.0, 190.0, 278.0, 363.0, 472.0, 652.0, 964.0, 1300.0, 1903.0, 2866.0, 3994.0, 6565.0, 10651.0, 18134.0, 36027.0, 86448.0, 362416.0, 349572.0, 82810.0, 33868.0, 18148.0, 10519.0, 6258.0, 4212.0, 2787.0, 1903.0, 1289.0, 931.0, 669.0, 479.0, 369.0, 222.0, 212.0, 144.0, 102.0, 98.0, 62.0, 46.0, 28.0, 23.0, 14.0, 17.0, 11.0, 4.0, 5.0, 3.0, 2.0], "bins": [-8.64267349243164e-05, -8.388329297304153e-05, -8.133985102176666e-05, -7.879640907049179e-05, -7.625296711921692e-05, -7.370952516794205e-05, -7.116608321666718e-05, -6.86226412653923e-05, -6.607919931411743e-05, -6.353575736284256e-05, -6.099231541156769e-05, -5.8448873460292816e-05, -5.5905431509017944e-05, -5.336198955774307e-05, -5.08185476064682e-05, -4.827510565519333e-05, -4.573166370391846e-05, -4.3188221752643585e-05, -4.064477980136871e-05, -3.810133785009384e-05, -3.555789589881897e-05, -3.30144539475441e-05, -3.0471011996269226e-05, -2.7927570044994354e-05, -2.5384128093719482e-05, -2.284068614244461e-05, -2.029724419116974e-05, -1.7753802239894867e-05, -1.5210360288619995e-05, -1.2666918337345123e-05, -1.0123476386070251e-05, -7.58003443479538e-06, -5.036592483520508e-06, -2.493150532245636e-06, 5.029141902923584e-08, 2.5937333703041077e-06, 5.1371753215789795e-06, 7.680617272853851e-06, 1.0224059224128723e-05, 1.2767501175403595e-05, 1.5310943126678467e-05, 1.785438507795334e-05, 2.039782702922821e-05, 2.2941268980503082e-05, 2.5484710931777954e-05, 2.8028152883052826e-05, 3.05715948343277e-05, 3.311503678560257e-05, 3.565847873687744e-05, 3.820192068815231e-05, 4.0745362639427185e-05, 4.328880459070206e-05, 4.583224654197693e-05, 4.83756884932518e-05, 5.091913044452667e-05, 5.3462572395801544e-05, 5.6006014347076416e-05, 5.854945629835129e-05, 6.109289824962616e-05, 6.363634020090103e-05, 6.61797821521759e-05, 6.872322410345078e-05, 7.126666605472565e-05, 7.381010800600052e-05, 7.635354995727539e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 5.0, 6.0, 12.0, 7.0, 8.0, 14.0, 23.0, 19.0, 19.0, 26.0, 34.0, 58.0, 88.0, 120.0, 119.0, 100.0, 73.0, 49.0, 36.0, 30.0, 19.0, 24.0, 14.0, 14.0, 3.0, 13.0, 7.0, 14.0, 4.0, 4.0, 0.0, 6.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.318092346191406e-05, -6.128661334514618e-05, -5.9392303228378296e-05, -5.749799311161041e-05, -5.560368299484253e-05, -5.3709372878074646e-05, -5.181506276130676e-05, -4.992075264453888e-05, -4.8026442527770996e-05, -4.613213241100311e-05, -4.423782229423523e-05, -4.2343512177467346e-05, -4.044920206069946e-05, -3.855489194393158e-05, -3.6660581827163696e-05, -3.476627171039581e-05, -3.287196159362793e-05, -3.0977651476860046e-05, -2.9083341360092163e-05, -2.718903124332428e-05, -2.5294721126556396e-05, -2.3400411009788513e-05, -2.150610089302063e-05, -1.9611790776252747e-05, -1.7717480659484863e-05, -1.582317054271698e-05, -1.3928860425949097e-05, -1.2034550309181213e-05, -1.014024019241333e-05, -8.245930075645447e-06, -6.3516199588775635e-06, -4.45730984210968e-06, -2.562999725341797e-06, -6.686896085739136e-07, 1.2256205081939697e-06, 3.119930624961853e-06, 5.014240741729736e-06, 6.90855085849762e-06, 8.802860975265503e-06, 1.0697171092033386e-05, 1.259148120880127e-05, 1.4485791325569153e-05, 1.6380101442337036e-05, 1.827441155910492e-05, 2.0168721675872803e-05, 2.2063031792640686e-05, 2.395734190940857e-05, 2.5851652026176453e-05, 2.7745962142944336e-05, 2.964027225971222e-05, 3.15345823764801e-05, 3.3428892493247986e-05, 3.532320261001587e-05, 3.721751272678375e-05, 3.9111822843551636e-05, 4.100613296031952e-05, 4.29004430770874e-05, 4.4794753193855286e-05, 4.668906331062317e-05, 4.858337342739105e-05, 5.0477683544158936e-05, 5.237199366092682e-05, 5.42663037776947e-05, 5.6160613894462585e-05, 5.805492401123047e-05]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 12.0, 11.0, 12.0, 23.0, 30.0, 60.0, 102.0, 204.0, 287.0, 92.0, 64.0, 38.0, 24.0, 18.0, 6.0, 5.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.015387069433927536, -0.015003250911831856, -0.014619431458413601, -0.01423561293631792, -0.01385179441422224, -0.01346797589212656, -0.013084156438708305, -0.012700337916612625, -0.012316519394516945, -0.011932700872421265, -0.01154888141900301, -0.01116506289690733, -0.01078124437481165, -0.010397425852715969, -0.010013606399297714, -0.009629787877202034, -0.009245969355106354, -0.008862150833010674, -0.008478331379592419, -0.008094512857496738, -0.007710694335401058, -0.007326875347644091, -0.006943056359887123, -0.006559237837791443, -0.006175418384373188, -0.0057915993966162205, -0.00540778087452054, -0.005023961886763573, -0.0046401433646678925, -0.004256324376910925, -0.003872505621984601, -0.003488686867058277, -0.003104868344962597, -0.002721049590036273, -0.002337230835109949, -0.0019534118473529816, -0.0015695932088419795, -0.0011857744539156556, -0.0008019555825740099, -0.000418136827647686, -3.4318072721362114e-05, 0.00034950071130879223, 0.0007333194953389466, 0.0011171383084729314, 0.0015009570633992553, 0.0018847758183255792, 0.002268594689667225, 0.0026524134445935488, 0.0030362321995198727, 0.0034200509544461966, 0.0038038697093725204, 0.004187688697129488, 0.004571507219225168, 0.004955326206982136, 0.005339144729077816, 0.0057229637168347836, 0.006106782704591751, 0.006490601692348719, 0.006874420214444399, 0.007258239202201366, 0.007642057724297047, 0.008025876246392727, 0.008409695699810982, 0.008793514221906662, 0.009177332744002342]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 10.0, 4.0, 11.0, 26.0, 31.0, 42.0, 46.0, 54.0, 72.0, 75.0, 77.0, 98.0, 65.0, 71.0, 73.0, 66.0, 48.0, 43.0, 37.0, 21.0, 17.0, 10.0, 12.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003933199215680361, -0.0036793570034205914, -0.003425514791160822, -0.0031716725789010525, -0.002917830366641283, -0.0026639881543815136, -0.0024101457092911005, -0.002156303497031331, -0.0019024612847715616, -0.0016486190725117922, -0.0013947768602520227, -0.0011409345315769315, -0.000887092319317162, -0.0006332501070573926, -0.00037940777838230133, -0.0001255655661225319, 0.00012827664613723755, 0.00038211888750083745, 0.0006359611288644373, 0.0008898033993318677, 0.0011436456115916371, 0.0013974878238514066, 0.0016513301525264978, 0.0019051723647862673, 0.0021590145770460367, 0.002412856789305806, 0.0026666990015655756, 0.0029205414466559887, 0.003174383658915758, 0.0034282258711755276, 0.003682068083435297, 0.0039359102956950665, 0.004189752042293549, 0.004443594254553318, 0.0046974364668130875, 0.004951278679072857, 0.005205120891332626, 0.005458963103592396, 0.005712805315852165, 0.005966647528111935, 0.006220489740371704, 0.0064743319526314735, 0.006728174164891243, 0.006982016377151012, 0.007235858589410782, 0.007489700801670551, 0.007743543013930321, 0.00799738522619009, 0.00825122743844986, 0.008505069650709629, 0.008758911862969398, 0.009012754075229168, 0.009266596287488937, 0.009520438499748707, 0.009774280712008476, 0.010028122924268246, 0.01028196606785059, 0.01053580828011036, 0.010789650492370129, 0.011043492704629898, 0.011297334916889668, 0.011551177129149437, 0.011805019341409206, 0.012058861553668976, 0.012312703765928745]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 15.0, 12.0, 14.0, 25.0, 23.0, 41.0, 63.0, 74.0, 124.0, 150.0, 220.0, 281.0, 411.0, 652.0, 934.0, 1603.0, 2511.0, 4370.0, 8042.0, 15738.0, 36737.0, 455475.0, 3542501.0, 74786.0, 23556.0, 11090.0, 5887.0, 3276.0, 1914.0, 1220.0, 782.0, 503.0, 340.0, 243.0, 173.0, 129.0, 96.0, 61.0, 52.0, 36.0, 33.0, 17.0, 16.0, 12.0, 13.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.005352020263671875, -0.005180835723876953, -0.005009651184082031, -0.004838466644287109, -0.0046672821044921875, -0.004496097564697266, -0.004324913024902344, -0.004153728485107422, -0.0039825439453125, -0.003811359405517578, -0.0036401748657226562, -0.0034689903259277344, -0.0032978057861328125, -0.0031266212463378906, -0.0029554367065429688, -0.002784252166748047, -0.002613067626953125, -0.002441883087158203, -0.0022706985473632812, -0.0020995140075683594, -0.0019283294677734375, -0.0017571449279785156, -0.0015859603881835938, -0.0014147758483886719, -0.00124359130859375, -0.0010724067687988281, -0.0009012222290039062, -0.0007300376892089844, -0.0005588531494140625, -0.0003876686096191406, -0.00021648406982421875, -4.5299530029296875e-05, 0.000125885009765625, 0.0002970695495605469, 0.00046825408935546875, 0.0006394386291503906, 0.0008106231689453125, 0.0009818077087402344, 0.0011529922485351562, 0.0013241767883300781, 0.001495361328125, 0.0016665458679199219, 0.0018377304077148438, 0.0020089149475097656, 0.0021800994873046875, 0.0023512840270996094, 0.0025224685668945312, 0.002693653106689453, 0.002864837646484375, 0.003036022186279297, 0.0032072067260742188, 0.0033783912658691406, 0.0035495758056640625, 0.0037207603454589844, 0.0038919448852539062, 0.004063129425048828, 0.00423431396484375, 0.004405498504638672, 0.004576683044433594, 0.004747867584228516, 0.0049190521240234375, 0.005090236663818359, 0.005261421203613281, 0.005432605743408203, 0.005603790283203125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 7.0, 5.0, 7.0, 14.0, 10.0, 21.0, 23.0, 15.0, 17.0, 21.0, 30.0, 23.0, 25.0, 40.0, 26.0, 37.0, 40.0, 53.0, 66.0, 80.0, 41.0, 35.0, 40.0, 36.0, 37.0, 28.0, 31.0, 29.0, 22.0, 20.0, 16.0, 16.0, 15.0, 18.0, 11.0, 11.0, 7.0, 6.0, 5.0, 5.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009393692016601562, -0.0009093433618545532, -0.0008793175220489502, -0.0008492916822433472, -0.0008192658424377441, -0.0007892400026321411, -0.0007592141628265381, -0.0007291883230209351, -0.000699162483215332, -0.000669136643409729, -0.000639110803604126, -0.000609084963798523, -0.0005790591239929199, -0.0005490332841873169, -0.0005190074443817139, -0.0004889816045761108, -0.0004589557647705078, -0.0004289299249649048, -0.00039890408515930176, -0.00036887824535369873, -0.0003388524055480957, -0.0003088265657424927, -0.00027880072593688965, -0.0002487748861312866, -0.0002187490463256836, -0.00018872320652008057, -0.00015869736671447754, -0.0001286715269088745, -9.864568710327148e-05, -6.861984729766846e-05, -3.859400749206543e-05, -8.568167686462402e-06, 2.1457672119140625e-05, 5.148351192474365e-05, 8.150935173034668e-05, 0.00011153519153594971, 0.00014156103134155273, 0.00017158687114715576, 0.0002016127109527588, 0.00023163855075836182, 0.00026166439056396484, 0.00029169023036956787, 0.0003217160701751709, 0.0003517419099807739, 0.00038176774978637695, 0.00041179358959198, 0.000441819429397583, 0.00047184526920318604, 0.0005018711090087891, 0.0005318969488143921, 0.0005619227886199951, 0.0005919486284255981, 0.0006219744682312012, 0.0006520003080368042, 0.0006820261478424072, 0.0007120519876480103, 0.0007420778274536133, 0.0007721036672592163, 0.0008021295070648193, 0.0008321553468704224, 0.0008621811866760254, 0.0008922070264816284, 0.0009222328662872314, 0.0009522587060928345, 0.0009822845458984375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 9.0, 5.0, 13.0, 11.0, 15.0, 10.0, 22.0, 26.0, 30.0, 44.0, 65.0, 91.0, 168.0, 306.0, 553.0, 1047.0, 2158.0, 4394.0, 9819.0, 24206.0, 76217.0, 1449726.0, 2510278.0, 74833.0, 23175.0, 9163.0, 3905.0, 1884.0, 888.0, 478.0, 263.0, 160.0, 90.0, 62.0, 38.0, 29.0, 21.0, 19.0, 13.0, 12.0, 7.0, 9.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.004398345947265625, -0.004265129566192627, -0.004131913185119629, -0.003998696804046631, -0.003865480422973633, -0.0037322640419006348, -0.0035990476608276367, -0.0034658312797546387, -0.0033326148986816406, -0.0031993985176086426, -0.0030661821365356445, -0.0029329657554626465, -0.0027997493743896484, -0.0026665329933166504, -0.0025333166122436523, -0.0024001002311706543, -0.0022668838500976562, -0.002133667469024658, -0.00200045108795166, -0.0018672347068786621, -0.001734018325805664, -0.001600801944732666, -0.001467585563659668, -0.00133436918258667, -0.0012011528015136719, -0.0010679364204406738, -0.0009347200393676758, -0.0008015036582946777, -0.0006682872772216797, -0.0005350708961486816, -0.0004018545150756836, -0.00026863813400268555, -0.0001354217529296875, -2.205371856689453e-06, 0.0001310110092163086, 0.00026422739028930664, 0.0003974437713623047, 0.0005306601524353027, 0.0006638765335083008, 0.0007970929145812988, 0.0009303092956542969, 0.001063525676727295, 0.001196742057800293, 0.001329958438873291, 0.001463174819946289, 0.0015963912010192871, 0.0017296075820922852, 0.0018628239631652832, 0.0019960403442382812, 0.0021292567253112793, 0.0022624731063842773, 0.0023956894874572754, 0.0025289058685302734, 0.0026621222496032715, 0.0027953386306762695, 0.0029285550117492676, 0.0030617713928222656, 0.0031949877738952637, 0.0033282041549682617, 0.0034614205360412598, 0.003594636917114258, 0.003727853298187256, 0.003861069679260254, 0.003994286060333252, 0.00412750244140625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 7.0, 5.0, 7.0, 15.0, 19.0, 32.0, 44.0, 68.0, 162.0, 1005.0, 1954.0, 333.0, 141.0, 89.0, 58.0, 36.0, 35.0, 20.0, 11.0, 13.0, 13.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020771026611328125, -0.002000570297241211, -0.0019240379333496094, -0.0018475055694580078, -0.0017709732055664062, -0.0016944408416748047, -0.0016179084777832031, -0.0015413761138916016, -0.00146484375, -0.0013883113861083984, -0.0013117790222167969, -0.0012352466583251953, -0.0011587142944335938, -0.0010821819305419922, -0.0010056495666503906, -0.0009291172027587891, -0.0008525848388671875, -0.0007760524749755859, -0.0006995201110839844, -0.0006229877471923828, -0.0005464553833007812, -0.0004699230194091797, -0.0003933906555175781, -0.00031685829162597656, -0.000240325927734375, -0.00016379356384277344, -8.726119995117188e-05, -1.0728836059570312e-05, 6.580352783203125e-05, 0.0001423358917236328, 0.00021886825561523438, 0.00029540061950683594, 0.0003719329833984375, 0.00044846534729003906, 0.0005249977111816406, 0.0006015300750732422, 0.0006780624389648438, 0.0007545948028564453, 0.0008311271667480469, 0.0009076595306396484, 0.00098419189453125, 0.0010607242584228516, 0.0011372566223144531, 0.0012137889862060547, 0.0012903213500976562, 0.0013668537139892578, 0.0014433860778808594, 0.001519918441772461, 0.0015964508056640625, 0.001672983169555664, 0.0017495155334472656, 0.0018260478973388672, 0.0019025802612304688, 0.0019791126251220703, 0.002055644989013672, 0.0021321773529052734, 0.002208709716796875, 0.0022852420806884766, 0.002361774444580078, 0.0024383068084716797, 0.0025148391723632812, 0.002591371536254883, 0.0026679039001464844, 0.002744436264038086, 0.0028209686279296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 8.0, 13.0, 14.0, 14.0, 19.0, 35.0, 41.0, 74.0, 103.0, 225.0, 118.0, 55.0, 59.0, 37.0, 32.0, 19.0, 19.0, 19.0, 14.0, 14.0, 8.0, 10.0, 9.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.004662953782826662, -0.00450569111853838, -0.004348428454250097, -0.004191165789961815, -0.0040339031256735325, -0.0038766406942158937, -0.0037193780299276114, -0.0035621155984699726, -0.00340485293418169, -0.003247590269893408, -0.0030903276056051254, -0.002933064941316843, -0.0027758025098592043, -0.002618539845570922, -0.0024612771812826395, -0.0023040147498250008, -0.0021467518527060747, -0.0019894891884177923, -0.0018322266405448318, -0.0016749639762565494, -0.0015177014283835888, -0.0013604387640953064, -0.001203176099807024, -0.0010459135519340634, -0.000888650887645781, -0.0007313882815651596, -0.0005741256754845381, -0.0004168630111962557, -0.0002596004051156342, -0.00010233779903501272, 5.492486525326967e-05, 0.00021218741312623024, 0.00036945007741451263, 0.0005267126834951341, 0.0006839752895757556, 0.000841237953864038, 0.0009985005017369986, 0.001155763166025281, 0.0013130258303135633, 0.001470288378186524, 0.0016275510424748063, 0.0017848137067630887, 0.0019420762546360493, 0.0020993389189243317, 0.002256601583212614, 0.0024138642475008965, 0.002571126911789179, 0.0027283893432468176, 0.0028856520075351, 0.0030429146718233824, 0.0032001773361116648, 0.0033574397675693035, 0.003514702431857586, 0.0036719650961458683, 0.0038292277604341507, 0.003986490424722433, 0.0041437530890107155, 0.004301015753298998, 0.00445827841758728, 0.004615541081875563, 0.004772803746163845, 0.00493006594479084, 0.00508732907474041, 0.005244591273367405, 0.005401853937655687]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 7.0, 2.0, 8.0, 14.0, 13.0, 11.0, 20.0, 25.0, 18.0, 36.0, 32.0, 42.0, 45.0, 46.0, 57.0, 62.0, 57.0, 55.0, 45.0, 42.0, 55.0, 41.0, 50.0, 32.0, 36.0, 26.0, 28.0, 16.0, 16.0, 15.0, 18.0, 5.0, 11.0, 4.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0035793466959148645, -0.003459329018369317, -0.0033393115736544132, -0.0032192938961088657, -0.0030992762185633183, -0.0029792585410177708, -0.002859241096302867, -0.0027392234187573195, -0.0026192059740424156, -0.002499188296496868, -0.0023791708517819643, -0.002259153174236417, -0.0021391354966908693, -0.0020191180519759655, -0.001899100374430418, -0.0017790826968848705, -0.001659065019339323, -0.0015390474582090974, -0.00141902978066355, -0.0012990122195333242, -0.0011789945419877768, -0.001058976980857551, -0.0009389594197273254, -0.0008189418003894389, -0.0006989241810515523, -0.0005789065617136657, -0.0004588889714796096, -0.0003388713812455535, -0.00021885376190766692, -9.883614256978035e-05, 2.118141856044531e-05, 0.00014119903789833188, 0.0002612168900668621, 0.0003812345094047487, 0.0005012521287426353, 0.0006212696898728609, 0.0007412873092107475, 0.000861304928548634, 0.0009813224896788597, 0.0011013401672244072, 0.0012213577283546329, 0.0013413752894848585, 0.001461392967030406, 0.0015814105281606317, 0.0017014280892908573, 0.0018214457668364048, 0.0019414633279666305, 0.002061480889096856, 0.0021814985666424036, 0.002301516244187951, 0.002421533688902855, 0.0025415513664484024, 0.00266156904399395, 0.0027815867215394974, 0.002901604166254401, 0.0030216218437999487, 0.0031416392885148525, 0.0032616569660604, 0.003381674410775304, 0.0035016920883208513, 0.003621709765866399, 0.0037417272105813026, 0.00386174488812685, 0.003981762565672398, 0.004101780243217945]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 2.0, 5.0, 11.0, 17.0, 15.0, 25.0, 27.0, 49.0, 90.0, 132.0, 183.0, 290.0, 485.0, 894.0, 1865.0, 5574.0, 18809.0, 86447.0, 722630.0, 167064.0, 30591.0, 8002.0, 2630.0, 1195.0, 593.0, 343.0, 220.0, 113.0, 71.0, 57.0, 28.0, 24.0, 19.0, 14.0, 9.0, 9.0, 8.0, 5.0, 7.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0007791519165039062, -0.0007545500993728638, -0.0007299482822418213, -0.0007053464651107788, -0.0006807446479797363, -0.0006561428308486938, -0.0006315410137176514, -0.0006069391965866089, -0.0005823373794555664, -0.0005577355623245239, -0.0005331337451934814, -0.000508531928062439, -0.0004839301109313965, -0.000459328293800354, -0.0004347264766693115, -0.00041012465953826904, -0.00038552284240722656, -0.0003609210252761841, -0.0003363192081451416, -0.0003117173910140991, -0.00028711557388305664, -0.00026251375675201416, -0.00023791193962097168, -0.0002133101224899292, -0.00018870830535888672, -0.00016410648822784424, -0.00013950467109680176, -0.00011490285396575928, -9.03010368347168e-05, -6.569921970367432e-05, -4.1097402572631836e-05, -1.6495585441589355e-05, 8.106231689453125e-06, 3.2708048820495605e-05, 5.7309865951538086e-05, 8.191168308258057e-05, 0.00010651350021362305, 0.00013111531734466553, 0.000155717134475708, 0.0001803189516067505, 0.00020492076873779297, 0.00022952258586883545, 0.00025412440299987793, 0.0002787262201309204, 0.0003033280372619629, 0.00032792985439300537, 0.00035253167152404785, 0.00037713348865509033, 0.0004017353057861328, 0.0004263371229171753, 0.0004509389400482178, 0.00047554075717926025, 0.0005001425743103027, 0.0005247443914413452, 0.0005493462085723877, 0.0005739480257034302, 0.0005985498428344727, 0.0006231516599655151, 0.0006477534770965576, 0.0006723552942276001, 0.0006969571113586426, 0.0007215589284896851, 0.0007461607456207275, 0.00077076256275177, 0.0007953643798828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 10.0, 9.0, 12.0, 23.0, 35.0, 55.0, 60.0, 70.0, 107.0, 168.0, 118.0, 64.0, 68.0, 67.0, 43.0, 36.0, 28.0, 17.0, 3.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00540924072265625, -0.00526273250579834, -0.00511622428894043, -0.0049697160720825195, -0.004823207855224609, -0.004676699638366699, -0.004530191421508789, -0.004383683204650879, -0.004237174987792969, -0.004090666770935059, -0.0039441585540771484, -0.0037976503372192383, -0.003651142120361328, -0.003504633903503418, -0.003358125686645508, -0.0032116174697875977, -0.0030651092529296875, -0.0029186010360717773, -0.002772092819213867, -0.002625584602355957, -0.002479076385498047, -0.0023325681686401367, -0.0021860599517822266, -0.0020395517349243164, -0.0018930435180664062, -0.001746535301208496, -0.001600027084350586, -0.0014535188674926758, -0.0013070106506347656, -0.0011605024337768555, -0.0010139942169189453, -0.0008674860000610352, -0.000720977783203125, -0.0005744695663452148, -0.0004279613494873047, -0.00028145313262939453, -0.00013494491577148438, 1.1563301086425781e-05, 0.00015807151794433594, 0.0003045797348022461, 0.00045108795166015625, 0.0005975961685180664, 0.0007441043853759766, 0.0008906126022338867, 0.0010371208190917969, 0.001183629035949707, 0.0013301372528076172, 0.0014766454696655273, 0.0016231536865234375, 0.0017696619033813477, 0.0019161701202392578, 0.002062678337097168, 0.002209186553955078, 0.0023556947708129883, 0.0025022029876708984, 0.0026487112045288086, 0.0027952194213867188, 0.002941727638244629, 0.003088235855102539, 0.0032347440719604492, 0.0033812522888183594, 0.0035277605056762695, 0.0036742687225341797, 0.00382077693939209, 0.00396728515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 10.0, 9.0, 11.0, 19.0, 35.0, 40.0, 48.0, 56.0, 89.0, 142.0, 257.0, 463.0, 932.0, 2600.0, 10210.0, 79954.0, 823170.0, 112000.0, 13062.0, 3126.0, 1071.0, 462.0, 210.0, 152.0, 108.0, 75.0, 39.0, 48.0, 31.0, 17.0, 23.0, 21.0, 16.0, 13.0, 7.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0009946823120117188, -0.0009621381759643555, -0.0009295940399169922, -0.0008970499038696289, -0.0008645057678222656, -0.0008319616317749023, -0.0007994174957275391, -0.0007668733596801758, -0.0007343292236328125, -0.0007017850875854492, -0.0006692409515380859, -0.0006366968154907227, -0.0006041526794433594, -0.0005716085433959961, -0.0005390644073486328, -0.0005065202713012695, -0.00047397613525390625, -0.00044143199920654297, -0.0004088878631591797, -0.0003763437271118164, -0.0003437995910644531, -0.00031125545501708984, -0.00027871131896972656, -0.0002461671829223633, -0.000213623046875, -0.00018107891082763672, -0.00014853477478027344, -0.00011599063873291016, -8.344650268554688e-05, -5.0902366638183594e-05, -1.8358230590820312e-05, 1.4185905456542969e-05, 4.673004150390625e-05, 7.927417755126953e-05, 0.00011181831359863281, 0.0001443624496459961, 0.00017690658569335938, 0.00020945072174072266, 0.00024199485778808594, 0.0002745389938354492, 0.0003070831298828125, 0.0003396272659301758, 0.00037217140197753906, 0.00040471553802490234, 0.0004372596740722656, 0.0004698038101196289, 0.0005023479461669922, 0.0005348920822143555, 0.0005674362182617188, 0.000599980354309082, 0.0006325244903564453, 0.0006650686264038086, 0.0006976127624511719, 0.0007301568984985352, 0.0007627010345458984, 0.0007952451705932617, 0.000827789306640625, 0.0008603334426879883, 0.0008928775787353516, 0.0009254217147827148, 0.0009579658508300781, 0.0009905099868774414, 0.0010230541229248047, 0.001055598258972168, 0.0010881423950195312]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 5.0, 24.0, 38.0, 86.0, 137.0, 165.0, 172.0, 125.0, 105.0, 66.0, 31.0, 12.0, 9.0, 10.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00792694091796875, -0.007465958595275879, -0.007004976272583008, -0.006543993949890137, -0.006083011627197266, -0.0056220293045043945, -0.0051610469818115234, -0.004700064659118652, -0.004239082336425781, -0.00377810001373291, -0.003317117691040039, -0.002856135368347168, -0.002395153045654297, -0.0019341707229614258, -0.0014731884002685547, -0.0010122060775756836, -0.0005512237548828125, -9.02414321899414e-05, 0.0003707408905029297, 0.0008317232131958008, 0.0012927055358886719, 0.001753687858581543, 0.002214670181274414, 0.002675652503967285, 0.0031366348266601562, 0.0035976171493530273, 0.0040585994720458984, 0.0045195817947387695, 0.004980564117431641, 0.005441546440124512, 0.005902528762817383, 0.006363511085510254, 0.006824493408203125, 0.007285475730895996, 0.007746458053588867, 0.008207440376281738, 0.00866842269897461, 0.00912940502166748, 0.009590387344360352, 0.010051369667053223, 0.010512351989746094, 0.010973334312438965, 0.011434316635131836, 0.011895298957824707, 0.012356281280517578, 0.01281726360321045, 0.01327824592590332, 0.013739228248596191, 0.014200210571289062, 0.014661192893981934, 0.015122175216674805, 0.015583157539367676, 0.016044139862060547, 0.016505122184753418, 0.01696610450744629, 0.01742708683013916, 0.01788806915283203, 0.018349051475524902, 0.018810033798217773, 0.019271016120910645, 0.019731998443603516, 0.020192980766296387, 0.020653963088989258, 0.02111494541168213, 0.021575927734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 5.0, 2.0, 7.0, 6.0, 14.0, 14.0, 15.0, 25.0, 41.0, 79.0, 89.0, 201.0, 265.0, 460.0, 799.0, 1453.0, 3231.0, 8308.0, 30579.0, 547633.0, 410120.0, 29668.0, 8367.0, 3372.0, 1598.0, 856.0, 488.0, 316.0, 179.0, 136.0, 73.0, 44.0, 19.0, 24.0, 22.0, 11.0, 3.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 4.0, 1.0, 2.0], "bins": [-7.832050323486328e-05, -7.601641118526459e-05, -7.37123191356659e-05, -7.14082270860672e-05, -6.91041350364685e-05, -6.680004298686981e-05, -6.449595093727112e-05, -6.219185888767242e-05, -5.988776683807373e-05, -5.758367478847504e-05, -5.527958273887634e-05, -5.297549068927765e-05, -5.0671398639678955e-05, -4.836730659008026e-05, -4.606321454048157e-05, -4.3759122490882874e-05, -4.145503044128418e-05, -3.9150938391685486e-05, -3.684684634208679e-05, -3.45427542924881e-05, -3.2238662242889404e-05, -2.993457019329071e-05, -2.7630478143692017e-05, -2.5326386094093323e-05, -2.302229404449463e-05, -2.0718201994895935e-05, -1.841410994529724e-05, -1.6110017895698547e-05, -1.3805925846099854e-05, -1.150183379650116e-05, -9.197741746902466e-06, -6.893649697303772e-06, -4.589557647705078e-06, -2.2854655981063843e-06, 1.862645149230957e-08, 2.3227185010910034e-06, 4.626810550689697e-06, 6.930902600288391e-06, 9.234994649887085e-06, 1.1539086699485779e-05, 1.3843178749084473e-05, 1.6147270798683167e-05, 1.845136284828186e-05, 2.0755454897880554e-05, 2.3059546947479248e-05, 2.5363638997077942e-05, 2.7667731046676636e-05, 2.997182309627533e-05, 3.2275915145874023e-05, 3.458000719547272e-05, 3.688409924507141e-05, 3.9188191294670105e-05, 4.14922833442688e-05, 4.379637539386749e-05, 4.6100467443466187e-05, 4.840455949306488e-05, 5.0708651542663574e-05, 5.301274359226227e-05, 5.531683564186096e-05, 5.7620927691459656e-05, 5.992501974105835e-05, 6.222911179065704e-05, 6.453320384025574e-05, 6.683729588985443e-05, 6.914138793945312e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 35.0, 0.0, 0.0, 70.0, 0.0, 0.0, 0.0, 121.0, 0.0, 0.0, 0.0, 192.0, 0.0, 0.0, 0.0, 191.0, 0.0, 0.0, 167.0, 0.0, 0.0, 0.0, 124.0, 0.0, 0.0, 0.0, 52.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.76837158203125e-07, -4.6100467443466187e-07, -4.4517219066619873e-07, -4.293397068977356e-07, -4.1350722312927246e-07, -3.976747393608093e-07, -3.818422555923462e-07, -3.6600977182388306e-07, -3.501772880554199e-07, -3.343448042869568e-07, -3.1851232051849365e-07, -3.026798367500305e-07, -2.868473529815674e-07, -2.7101486921310425e-07, -2.551823854446411e-07, -2.39349901676178e-07, -2.2351741790771484e-07, -2.076849341392517e-07, -1.9185245037078857e-07, -1.7601996660232544e-07, -1.601874828338623e-07, -1.4435499906539917e-07, -1.2852251529693604e-07, -1.126900315284729e-07, -9.685754776000977e-08, -8.102506399154663e-08, -6.51925802230835e-08, -4.936009645462036e-08, -3.3527612686157227e-08, -1.7695128917694092e-08, -1.862645149230957e-09, 1.3969838619232178e-08, 2.9802322387695312e-08, 4.563480615615845e-08, 6.146728992462158e-08, 7.729977369308472e-08, 9.313225746154785e-08, 1.0896474123001099e-07, 1.2479722499847412e-07, 1.4062970876693726e-07, 1.564621925354004e-07, 1.7229467630386353e-07, 1.8812716007232666e-07, 2.039596438407898e-07, 2.1979212760925293e-07, 2.3562461137771606e-07, 2.514570951461792e-07, 2.6728957891464233e-07, 2.8312206268310547e-07, 2.989545464515686e-07, 3.1478703022003174e-07, 3.3061951398849487e-07, 3.46451997756958e-07, 3.6228448152542114e-07, 3.781169652938843e-07, 3.939494490623474e-07, 4.0978193283081055e-07, 4.256144165992737e-07, 4.414469003677368e-07, 4.5727938413619995e-07, 4.731118679046631e-07, 4.889443516731262e-07, 5.047768354415894e-07, 5.206093192100525e-07, 5.364418029785156e-07]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 8.0, 4.0, 3.0, 8.0, 8.0, 17.0, 17.0, 30.0, 34.0, 43.0, 52.0, 75.0, 89.0, 161.0, 180.0, 281.0, 406.0, 605.0, 1003.0, 1741.0, 3171.0, 6368.0, 14989.0, 54146.0, 817377.0, 108355.0, 21741.0, 8157.0, 3882.0, 2117.0, 1213.0, 720.0, 456.0, 328.0, 195.0, 165.0, 100.0, 76.0, 56.0, 48.0, 29.0, 27.0, 13.0, 13.0, 19.0, 10.0, 4.0, 6.0, 6.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.604194641113281e-05, -6.395671516656876e-05, -6.18714839220047e-05, -5.978625267744064e-05, -5.770102143287659e-05, -5.561579018831253e-05, -5.3530558943748474e-05, -5.144532769918442e-05, -4.936009645462036e-05, -4.7274865210056305e-05, -4.518963396549225e-05, -4.310440272092819e-05, -4.1019171476364136e-05, -3.893394023180008e-05, -3.684870898723602e-05, -3.4763477742671967e-05, -3.267824649810791e-05, -3.0593015253543854e-05, -2.8507784008979797e-05, -2.642255276441574e-05, -2.4337321519851685e-05, -2.2252090275287628e-05, -2.0166859030723572e-05, -1.8081627786159515e-05, -1.599639654159546e-05, -1.3911165297031403e-05, -1.1825934052467346e-05, -9.74070280790329e-06, -7.655471563339233e-06, -5.570240318775177e-06, -3.4850090742111206e-06, -1.3997778296470642e-06, 6.854534149169922e-07, 2.7706846594810486e-06, 4.855915904045105e-06, 6.941147148609161e-06, 9.026378393173218e-06, 1.1111609637737274e-05, 1.319684088230133e-05, 1.5282072126865387e-05, 1.7367303371429443e-05, 1.94525346159935e-05, 2.1537765860557556e-05, 2.3622997105121613e-05, 2.570822834968567e-05, 2.7793459594249725e-05, 2.9878690838813782e-05, 3.196392208337784e-05, 3.4049153327941895e-05, 3.613438457250595e-05, 3.821961581707001e-05, 4.0304847061634064e-05, 4.239007830619812e-05, 4.4475309550762177e-05, 4.656054079532623e-05, 4.864577203989029e-05, 5.0731003284454346e-05, 5.28162345290184e-05, 5.490146577358246e-05, 5.6986697018146515e-05, 5.907192826271057e-05, 6.115715950727463e-05, 6.324239075183868e-05, 6.532762199640274e-05, 6.74128532409668e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 5.0, 5.0, 7.0, 9.0, 13.0, 11.0, 23.0, 21.0, 52.0, 97.0, 259.0, 258.0, 94.0, 49.0, 37.0, 17.0, 12.0, 8.0, 5.0, 3.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.586841583251953e-05, -2.5223009288311005e-05, -2.4577602744102478e-05, -2.393219619989395e-05, -2.3286789655685425e-05, -2.2641383111476898e-05, -2.199597656726837e-05, -2.1350570023059845e-05, -2.070516347885132e-05, -2.0059756934642792e-05, -1.9414350390434265e-05, -1.876894384622574e-05, -1.8123537302017212e-05, -1.7478130757808685e-05, -1.683272421360016e-05, -1.6187317669391632e-05, -1.5541911125183105e-05, -1.4896504580974579e-05, -1.4251098036766052e-05, -1.3605691492557526e-05, -1.2960284948348999e-05, -1.2314878404140472e-05, -1.1669471859931946e-05, -1.102406531572342e-05, -1.0378658771514893e-05, -9.733252227306366e-06, -9.08784568309784e-06, -8.442439138889313e-06, -7.797032594680786e-06, -7.1516260504722595e-06, -6.506219506263733e-06, -5.860812962055206e-06, -5.21540641784668e-06, -4.569999873638153e-06, -3.9245933294296265e-06, -3.2791867852211e-06, -2.6337802410125732e-06, -1.9883736968040466e-06, -1.34296715259552e-06, -6.975606083869934e-07, -5.21540641784668e-08, 5.932524800300598e-07, 1.2386590242385864e-06, 1.884065568447113e-06, 2.5294721126556396e-06, 3.1748786568641663e-06, 3.820285201072693e-06, 4.4656917452812195e-06, 5.111098289489746e-06, 5.756504833698273e-06, 6.401911377906799e-06, 7.047317922115326e-06, 7.692724466323853e-06, 8.338131010532379e-06, 8.983537554740906e-06, 9.628944098949432e-06, 1.0274350643157959e-05, 1.0919757187366486e-05, 1.1565163731575012e-05, 1.2210570275783539e-05, 1.2855976819992065e-05, 1.3501383364200592e-05, 1.4146789908409119e-05, 1.4792196452617645e-05, 1.5437602996826172e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 0.0, 3.0, 2.0, 2.0, 4.0, 10.0, 6.0, 12.0, 18.0, 26.0, 26.0, 36.0, 76.0, 120.0, 280.0, 128.0, 78.0, 49.0, 33.0, 21.0, 20.0, 15.0, 11.0, 13.0, 2.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027583593036979437, -0.0026314444839954376, -0.002504529897123575, -0.002377615077421069, -0.002250700257718563, -0.0021237856708467007, -0.0019968708511441946, -0.0018699560314416885, -0.0017430413281545043, -0.00161612662486732, -0.001489211805164814, -0.0013622971018776298, -0.0012353823985904455, -0.0011084675788879395, -0.0009815528756007552, -0.0008546381141059101, -0.0007277233526110649, -0.0006008085911162198, -0.00047389385872520506, -0.00034697912633419037, -0.00022006436483934522, -9.314960334450006e-05, 3.3765099942684174e-05, 0.00016067986143752933, 0.0002875946229323745, 0.00041450938442721963, 0.0005414241459220648, 0.000668338849209249, 0.0007952536107040942, 0.0009221683721989393, 0.0010490830754861236, 0.0011759977787733078, 0.0013029123656451702, 0.0014298270689323545, 0.0015567418886348605, 0.0016836565919220448, 0.0018105714116245508, 0.001937486114911735, 0.0020644008181989193, 0.0021913156379014254, 0.0023182304576039314, 0.0024451452773064375, 0.0025720598641783, 0.002698974683880806, 0.002825889503583312, 0.002952804323285818, 0.0030797189101576805, 0.0032066337298601866, 0.003333548316732049, 0.003460463136434555, 0.0035873777233064175, 0.0037142925430089235, 0.0038412073627114296, 0.003968121949583292, 0.004095036536455154, 0.004221951588988304, 0.0043488661758601665, 0.004475780762732029, 0.004602695815265179, 0.004729610402137041, 0.0048565249890089035, 0.004983440041542053, 0.005110354628413916, 0.005237269215285778, 0.005364184267818928]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 9.0, 9.0, 10.0, 17.0, 32.0, 44.0, 72.0, 65.0, 93.0, 114.0, 109.0, 84.0, 89.0, 67.0, 71.0, 35.0, 44.0, 17.0, 7.0, 8.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0052470252849161625, -0.005113922990858555, -0.0049808211624622345, -0.004847718868404627, -0.004714616574347019, -0.004581514745950699, -0.004448412451893091, -0.0043153101578354836, -0.004182208329439163, -0.0040491060353815556, -0.003916004206985235, -0.0037829019129276276, -0.00364979961887002, -0.003516697557643056, -0.003383595496416092, -0.0032504932023584843, -0.0031173909083008766, -0.0029842888470739126, -0.002851186553016305, -0.002718084491789341, -0.0025849821977317333, -0.0024518801365047693, -0.0023187780752778053, -0.0021856757812201977, -0.0020525737199932337, -0.0019194715423509479, -0.001786369364708662, -0.001653267303481698, -0.0015201651258394122, -0.0013870629481971264, -0.0012539608869701624, -0.0011208587093278766, -0.0009877567645162344, -0.0008546545868739486, -0.0007215524674393237, -0.0005884503480046988, -0.00045534817036241293, -0.0003222459927201271, -0.0001891438732855022, -5.6041753850877285e-05, 7.706042379140854e-05, 0.0002101625723298639, 0.0003432647208683193, 0.00047636686940677464, 0.00060946901794523, 0.0007425711955875158, 0.0008756733150221407, 0.0010087754344567657, 0.0011418776120990515, 0.0012749797897413373, 0.0014080819673836231, 0.0015411840286105871, 0.001674286206252873, 0.0018073883838951588, 0.0019404904451221228, 0.0020735925063490868, 0.0022066948004066944, 0.0023397968616336584, 0.002472899155691266, 0.00260600121691823, 0.0027391035109758377, 0.0028722055722028017, 0.0030053076334297657, 0.0031384099274873734, 0.0032715119887143373]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 5.0, 9.0, 3.0, 6.0, 12.0, 8.0, 10.0, 18.0, 26.0, 33.0, 43.0, 77.0, 188.0, 433.0, 1567.0, 7978.0, 76572.0, 894529.0, 58326.0, 6605.0, 1316.0, 377.0, 152.0, 64.0, 35.0, 32.0, 26.0, 17.0, 13.0, 15.0, 11.0, 11.0, 5.0, 6.0, 6.0, 5.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01183319091796875, -0.01146852970123291, -0.01110386848449707, -0.01073920726776123, -0.01037454605102539, -0.01000988483428955, -0.009645223617553711, -0.009280562400817871, -0.008915901184082031, -0.008551239967346191, -0.008186578750610352, -0.007821917533874512, -0.007457256317138672, -0.007092595100402832, -0.006727933883666992, -0.006363272666931152, -0.0059986114501953125, -0.005633950233459473, -0.005269289016723633, -0.004904627799987793, -0.004539966583251953, -0.004175305366516113, -0.0038106441497802734, -0.0034459829330444336, -0.0030813217163085938, -0.002716660499572754, -0.002351999282836914, -0.0019873380661010742, -0.0016226768493652344, -0.0012580156326293945, -0.0008933544158935547, -0.0005286931991577148, -0.000164031982421875, 0.00020062923431396484, 0.0005652904510498047, 0.0009299516677856445, 0.0012946128845214844, 0.0016592741012573242, 0.002023935317993164, 0.002388596534729004, 0.0027532577514648438, 0.0031179189682006836, 0.0034825801849365234, 0.0038472414016723633, 0.004211902618408203, 0.004576563835144043, 0.004941225051879883, 0.005305886268615723, 0.0056705474853515625, 0.006035208702087402, 0.006399869918823242, 0.006764531135559082, 0.007129192352294922, 0.007493853569030762, 0.007858514785766602, 0.008223176002502441, 0.008587837219238281, 0.008952498435974121, 0.009317159652709961, 0.0096818208694458, 0.01004648208618164, 0.01041114330291748, 0.01077580451965332, 0.01114046573638916, 0.011505126953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 8.0, 14.0, 18.0, 35.0, 69.0, 79.0, 129.0, 231.0, 122.0, 100.0, 86.0, 54.0, 35.0, 16.0, 3.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.002857208251953125, -0.0027997568249702454, -0.0027423053979873657, -0.002684853971004486, -0.0026274025440216064, -0.002569951117038727, -0.002512499690055847, -0.0024550482630729675, -0.002397596836090088, -0.0023401454091072083, -0.0022826939821243286, -0.002225242555141449, -0.0021677911281585693, -0.0021103397011756897, -0.00205288827419281, -0.0019954368472099304, -0.0019379854202270508, -0.0018805339932441711, -0.0018230825662612915, -0.0017656311392784119, -0.0017081797122955322, -0.0016507282853126526, -0.001593276858329773, -0.0015358254313468933, -0.0014783740043640137, -0.001420922577381134, -0.0013634711503982544, -0.0013060197234153748, -0.0012485682964324951, -0.0011911168694496155, -0.0011336654424667358, -0.0010762140154838562, -0.0010187625885009766, -0.0009613111615180969, -0.0009038597345352173, -0.0008464083075523376, -0.000788956880569458, -0.0007315054535865784, -0.0006740540266036987, -0.0006166025996208191, -0.0005591511726379395, -0.0005016997456550598, -0.0004442483186721802, -0.00038679689168930054, -0.0003293454647064209, -0.00027189403772354126, -0.00021444261074066162, -0.00015699118375778198, -9.953975677490234e-05, -4.2088329792022705e-05, 1.5363097190856934e-05, 7.281452417373657e-05, 0.0001302659511566162, 0.00018771737813949585, 0.0002451688051223755, 0.0003026202321052551, 0.00036007165908813477, 0.0004175230860710144, 0.00047497451305389404, 0.0005324259400367737, 0.0005898773670196533, 0.000647328794002533, 0.0007047802209854126, 0.0007622316479682922, 0.0008196830749511719]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 1.0, 13.0, 14.0, 26.0, 32.0, 53.0, 92.0, 159.0, 222.0, 413.0, 775.0, 1597.0, 3716.0, 9979.0, 29171.0, 100351.0, 644194.0, 185579.0, 46890.0, 15338.0, 5494.0, 2190.0, 968.0, 520.0, 294.0, 172.0, 110.0, 79.0, 50.0, 30.0, 12.0, 10.0, 3.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002712249755859375, -0.002614349126815796, -0.002516448497772217, -0.0024185478687286377, -0.0023206472396850586, -0.0022227466106414795, -0.0021248459815979004, -0.0020269453525543213, -0.0019290447235107422, -0.001831144094467163, -0.001733243465423584, -0.0016353428363800049, -0.0015374422073364258, -0.0014395415782928467, -0.0013416409492492676, -0.0012437403202056885, -0.0011458396911621094, -0.0010479390621185303, -0.0009500384330749512, -0.0008521378040313721, -0.000754237174987793, -0.0006563365459442139, -0.0005584359169006348, -0.00046053528785705566, -0.00036263465881347656, -0.00026473402976989746, -0.00016683340072631836, -6.893277168273926e-05, 2.8967857360839844e-05, 0.00012686848640441895, 0.00022476911544799805, 0.00032266974449157715, 0.00042057037353515625, 0.0005184710025787354, 0.0006163716316223145, 0.0007142722606658936, 0.0008121728897094727, 0.0009100735187530518, 0.0010079741477966309, 0.00110587477684021, 0.001203775405883789, 0.0013016760349273682, 0.0013995766639709473, 0.0014974772930145264, 0.0015953779220581055, 0.0016932785511016846, 0.0017911791801452637, 0.0018890798091888428, 0.001986980438232422, 0.002084881067276001, 0.00218278169631958, 0.002280682325363159, 0.0023785829544067383, 0.0024764835834503174, 0.0025743842124938965, 0.0026722848415374756, 0.0027701854705810547, 0.002868086099624634, 0.002965986728668213, 0.003063887357711792, 0.003161787986755371, 0.00325968861579895, 0.0033575892448425293, 0.0034554898738861084, 0.0035533905029296875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 9.0, 14.0, 15.0, 16.0, 26.0, 31.0, 30.0, 36.0, 50.0, 60.0, 53.0, 79.0, 142.0, 81.0, 55.0, 48.0, 49.0, 39.0, 40.0, 29.0, 21.0, 12.0, 21.0, 11.0, 8.0, 7.0, 5.0, 3.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0015687942504882812, -0.001525789499282837, -0.0014827847480773926, -0.0014397799968719482, -0.001396775245666504, -0.0013537704944610596, -0.0013107657432556152, -0.001267760992050171, -0.0012247562408447266, -0.0011817514896392822, -0.0011387467384338379, -0.0010957419872283936, -0.0010527372360229492, -0.0010097324848175049, -0.0009667277336120605, -0.0009237229824066162, -0.0008807182312011719, -0.0008377134799957275, -0.0007947087287902832, -0.0007517039775848389, -0.0007086992263793945, -0.0006656944751739502, -0.0006226897239685059, -0.0005796849727630615, -0.0005366802215576172, -0.0004936754703521729, -0.0004506707191467285, -0.0004076659679412842, -0.00036466121673583984, -0.0003216564655303955, -0.00027865171432495117, -0.00023564696311950684, -0.0001926422119140625, -0.00014963746070861816, -0.00010663270950317383, -6.362795829772949e-05, -2.0623207092285156e-05, 2.238154411315918e-05, 6.538629531860352e-05, 0.00010839104652404785, 0.0001513957977294922, 0.00019440054893493652, 0.00023740530014038086, 0.0002804100513458252, 0.00032341480255126953, 0.00036641955375671387, 0.0004094243049621582, 0.00045242905616760254, 0.0004954338073730469, 0.0005384385585784912, 0.0005814433097839355, 0.0006244480609893799, 0.0006674528121948242, 0.0007104575634002686, 0.0007534623146057129, 0.0007964670658111572, 0.0008394718170166016, 0.0008824765682220459, 0.0009254813194274902, 0.0009684860706329346, 0.001011490821838379, 0.0010544955730438232, 0.0010975003242492676, 0.001140505075454712, 0.0011835098266601562]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 4.0, 5.0, 10.0, 12.0, 20.0, 14.0, 28.0, 31.0, 63.0, 93.0, 193.0, 310.0, 527.0, 1032.0, 2330.0, 6506.0, 24222.0, 240386.0, 719787.0, 38448.0, 8831.0, 2953.0, 1324.0, 601.0, 301.0, 188.0, 107.0, 79.0, 43.0, 30.0, 17.0, 23.0, 10.0, 4.0, 5.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-5.131959915161133e-05, -4.977080971002579e-05, -4.8222020268440247e-05, -4.6673230826854706e-05, -4.5124441385269165e-05, -4.3575651943683624e-05, -4.2026862502098083e-05, -4.047807306051254e-05, -3.8929283618927e-05, -3.738049417734146e-05, -3.583170473575592e-05, -3.428291529417038e-05, -3.273412585258484e-05, -3.11853364109993e-05, -2.9636546969413757e-05, -2.8087757527828217e-05, -2.6538968086242676e-05, -2.4990178644657135e-05, -2.3441389203071594e-05, -2.1892599761486053e-05, -2.0343810319900513e-05, -1.8795020878314972e-05, -1.724623143672943e-05, -1.569744199514389e-05, -1.414865255355835e-05, -1.2599863111972809e-05, -1.1051073670387268e-05, -9.502284228801727e-06, -7.953494787216187e-06, -6.404705345630646e-06, -4.855915904045105e-06, -3.307126462459564e-06, -1.7583370208740234e-06, -2.0954757928848267e-07, 1.339241862297058e-06, 2.888031303882599e-06, 4.43682074546814e-06, 5.98561018705368e-06, 7.534399628639221e-06, 9.083189070224762e-06, 1.0631978511810303e-05, 1.2180767953395844e-05, 1.3729557394981384e-05, 1.5278346836566925e-05, 1.6827136278152466e-05, 1.8375925719738007e-05, 1.9924715161323547e-05, 2.1473504602909088e-05, 2.302229404449463e-05, 2.457108348608017e-05, 2.611987292766571e-05, 2.766866236925125e-05, 2.9217451810836792e-05, 3.076624125242233e-05, 3.2315030694007874e-05, 3.3863820135593414e-05, 3.5412609577178955e-05, 3.6961399018764496e-05, 3.851018846035004e-05, 4.005897790193558e-05, 4.160776734352112e-05, 4.315655678510666e-05, 4.47053462266922e-05, 4.625413566827774e-05, 4.780292510986328e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 239.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 371.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 255.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.300366759300232e-07, -2.2165477275848389e-07, -2.1327286958694458e-07, -2.0489096641540527e-07, -1.9650906324386597e-07, -1.8812716007232666e-07, -1.7974525690078735e-07, -1.7136335372924805e-07, -1.6298145055770874e-07, -1.5459954738616943e-07, -1.4621764421463013e-07, -1.3783574104309082e-07, -1.2945383787155151e-07, -1.210719347000122e-07, -1.126900315284729e-07, -1.043081283569336e-07, -9.592622518539429e-08, -8.754432201385498e-08, -7.916241884231567e-08, -7.078051567077637e-08, -6.239861249923706e-08, -5.4016709327697754e-08, -4.563480615615845e-08, -3.725290298461914e-08, -2.8870999813079834e-08, -2.0489096641540527e-08, -1.210719347000122e-08, -3.725290298461914e-09, 4.6566128730773926e-09, 1.30385160446167e-08, 2.1420419216156006e-08, 2.9802322387695312e-08, 3.818422555923462e-08, 4.6566128730773926e-08, 5.494803190231323e-08, 6.332993507385254e-08, 7.171183824539185e-08, 8.009374141693115e-08, 8.847564458847046e-08, 9.685754776000977e-08, 1.0523945093154907e-07, 1.1362135410308838e-07, 1.2200325727462769e-07, 1.30385160446167e-07, 1.387670636177063e-07, 1.471489667892456e-07, 1.555308699607849e-07, 1.6391277313232422e-07, 1.7229467630386353e-07, 1.8067657947540283e-07, 1.8905848264694214e-07, 1.9744038581848145e-07, 2.0582228899002075e-07, 2.1420419216156006e-07, 2.2258609533309937e-07, 2.3096799850463867e-07, 2.39349901676178e-07, 2.477318048477173e-07, 2.561137080192566e-07, 2.644956111907959e-07, 2.728775143623352e-07, 2.812594175338745e-07, 2.896413207054138e-07, 2.980232238769531e-07]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 12.0, 10.0, 16.0, 31.0, 36.0, 74.0, 166.0, 386.0, 704.0, 1657.0, 4093.0, 12592.0, 38011.0, 177642.0, 668703.0, 107779.0, 23324.0, 7807.0, 3051.0, 1344.0, 518.0, 257.0, 119.0, 87.0, 43.0, 28.0, 16.0, 9.0, 9.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.1576881408691406e-05, -2.0965933799743652e-05, -2.03549861907959e-05, -1.9744038581848145e-05, -1.913309097290039e-05, -1.8522143363952637e-05, -1.7911195755004883e-05, -1.730024814605713e-05, -1.6689300537109375e-05, -1.607835292816162e-05, -1.5467405319213867e-05, -1.4856457710266113e-05, -1.424551010131836e-05, -1.3634562492370605e-05, -1.3023614883422852e-05, -1.2412667274475098e-05, -1.1801719665527344e-05, -1.119077205657959e-05, -1.0579824447631836e-05, -9.968876838684082e-06, -9.357929229736328e-06, -8.746981620788574e-06, -8.13603401184082e-06, -7.525086402893066e-06, -6.9141387939453125e-06, -6.303191184997559e-06, -5.692243576049805e-06, -5.081295967102051e-06, -4.470348358154297e-06, -3.859400749206543e-06, -3.248453140258789e-06, -2.637505531311035e-06, -2.0265579223632812e-06, -1.4156103134155273e-06, -8.046627044677734e-07, -1.9371509552001953e-07, 4.172325134277344e-07, 1.0281801223754883e-06, 1.6391277313232422e-06, 2.250075340270996e-06, 2.86102294921875e-06, 3.471970558166504e-06, 4.082918167114258e-06, 4.693865776062012e-06, 5.304813385009766e-06, 5.9157609939575195e-06, 6.5267086029052734e-06, 7.137656211853027e-06, 7.748603820800781e-06, 8.359551429748535e-06, 8.970499038696289e-06, 9.581446647644043e-06, 1.0192394256591797e-05, 1.080334186553955e-05, 1.1414289474487305e-05, 1.2025237083435059e-05, 1.2636184692382812e-05, 1.3247132301330566e-05, 1.385807991027832e-05, 1.4469027519226074e-05, 1.5079975128173828e-05, 1.5690922737121582e-05, 1.6301870346069336e-05, 1.691281795501709e-05, 1.7523765563964844e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 5.0, 7.0, 6.0, 11.0, 10.0, 12.0, 21.0, 19.0, 27.0, 19.0, 36.0, 28.0, 46.0, 57.0, 90.0, 96.0, 94.0, 60.0, 72.0, 69.0, 43.0, 27.0, 44.0, 13.0, 18.0, 11.0, 10.0, 9.0, 8.0, 7.0, 8.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.616115570068359e-06, -6.3925981521606445e-06, -6.16908073425293e-06, -5.945563316345215e-06, -5.7220458984375e-06, -5.498528480529785e-06, -5.27501106262207e-06, -5.0514936447143555e-06, -4.827976226806641e-06, -4.604458808898926e-06, -4.380941390991211e-06, -4.157423973083496e-06, -3.933906555175781e-06, -3.7103891372680664e-06, -3.4868717193603516e-06, -3.2633543014526367e-06, -3.039836883544922e-06, -2.816319465637207e-06, -2.592802047729492e-06, -2.3692846298217773e-06, -2.1457672119140625e-06, -1.9222497940063477e-06, -1.6987323760986328e-06, -1.475214958190918e-06, -1.2516975402832031e-06, -1.0281801223754883e-06, -8.046627044677734e-07, -5.811452865600586e-07, -3.5762786865234375e-07, -1.341104507446289e-07, 8.940696716308594e-08, 3.129243850708008e-07, 5.364418029785156e-07, 7.599592208862305e-07, 9.834766387939453e-07, 1.2069940567016602e-06, 1.430511474609375e-06, 1.6540288925170898e-06, 1.8775463104248047e-06, 2.1010637283325195e-06, 2.3245811462402344e-06, 2.5480985641479492e-06, 2.771615982055664e-06, 2.995133399963379e-06, 3.2186508178710938e-06, 3.4421682357788086e-06, 3.6656856536865234e-06, 3.889203071594238e-06, 4.112720489501953e-06, 4.336237907409668e-06, 4.559755325317383e-06, 4.783272743225098e-06, 5.0067901611328125e-06, 5.230307579040527e-06, 5.453824996948242e-06, 5.677342414855957e-06, 5.900859832763672e-06, 6.124377250671387e-06, 6.3478946685791016e-06, 6.571412086486816e-06, 6.794929504394531e-06, 7.018446922302246e-06, 7.241964340209961e-06, 7.465481758117676e-06, 7.68899917602539e-06]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 14.0, 11.0, 22.0, 40.0, 45.0, 56.0, 111.0, 208.0, 193.0, 86.0, 51.0, 40.0, 34.0, 30.0, 13.0, 12.0, 5.0, 4.0, 7.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004900715313851833, -0.004774927161633968, -0.004649139009416103, -0.004523351322859526, -0.004397563170641661, -0.004271775018423796, -0.004145986866205931, -0.004020198713988066, -0.0038944107946008444, -0.0037686226423829794, -0.003642834722995758, -0.003517046570777893, -0.003391258418560028, -0.0032654704991728067, -0.0031396823469549417, -0.0030138944275677204, -0.0028881062753498554, -0.0027623181231319904, -0.002636530203744769, -0.002510742051526904, -0.0023849541321396828, -0.0022591659799218178, -0.002133377827703953, -0.002007589675486088, -0.0018818017560988665, -0.0017560137202963233, -0.0016302256844937801, -0.0015044375322759151, -0.001378649496473372, -0.0012528614606708288, -0.0011270733084529638, -0.0010012852726504207, -0.0008754967711865902, -0.000749708735384047, -0.000623920641373843, -0.0004981325473636389, -0.0003723445115610957, -0.00024655647575855255, -0.00012076838174834847, 5.019712261855602e-06, 0.00013080774806439877, 0.0002565958129707724, 0.000382383877877146, 0.0005081719718873501, 0.0006339600076898932, 0.0007597480434924364, 0.0008855361375026405, 0.0010113242315128446, 0.0011371122673153877, 0.0012629003031179309, 0.001388688338920474, 0.001514476491138339, 0.0016402645269408822, 0.0017660525627434254, 0.0018918407149612904, 0.0020176288671791553, 0.0021434167865663767, 0.0022692049387842417, 0.002394992858171463, 0.002520781010389328, 0.002646569162607193, 0.0027723570819944143, 0.0028981452342122793, 0.0030239331535995007, 0.0031497213058173656]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 7.0, 2.0, 7.0, 8.0, 7.0, 10.0, 14.0, 10.0, 21.0, 23.0, 32.0, 26.0, 37.0, 32.0, 31.0, 33.0, 49.0, 42.0, 39.0, 35.0, 40.0, 42.0, 44.0, 47.0, 34.0, 46.0, 34.0, 37.0, 25.0, 29.0, 31.0, 28.0, 23.0, 10.0, 10.0, 13.0, 7.0, 7.0, 10.0, 6.0, 10.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018034909153357148, -0.0017470433376729488, -0.0016905957600101829, -0.0016341481823474169, -0.001577700604684651, -0.001521253027021885, -0.0014648053329437971, -0.001408357871696353, -0.0013519101776182652, -0.0012954625999554992, -0.0012390150222927332, -0.0011825674446299672, -0.0011261198669672012, -0.0010696722893044353, -0.0010132247116416693, -0.0009567770757712424, -0.0009003295563161373, -0.0008438819786533713, -0.0007874344009906054, -0.0007309868233278394, -0.0006745392456650734, -0.0006180916680023074, -0.0005616440321318805, -0.0005051964544691145, -0.00044874887680634856, -0.0003923012991435826, -0.0003358537214808166, -0.00027940611471422017, -0.00022295853705145419, -0.0001665109593886882, -0.00011006335262209177, -5.361577495932579e-05, 2.8318027034401894e-06, 5.927938764216378e-05, 0.00011572697258088738, 0.00017217456479556859, 0.00022862214245833457, 0.00028506972012110054, 0.000341517326887697, 0.00039796490455046296, 0.00045441248221322894, 0.0005108600598759949, 0.0005673076375387609, 0.0006237552734091878, 0.0006802028510719538, 0.0007366504287347198, 0.0007930980063974857, 0.0008495455840602517, 0.0009059931617230177, 0.0009624407393857837, 0.0010188883170485497, 0.0010753358947113156, 0.0011317834723740816, 0.0011882310500368476, 0.0012446786276996136, 0.0013011263217777014, 0.0013575737830251455, 0.0014140213606879115, 0.0014704689383506775, 0.0015269165160134435, 0.0015833640936762094, 0.0016398116713389754, 0.0016962592490017414, 0.0017527069430798292, 0.0018091545207425952]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 2.0, 2.0, 9.0, 10.0, 10.0, 14.0, 22.0, 18.0, 40.0, 30.0, 56.0, 63.0, 85.0, 115.0, 130.0, 156.0, 195.0, 272.0, 459.0, 950.0, 20279.0, 4105070.0, 63178.0, 1338.0, 496.0, 278.0, 202.0, 174.0, 120.0, 126.0, 91.0, 80.0, 47.0, 34.0, 34.0, 29.0, 16.0, 16.0, 10.0, 10.0, 8.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004001617431640625, -0.0038617849349975586, -0.003721952438354492, -0.0035821199417114258, -0.0034422874450683594, -0.003302454948425293, -0.0031626224517822266, -0.00302278995513916, -0.0028829574584960938, -0.0027431249618530273, -0.002603292465209961, -0.0024634599685668945, -0.002323627471923828, -0.0021837949752807617, -0.0020439624786376953, -0.001904129981994629, -0.0017642974853515625, -0.001624464988708496, -0.0014846324920654297, -0.0013447999954223633, -0.0012049674987792969, -0.0010651350021362305, -0.0009253025054931641, -0.0007854700088500977, -0.0006456375122070312, -0.0005058050155639648, -0.00036597251892089844, -0.00022614002227783203, -8.630752563476562e-05, 5.352497100830078e-05, 0.0001933574676513672, 0.0003331899642944336, 0.0004730224609375, 0.0006128549575805664, 0.0007526874542236328, 0.0008925199508666992, 0.0010323524475097656, 0.001172184944152832, 0.0013120174407958984, 0.0014518499374389648, 0.0015916824340820312, 0.0017315149307250977, 0.001871347427368164, 0.0020111799240112305, 0.002151012420654297, 0.0022908449172973633, 0.0024306774139404297, 0.002570509910583496, 0.0027103424072265625, 0.002850174903869629, 0.0029900074005126953, 0.0031298398971557617, 0.003269672393798828, 0.0034095048904418945, 0.003549337387084961, 0.0036891698837280273, 0.0038290023803710938, 0.00396883487701416, 0.0041086673736572266, 0.004248499870300293, 0.004388332366943359, 0.004528164863586426, 0.004667997360229492, 0.004807829856872559, 0.004947662353515625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 8.0, 4.0, 14.0, 15.0, 19.0, 20.0, 28.0, 33.0, 31.0, 28.0, 31.0, 47.0, 43.0, 44.0, 50.0, 107.0, 70.0, 43.0, 40.0, 43.0, 36.0, 28.0, 29.0, 28.0, 26.0, 30.0, 22.0, 15.0, 9.0, 8.0, 5.0, 9.0, 9.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012378692626953125, -0.0011946409940719604, -0.0011514127254486084, -0.0011081844568252563, -0.0010649561882019043, -0.0010217279195785522, -0.0009784996509552002, -0.0009352713823318481, -0.0008920431137084961, -0.000848814845085144, -0.000805586576461792, -0.0007623583078384399, -0.0007191300392150879, -0.0006759017705917358, -0.0006326735019683838, -0.0005894452333450317, -0.0005462169647216797, -0.0005029886960983276, -0.0004597604274749756, -0.00041653215885162354, -0.0003733038902282715, -0.00033007562160491943, -0.0002868473529815674, -0.00024361908435821533, -0.00020039081573486328, -0.00015716254711151123, -0.00011393427848815918, -7.070600986480713e-05, -2.7477741241455078e-05, 1.5750527381896973e-05, 5.8978796005249023e-05, 0.00010220706462860107, 0.00014543533325195312, 0.00018866360187530518, 0.00023189187049865723, 0.0002751201391220093, 0.00031834840774536133, 0.0003615766763687134, 0.00040480494499206543, 0.0004480332136154175, 0.0004912614822387695, 0.0005344897508621216, 0.0005777180194854736, 0.0006209462881088257, 0.0006641745567321777, 0.0007074028253555298, 0.0007506310939788818, 0.0007938593626022339, 0.0008370876312255859, 0.000880315899848938, 0.00092354416847229, 0.0009667724370956421, 0.0010100007057189941, 0.0010532289743423462, 0.0010964572429656982, 0.0011396855115890503, 0.0011829137802124023, 0.0012261420488357544, 0.0012693703174591064, 0.0013125985860824585, 0.0013558268547058105, 0.0013990551233291626, 0.0014422833919525146, 0.0014855116605758667, 0.0015287399291992188]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 14.0, 12.0, 32.0, 54.0, 95.0, 219.0, 486.0, 1441.0, 11106.0, 4173321.0, 5979.0, 914.0, 349.0, 143.0, 59.0, 34.0, 12.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0148468017578125, -0.014552295207977295, -0.01425778865814209, -0.013963282108306885, -0.01366877555847168, -0.013374269008636475, -0.01307976245880127, -0.012785255908966064, -0.01249074935913086, -0.012196242809295654, -0.01190173625946045, -0.011607229709625244, -0.011312723159790039, -0.011018216609954834, -0.010723710060119629, -0.010429203510284424, -0.010134696960449219, -0.009840190410614014, -0.009545683860778809, -0.009251177310943604, -0.008956670761108398, -0.008662164211273193, -0.008367657661437988, -0.008073151111602783, -0.007778644561767578, -0.007484138011932373, -0.007189631462097168, -0.006895124912261963, -0.006600618362426758, -0.006306111812591553, -0.006011605262756348, -0.005717098712921143, -0.0054225921630859375, -0.005128085613250732, -0.004833579063415527, -0.004539072513580322, -0.004244565963745117, -0.003950059413909912, -0.003655552864074707, -0.003361046314239502, -0.003066539764404297, -0.002772033214569092, -0.0024775266647338867, -0.0021830201148986816, -0.0018885135650634766, -0.0015940070152282715, -0.0012995004653930664, -0.0010049939155578613, -0.0007104873657226562, -0.00041598081588745117, -0.0001214742660522461, 0.00017303228378295898, 0.00046753883361816406, 0.0007620453834533691, 0.0010565519332885742, 0.0013510584831237793, 0.0016455650329589844, 0.0019400715827941895, 0.0022345781326293945, 0.0025290846824645996, 0.0028235912322998047, 0.0031180977821350098, 0.003412604331970215, 0.00370711088180542, 0.004001617431640625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 16.0, 28.0, 141.0, 3319.0, 417.0, 87.0, 28.0, 9.0, 4.0, 4.0, 4.0, 0.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005512237548828125, -0.0005109012126922607, -0.000470578670501709, -0.0004302561283111572, -0.00038993358612060547, -0.0003496110439300537, -0.00030928850173950195, -0.0002689659595489502, -0.00022864341735839844, -0.00018832087516784668, -0.00014799833297729492, -0.00010767579078674316, -6.73532485961914e-05, -2.703070640563965e-05, 1.329183578491211e-05, 5.361437797546387e-05, 9.393692016601562e-05, 0.00013425946235656738, 0.00017458200454711914, 0.0002149045467376709, 0.00025522708892822266, 0.0002955496311187744, 0.00033587217330932617, 0.00037619471549987793, 0.0004165172576904297, 0.00045683979988098145, 0.0004971623420715332, 0.000537484884262085, 0.0005778074264526367, 0.0006181299686431885, 0.0006584525108337402, 0.000698775053024292, 0.0007390975952148438, 0.0007794201374053955, 0.0008197426795959473, 0.000860065221786499, 0.0009003877639770508, 0.0009407103061676025, 0.0009810328483581543, 0.001021355390548706, 0.0010616779327392578, 0.0011020004749298096, 0.0011423230171203613, 0.001182645559310913, 0.0012229681015014648, 0.0012632906436920166, 0.0013036131858825684, 0.0013439357280731201, 0.0013842582702636719, 0.0014245808124542236, 0.0014649033546447754, 0.0015052258968353271, 0.001545548439025879, 0.0015858709812164307, 0.0016261935234069824, 0.0016665160655975342, 0.001706838607788086, 0.0017471611499786377, 0.0017874836921691895, 0.0018278062343597412, 0.001868128776550293, 0.0019084513187408447, 0.0019487738609313965, 0.0019890964031219482, 0.0020294189453125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 5.0, 6.0, 10.0, 19.0, 41.0, 57.0, 87.0, 167.0, 315.0, 107.0, 58.0, 38.0, 30.0, 18.0, 7.0, 15.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005676188971847296, -0.005548175889998674, -0.005420162808150053, -0.005292149726301432, -0.005164136178791523, -0.005036123096942902, -0.00490811001509428, -0.004780096933245659, -0.0046520838513970375, -0.004524070769548416, -0.004396057687699795, -0.004268044605851173, -0.004140031524002552, -0.004012017976492643, -0.003884004894644022, -0.0037559918127954006, -0.0036279787309467793, -0.003499965649098158, -0.0033719525672495365, -0.0032439392525702715, -0.00311592617072165, -0.0029879130888730288, -0.0028598997741937637, -0.0027318866923451424, -0.002603873610496521, -0.0024758605286478996, -0.0023478474467992783, -0.0022198341321200132, -0.002091821050271392, -0.0019638079684227705, -0.0018357947701588273, -0.0017077815718948841, -0.0015797687228769064, -0.001451755641028285, -0.0013237424427643418, -0.0011957292445003986, -0.0010677161626517773, -0.000939703022595495, -0.0008116898825392127, -0.0006836767424829304, -0.0005556636024266481, -0.00042765046237036586, -0.0002996373223140836, -0.0001716241822578013, -4.361104220151901e-05, 8.440209785476327e-05, 0.00021241523791104555, 0.00034042837796732783, 0.0004684415180236101, 0.0005964546580798924, 0.0007244677981361747, 0.000852480938192457, 0.0009804940782487392, 0.0011085071600973606, 0.0012365203583613038, 0.001364533556625247, 0.0014925466384738684, 0.0016205597203224897, 0.001748572918586433, 0.0018765861168503761, 0.0020045991986989975, 0.002132612280547619, 0.0022606253623962402, 0.0023886386770755053, 0.0025166517589241266]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 5.0, 7.0, 7.0, 9.0, 11.0, 14.0, 22.0, 16.0, 35.0, 29.0, 37.0, 47.0, 45.0, 54.0, 60.0, 64.0, 56.0, 48.0, 49.0, 55.0, 56.0, 50.0, 51.0, 32.0, 42.0, 25.0, 17.0, 11.0, 12.0, 12.0, 9.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0018952483078464866, -0.0018359655514359474, -0.0017766827950254083, -0.0017174000386148691, -0.00165811728220433, -0.0015988345257937908, -0.0015395516529679298, -0.0014802690129727125, -0.0014209861401468515, -0.0013617033837363124, -0.0013024206273257732, -0.001243137870915234, -0.001183855114504695, -0.0011245723580941558, -0.0010652896016836166, -0.0010060067288577557, -0.0009467240888625383, -0.0008874413324519992, -0.00082815857604146, -0.0007688758196309209, -0.0007095930632203817, -0.0006503103068098426, -0.0005910274921916425, -0.0005317447357811034, -0.0004724619793705642, -0.00041317922296002507, -0.0003538964665494859, -0.0002946136810351163, -0.00023533092462457716, -0.00017604816821403801, -0.00011676538269966841, -5.748262628912926e-05, 1.80024653673172e-06, 6.108301022322848e-05, 0.00012036577390972525, 0.00017964854487217963, 0.00023893130128271878, 0.00029821405769325793, 0.00035749684320762753, 0.0004167795996181667, 0.00047606235602870584, 0.000535345112439245, 0.0005946278688497841, 0.0006539106834679842, 0.0007131934398785233, 0.0007724761962890625, 0.0008317589526996017, 0.0008910417091101408, 0.00095032446552068, 0.001009607221931219, 0.0010688899783417583, 0.0011281727347522974, 0.0011874554911628366, 0.0012467382475733757, 0.0013060211203992367, 0.001365303760394454, 0.001424586633220315, 0.0014838693896308541, 0.0015431521460413933, 0.0016024349024519324, 0.0016617176588624716, 0.0017210004152730107, 0.0017802831716835499, 0.0018395660445094109, 0.0018988486845046282]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 7.0, 14.0, 32.0, 44.0, 79.0, 111.0, 147.0, 266.0, 436.0, 850.0, 1731.0, 4069.0, 11445.0, 39696.0, 216595.0, 668643.0, 74865.0, 18403.0, 6118.0, 2411.0, 1108.0, 592.0, 326.0, 209.0, 114.0, 73.0, 54.0, 41.0, 19.0, 10.0, 11.0, 9.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.000385284423828125, -0.0003729388117790222, -0.00036059319972991943, -0.00034824758768081665, -0.00033590197563171387, -0.0003235563635826111, -0.0003112107515335083, -0.0002988651394844055, -0.00028651952743530273, -0.00027417391538619995, -0.00026182830333709717, -0.0002494826912879944, -0.0002371370792388916, -0.00022479146718978882, -0.00021244585514068604, -0.00020010024309158325, -0.00018775463104248047, -0.00017540901899337769, -0.0001630634069442749, -0.00015071779489517212, -0.00013837218284606934, -0.00012602657079696655, -0.00011368095874786377, -0.00010133534669876099, -8.89897346496582e-05, -7.664412260055542e-05, -6.429851055145264e-05, -5.1952898502349854e-05, -3.960728645324707e-05, -2.7261674404144287e-05, -1.4916062355041504e-05, -2.5704503059387207e-06, 9.775161743164062e-06, 2.2120773792266846e-05, 3.446638584136963e-05, 4.681199789047241e-05, 5.9157609939575195e-05, 7.150322198867798e-05, 8.384883403778076e-05, 9.619444608688354e-05, 0.00010854005813598633, 0.00012088567018508911, 0.0001332312822341919, 0.00014557689428329468, 0.00015792250633239746, 0.00017026811838150024, 0.00018261373043060303, 0.0001949593424797058, 0.0002073049545288086, 0.00021965056657791138, 0.00023199617862701416, 0.00024434179067611694, 0.0002566874027252197, 0.0002690330147743225, 0.0002813786268234253, 0.0002937242388725281, 0.00030606985092163086, 0.00031841546297073364, 0.0003307610750198364, 0.0003431066870689392, 0.000355452299118042, 0.0003677979111671448, 0.00038014352321624756, 0.00039248913526535034, 0.0004048347473144531]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 9.0, 1.0, 13.0, 16.0, 18.0, 27.0, 23.0, 35.0, 41.0, 44.0, 58.0, 65.0, 105.0, 133.0, 64.0, 53.0, 58.0, 56.0, 44.0, 35.0, 33.0, 22.0, 12.0, 8.0, 3.0, 9.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00162506103515625, -0.0015730112791061401, -0.0015209615230560303, -0.0014689117670059204, -0.0014168620109558105, -0.0013648122549057007, -0.0013127624988555908, -0.001260712742805481, -0.001208662986755371, -0.0011566132307052612, -0.0011045634746551514, -0.0010525137186050415, -0.0010004639625549316, -0.0009484142065048218, -0.0008963644504547119, -0.000844314694404602, -0.0007922649383544922, -0.0007402151823043823, -0.0006881654262542725, -0.0006361156702041626, -0.0005840659141540527, -0.0005320161581039429, -0.000479966402053833, -0.00042791664600372314, -0.0003758668899536133, -0.0003238171339035034, -0.00027176737785339355, -0.0002197176218032837, -0.00016766786575317383, -0.00011561810970306396, -6.35683536529541e-05, -1.1518597602844238e-05, 4.0531158447265625e-05, 9.258091449737549e-05, 0.00014463067054748535, 0.00019668042659759521, 0.0002487301826477051, 0.00030077993869781494, 0.0003528296947479248, 0.00040487945079803467, 0.00045692920684814453, 0.0005089789628982544, 0.0005610287189483643, 0.0006130784749984741, 0.000665128231048584, 0.0007171779870986938, 0.0007692277431488037, 0.0008212774991989136, 0.0008733272552490234, 0.0009253770112991333, 0.0009774267673492432, 0.001029476523399353, 0.0010815262794494629, 0.0011335760354995728, 0.0011856257915496826, 0.0012376755475997925, 0.0012897253036499023, 0.0013417750597000122, 0.001393824815750122, 0.001445874571800232, 0.0014979243278503418, 0.0015499740839004517, 0.0016020238399505615, 0.0016540735960006714, 0.0017061233520507812]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 10.0, 9.0, 10.0, 21.0, 22.0, 23.0, 23.0, 40.0, 84.0, 121.0, 197.0, 429.0, 860.0, 2036.0, 4949.0, 13049.0, 35547.0, 107804.0, 537879.0, 242345.0, 65083.0, 22768.0, 8701.0, 3529.0, 1460.0, 719.0, 343.0, 188.0, 101.0, 82.0, 38.0, 22.0, 22.0, 17.0, 5.0, 5.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00028133392333984375, -0.0002734716981649399, -0.000265609472990036, -0.00025774724781513214, -0.00024988502264022827, -0.0002420227974653244, -0.00023416057229042053, -0.00022629834711551666, -0.0002184361219406128, -0.00021057389676570892, -0.00020271167159080505, -0.00019484944641590118, -0.00018698722124099731, -0.00017912499606609344, -0.00017126277089118958, -0.0001634005457162857, -0.00015553832054138184, -0.00014767609536647797, -0.0001398138701915741, -0.00013195164501667023, -0.00012408941984176636, -0.00011622719466686249, -0.00010836496949195862, -0.00010050274431705475, -9.264051914215088e-05, -8.477829396724701e-05, -7.691606879234314e-05, -6.905384361743927e-05, -6.11916184425354e-05, -5.332939326763153e-05, -4.546716809272766e-05, -3.760494291782379e-05, -2.9742717742919922e-05, -2.1880492568016052e-05, -1.4018267393112183e-05, -6.156042218208313e-06, 1.7061829566955566e-06, 9.568408131599426e-06, 1.7430633306503296e-05, 2.5292858481407166e-05, 3.3155083656311035e-05, 4.1017308831214905e-05, 4.8879534006118774e-05, 5.6741759181022644e-05, 6.460398435592651e-05, 7.246620953083038e-05, 8.032843470573425e-05, 8.819065988063812e-05, 9.605288505554199e-05, 0.00010391511023044586, 0.00011177733540534973, 0.0001196395605802536, 0.00012750178575515747, 0.00013536401093006134, 0.0001432262361049652, 0.00015108846127986908, 0.00015895068645477295, 0.00016681291162967682, 0.0001746751368045807, 0.00018253736197948456, 0.00019039958715438843, 0.0001982618123292923, 0.00020612403750419617, 0.00021398626267910004, 0.0002218484878540039]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 6.0, 16.0, 12.0, 20.0, 26.0, 27.0, 38.0, 49.0, 55.0, 60.0, 82.0, 75.0, 85.0, 74.0, 69.0, 56.0, 57.0, 40.0, 36.0, 25.0, 26.0, 14.0, 23.0, 12.0, 6.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.004718780517578125, -0.004607260227203369, -0.004495739936828613, -0.004384219646453857, -0.0042726993560791016, -0.004161179065704346, -0.00404965877532959, -0.003938138484954834, -0.003826618194580078, -0.0037150979042053223, -0.0036035776138305664, -0.0034920573234558105, -0.0033805370330810547, -0.003269016742706299, -0.003157496452331543, -0.003045976161956787, -0.0029344558715820312, -0.0028229355812072754, -0.0027114152908325195, -0.0025998950004577637, -0.002488374710083008, -0.002376854419708252, -0.002265334129333496, -0.0021538138389587402, -0.0020422935485839844, -0.0019307732582092285, -0.0018192529678344727, -0.0017077326774597168, -0.001596212387084961, -0.001484692096710205, -0.0013731718063354492, -0.0012616515159606934, -0.0011501312255859375, -0.0010386109352111816, -0.0009270906448364258, -0.0008155703544616699, -0.0007040500640869141, -0.0005925297737121582, -0.00048100948333740234, -0.0003694891929626465, -0.0002579689025878906, -0.00014644861221313477, -3.4928321838378906e-05, 7.659196853637695e-05, 0.0001881122589111328, 0.00029963254928588867, 0.00041115283966064453, 0.0005226731300354004, 0.0006341934204101562, 0.0007457137107849121, 0.000857234001159668, 0.0009687542915344238, 0.0010802745819091797, 0.0011917948722839355, 0.0013033151626586914, 0.0014148354530334473, 0.0015263557434082031, 0.001637876033782959, 0.0017493963241577148, 0.0018609166145324707, 0.0019724369049072266, 0.0020839571952819824, 0.0021954774856567383, 0.002306997776031494, 0.00241851806640625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 2.0, 12.0, 7.0, 14.0, 32.0, 43.0, 46.0, 92.0, 158.0, 234.0, 471.0, 903.0, 1462.0, 3518.0, 8717.0, 30488.0, 646182.0, 309446.0, 30305.0, 9182.0, 3663.0, 1690.0, 797.0, 430.0, 241.0, 138.0, 96.0, 49.0, 43.0, 28.0, 14.0, 12.0, 11.0, 12.0, 6.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7881393432617188e-05, -1.7355196177959442e-05, -1.6828998923301697e-05, -1.630280166864395e-05, -1.5776604413986206e-05, -1.525040715932846e-05, -1.4724209904670715e-05, -1.419801265001297e-05, -1.3671815395355225e-05, -1.314561814069748e-05, -1.2619420886039734e-05, -1.2093223631381989e-05, -1.1567026376724243e-05, -1.1040829122066498e-05, -1.0514631867408752e-05, -9.988434612751007e-06, -9.462237358093262e-06, -8.936040103435516e-06, -8.409842848777771e-06, -7.883645594120026e-06, -7.35744833946228e-06, -6.831251084804535e-06, -6.3050538301467896e-06, -5.778856575489044e-06, -5.252659320831299e-06, -4.7264620661735535e-06, -4.200264811515808e-06, -3.6740675568580627e-06, -3.1478703022003174e-06, -2.621673047542572e-06, -2.0954757928848267e-06, -1.5692785382270813e-06, -1.043081283569336e-06, -5.168840289115906e-07, 9.313225746154785e-09, 5.355104804039001e-07, 1.0617077350616455e-06, 1.5879049897193909e-06, 2.1141022443771362e-06, 2.6402994990348816e-06, 3.166496753692627e-06, 3.6926940083503723e-06, 4.218891263008118e-06, 4.745088517665863e-06, 5.271285772323608e-06, 5.797483026981354e-06, 6.323680281639099e-06, 6.8498775362968445e-06, 7.37607479095459e-06, 7.902272045612335e-06, 8.42846930027008e-06, 8.954666554927826e-06, 9.480863809585571e-06, 1.0007061064243317e-05, 1.0533258318901062e-05, 1.1059455573558807e-05, 1.1585652828216553e-05, 1.2111850082874298e-05, 1.2638047337532043e-05, 1.3164244592189789e-05, 1.3690441846847534e-05, 1.421663910150528e-05, 1.4742836356163025e-05, 1.526903361082077e-05, 1.5795230865478516e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 60.0, 0.0, 0.0, 0.0, 142.0, 0.0, 0.0, 198.0, 0.0, 0.0, 0.0, 206.0, 0.0, 0.0, 0.0, 198.0, 0.0, 0.0, 124.0, 0.0, 0.0, 0.0, 41.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-07, -4.600733518600464e-07, -4.4330954551696777e-07, -4.2654573917388916e-07, -4.0978193283081055e-07, -3.9301812648773193e-07, -3.762543201446533e-07, -3.594905138015747e-07, -3.427267074584961e-07, -3.259629011154175e-07, -3.0919909477233887e-07, -2.9243528842926025e-07, -2.7567148208618164e-07, -2.5890767574310303e-07, -2.421438694000244e-07, -2.253800630569458e-07, -2.086162567138672e-07, -1.9185245037078857e-07, -1.7508864402770996e-07, -1.5832483768463135e-07, -1.4156103134155273e-07, -1.2479722499847412e-07, -1.0803341865539551e-07, -9.12696123123169e-08, -7.450580596923828e-08, -5.774199962615967e-08, -4.0978193283081055e-08, -2.421438694000244e-08, -7.450580596923828e-09, 9.313225746154785e-09, 2.60770320892334e-08, 4.284083843231201e-08, 5.960464477539063e-08, 7.636845111846924e-08, 9.313225746154785e-08, 1.0989606380462646e-07, 1.2665987014770508e-07, 1.434236764907837e-07, 1.601874828338623e-07, 1.7695128917694092e-07, 1.9371509552001953e-07, 2.1047890186309814e-07, 2.2724270820617676e-07, 2.4400651454925537e-07, 2.60770320892334e-07, 2.775341272354126e-07, 2.942979335784912e-07, 3.110617399215698e-07, 3.2782554626464844e-07, 3.4458935260772705e-07, 3.6135315895080566e-07, 3.781169652938843e-07, 3.948807716369629e-07, 4.116445779800415e-07, 4.284083843231201e-07, 4.4517219066619873e-07, 4.6193599700927734e-07, 4.78699803352356e-07, 4.954636096954346e-07, 5.122274160385132e-07, 5.289912223815918e-07, 5.457550287246704e-07, 5.62518835067749e-07, 5.792826414108276e-07, 5.960464477539062e-07]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 7.0, 18.0, 15.0, 36.0, 37.0, 77.0, 138.0, 296.0, 717.0, 1870.0, 6292.0, 30490.0, 825131.0, 161434.0, 15764.0, 3966.0, 1269.0, 496.0, 205.0, 103.0, 74.0, 46.0, 23.0, 17.0, 11.0, 6.0, 8.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.811981201171875e-05, -1.764018088579178e-05, -1.7160549759864807e-05, -1.6680918633937836e-05, -1.6201287508010864e-05, -1.5721656382083893e-05, -1.5242025256156921e-05, -1.476239413022995e-05, -1.4282763004302979e-05, -1.3803131878376007e-05, -1.3323500752449036e-05, -1.2843869626522064e-05, -1.2364238500595093e-05, -1.1884607374668121e-05, -1.140497624874115e-05, -1.0925345122814178e-05, -1.0445713996887207e-05, -9.966082870960236e-06, -9.486451745033264e-06, -9.006820619106293e-06, -8.527189493179321e-06, -8.04755836725235e-06, -7.567927241325378e-06, -7.088296115398407e-06, -6.6086649894714355e-06, -6.129033863544464e-06, -5.649402737617493e-06, -5.169771611690521e-06, -4.69014048576355e-06, -4.210509359836578e-06, -3.730878233909607e-06, -3.2512471079826355e-06, -2.771615982055664e-06, -2.2919848561286926e-06, -1.8123537302017212e-06, -1.3327226042747498e-06, -8.530914783477783e-07, -3.734603524208069e-07, 1.0617077350616455e-07, 5.85801899433136e-07, 1.0654330253601074e-06, 1.5450641512870789e-06, 2.0246952772140503e-06, 2.5043264031410217e-06, 2.983957529067993e-06, 3.4635886549949646e-06, 3.943219780921936e-06, 4.4228509068489075e-06, 4.902482032775879e-06, 5.38211315870285e-06, 5.861744284629822e-06, 6.341375410556793e-06, 6.821006536483765e-06, 7.300637662410736e-06, 7.780268788337708e-06, 8.259899914264679e-06, 8.73953104019165e-06, 9.219162166118622e-06, 9.698793292045593e-06, 1.0178424417972565e-05, 1.0658055543899536e-05, 1.1137686669826508e-05, 1.1617317795753479e-05, 1.209694892168045e-05, 1.2576580047607422e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 5.0, 15.0, 15.0, 14.0, 35.0, 59.0, 60.0, 221.0, 254.0, 108.0, 93.0, 42.0, 14.0, 22.0, 9.0, 4.0, 9.0, 7.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6226043701171875e-06, -2.5229528546333313e-06, -2.423301339149475e-06, -2.323649823665619e-06, -2.2239983081817627e-06, -2.1243467926979065e-06, -2.0246952772140503e-06, -1.925043761730194e-06, -1.8253922462463379e-06, -1.7257407307624817e-06, -1.6260892152786255e-06, -1.5264376997947693e-06, -1.426786184310913e-06, -1.3271346688270569e-06, -1.2274831533432007e-06, -1.1278316378593445e-06, -1.0281801223754883e-06, -9.285286068916321e-07, -8.288770914077759e-07, -7.292255759239197e-07, -6.295740604400635e-07, -5.299225449562073e-07, -4.302710294723511e-07, -3.3061951398849487e-07, -2.3096799850463867e-07, -1.3131648302078247e-07, -3.166496753692627e-08, 6.798654794692993e-08, 1.6763806343078613e-07, 2.6728957891464233e-07, 3.6694109439849854e-07, 4.6659260988235474e-07, 5.662441253662109e-07, 6.658956408500671e-07, 7.655471563339233e-07, 8.651986718177795e-07, 9.648501873016357e-07, 1.064501702785492e-06, 1.1641532182693481e-06, 1.2638047337532043e-06, 1.3634562492370605e-06, 1.4631077647209167e-06, 1.562759280204773e-06, 1.6624107956886292e-06, 1.7620623111724854e-06, 1.8617138266563416e-06, 1.9613653421401978e-06, 2.061016857624054e-06, 2.16066837310791e-06, 2.2603198885917664e-06, 2.3599714040756226e-06, 2.4596229195594788e-06, 2.559274435043335e-06, 2.658925950527191e-06, 2.7585774660110474e-06, 2.8582289814949036e-06, 2.9578804969787598e-06, 3.057532012462616e-06, 3.157183527946472e-06, 3.2568350434303284e-06, 3.3564865589141846e-06, 3.4561380743980408e-06, 3.555789589881897e-06, 3.655441105365753e-06, 3.7550926208496094e-06]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 7.0, 17.0, 38.0, 66.0, 148.0, 411.0, 140.0, 67.0, 38.0, 25.0, 13.0, 13.0, 8.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005755851045250893, -0.005639663897454739, -0.005523476749658585, -0.005407289601862431, -0.0052911024540662766, -0.00517491577193141, -0.005058728624135256, -0.004942541476339102, -0.004826354328542948, -0.004710167180746794, -0.00459398003295064, -0.004477792885154486, -0.004361606203019619, -0.004245419055223465, -0.004129231907427311, -0.004013044759631157, -0.003896857611835003, -0.003780670464038849, -0.003664483316242695, -0.0035482964012771845, -0.0034321092534810305, -0.0033159221056848764, -0.003199735190719366, -0.003083548042923212, -0.002967360895127058, -0.002851173747330904, -0.00273498659953475, -0.0026187996845692396, -0.0025026125367730856, -0.0023864253889769316, -0.002270238474011421, -0.002154051326215267, -0.002037864178419113, -0.0019216770306229591, -0.001805489999242127, -0.0016893029678612947, -0.0015731158200651407, -0.0014569286722689867, -0.0013407416408881545, -0.0012245546095073223, -0.0011083675781264901, -0.000992180546745658, -0.0008759933989495039, -0.0007598063093610108, -0.0006436192197725177, -0.0005274321301840246, -0.00041124504059553146, -0.00029505795100703835, -0.00017887086141854525, -6.268377183005214e-05, 5.350331775844097e-05, 0.00016969040734693408, 0.0002858774969354272, 0.0004020645865239203, 0.0005182516761124134, 0.0006344387657009065, 0.0007506258552893996, 0.0008668129448778927, 0.0009830000344663858, 0.0010991871822625399, 0.001215374213643372, 0.0013315612450242043, 0.0014477483928203583, 0.0015639355406165123, 0.0016801225719973445]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 8.0, 4.0, 12.0, 18.0, 19.0, 30.0, 28.0, 42.0, 47.0, 51.0, 64.0, 73.0, 84.0, 57.0, 65.0, 63.0, 67.0, 65.0, 47.0, 39.0, 34.0, 22.0, 17.0, 12.0, 5.0, 7.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0014516121009364724, -0.001405073911882937, -0.0013585356064140797, -0.0013119974173605442, -0.0012654592283070087, -0.0012189209228381515, -0.001172382733784616, -0.0011258444283157587, -0.0010793062392622232, -0.0010327680502086878, -0.0009862297447398305, -0.000939691555686295, -0.0008931533084250987, -0.0008466150611639023, -0.0008000768721103668, -0.0007535386248491704, -0.0007070003775879741, -0.0006604621303267777, -0.0006139238830655813, -0.0005673856940120459, -0.0005208474467508495, -0.0004743091994896531, -0.0004277709813322872, -0.0003812327631749213, -0.0003346945159137249, -0.0002881562686525285, -0.0002416180504951626, -0.00019507981778588146, -0.0001485415850766003, -0.00010200335236731917, -5.546511965803802e-05, -8.926901500672102e-06, 3.7611229345202446e-05, 8.414946205448359e-05, 0.00013068769476376474, 0.00017722592747304589, 0.00022376416018232703, 0.0002703024074435234, 0.0003168406256008893, 0.00036337884375825524, 0.0004099170910194516, 0.000456455338280648, 0.0005029935855418444, 0.0005495317745953798, 0.0005960700218565762, 0.0006426082691177726, 0.000689146458171308, 0.0007356847054325044, 0.0007822229526937008, 0.0008287611999548972, 0.0008752994472160935, 0.000921837636269629, 0.0009683758835308254, 0.0010149141307920218, 0.0010614523198455572, 0.0011079905088990927, 0.00115452881436795, 0.0012010670034214854, 0.0012476053088903427, 0.0012941434979438782, 0.0013406816869974136, 0.001387219992466271, 0.0014337581815198064, 0.0014802964869886637, 0.0015268346760421991]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 11.0, 12.0, 20.0, 21.0, 29.0, 52.0, 66.0, 116.0, 152.0, 244.0, 386.0, 630.0, 1166.0, 2362.0, 4771.0, 10809.0, 25969.0, 71586.0, 303474.0, 490358.0, 83926.0, 29283.0, 12175.0, 5301.0, 2526.0, 1271.0, 699.0, 395.0, 246.0, 166.0, 108.0, 66.0, 46.0, 48.0, 26.0, 15.0, 5.0, 7.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0017995834350585938, -0.0017467588186264038, -0.0016939342021942139, -0.001641109585762024, -0.001588284969329834, -0.001535460352897644, -0.001482635736465454, -0.0014298111200332642, -0.0013769865036010742, -0.0013241618871688843, -0.0012713372707366943, -0.0012185126543045044, -0.0011656880378723145, -0.0011128634214401245, -0.0010600388050079346, -0.0010072141885757446, -0.0009543895721435547, -0.0009015649557113647, -0.0008487403392791748, -0.0007959157228469849, -0.0007430911064147949, -0.000690266489982605, -0.000637441873550415, -0.0005846172571182251, -0.0005317926406860352, -0.0004789680242538452, -0.0004261434078216553, -0.00037331879138946533, -0.0003204941749572754, -0.00026766955852508545, -0.0002148449420928955, -0.00016202032566070557, -0.00010919570922851562, -5.6371092796325684e-05, -3.546476364135742e-06, 4.92781400680542e-05, 0.00010210275650024414, 0.00015492737293243408, 0.00020775198936462402, 0.00026057660579681396, 0.0003134012222290039, 0.00036622583866119385, 0.0004190504550933838, 0.00047187507152557373, 0.0005246996879577637, 0.0005775243043899536, 0.0006303489208221436, 0.0006831735372543335, 0.0007359981536865234, 0.0007888227701187134, 0.0008416473865509033, 0.0008944720029830933, 0.0009472966194152832, 0.0010001212358474731, 0.001052945852279663, 0.001105770468711853, 0.001158595085144043, 0.001211419701576233, 0.0012642443180084229, 0.0013170689344406128, 0.0013698935508728027, 0.0014227181673049927, 0.0014755427837371826, 0.0015283674001693726, 0.0015811920166015625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 10.0, 4.0, 14.0, 15.0, 25.0, 26.0, 31.0, 36.0, 37.0, 56.0, 58.0, 57.0, 86.0, 111.0, 75.0, 55.0, 55.0, 47.0, 54.0, 32.0, 26.0, 22.0, 21.0, 7.0, 10.0, 6.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00040149688720703125, -0.00038978084921836853, -0.0003780648112297058, -0.0003663487732410431, -0.00035463273525238037, -0.00034291669726371765, -0.00033120065927505493, -0.0003194846212863922, -0.0003077685832977295, -0.00029605254530906677, -0.00028433650732040405, -0.00027262046933174133, -0.0002609044313430786, -0.0002491883933544159, -0.00023747235536575317, -0.00022575631737709045, -0.00021404027938842773, -0.00020232424139976501, -0.0001906082034111023, -0.00017889216542243958, -0.00016717612743377686, -0.00015546008944511414, -0.00014374405145645142, -0.0001320280134677887, -0.00012031197547912598, -0.00010859593749046326, -9.687989950180054e-05, -8.516386151313782e-05, -7.34478235244751e-05, -6.173178553581238e-05, -5.001574754714966e-05, -3.829970955848694e-05, -2.658367156982422e-05, -1.4867633581161499e-05, -3.1515955924987793e-06, 8.56444239616394e-06, 2.028048038482666e-05, 3.199651837348938e-05, 4.37125563621521e-05, 5.542859435081482e-05, 6.714463233947754e-05, 7.886067032814026e-05, 9.057670831680298e-05, 0.0001022927463054657, 0.00011400878429412842, 0.00012572482228279114, 0.00013744086027145386, 0.00014915689826011658, 0.0001608729362487793, 0.00017258897423744202, 0.00018430501222610474, 0.00019602105021476746, 0.00020773708820343018, 0.0002194531261920929, 0.00023116916418075562, 0.00024288520216941833, 0.00025460124015808105, 0.0002663172781467438, 0.0002780333161354065, 0.0002897493541240692, 0.00030146539211273193, 0.00031318143010139465, 0.0003248974680900574, 0.0003366135060787201, 0.0003483295440673828]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 10.0, 27.0, 39.0, 30.0, 41.0, 52.0, 96.0, 135.0, 234.0, 356.0, 511.0, 831.0, 1438.0, 2493.0, 4325.0, 7786.0, 13773.0, 25772.0, 51508.0, 114739.0, 441989.0, 215994.0, 81656.0, 38802.0, 20079.0, 11016.0, 6194.0, 3598.0, 1946.0, 1169.0, 667.0, 461.0, 254.0, 169.0, 127.0, 69.0, 68.0, 30.0, 18.0, 10.0, 8.0, 13.0, 6.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0005688667297363281, -0.0005497783422470093, -0.0005306899547576904, -0.0005116015672683716, -0.0004925131797790527, -0.0004734247922897339, -0.00045433640480041504, -0.0004352480173110962, -0.00041615962982177734, -0.0003970712423324585, -0.00037798285484313965, -0.0003588944673538208, -0.00033980607986450195, -0.0003207176923751831, -0.00030162930488586426, -0.0002825409173965454, -0.00026345252990722656, -0.0002443641424179077, -0.00022527575492858887, -0.00020618736743927002, -0.00018709897994995117, -0.00016801059246063232, -0.00014892220497131348, -0.00012983381748199463, -0.00011074542999267578, -9.165704250335693e-05, -7.256865501403809e-05, -5.348026752471924e-05, -3.439188003540039e-05, -1.5303492546081543e-05, 3.7848949432373047e-06, 2.2873282432556152e-05, 4.1961669921875e-05, 6.105005741119385e-05, 8.01384449005127e-05, 9.922683238983154e-05, 0.00011831521987915039, 0.00013740360736846924, 0.00015649199485778809, 0.00017558038234710693, 0.00019466876983642578, 0.00021375715732574463, 0.00023284554481506348, 0.0002519339323043823, 0.00027102231979370117, 0.00029011070728302, 0.00030919909477233887, 0.0003282874822616577, 0.00034737586975097656, 0.0003664642572402954, 0.00038555264472961426, 0.0004046410322189331, 0.00042372941970825195, 0.0004428178071975708, 0.00046190619468688965, 0.0004809945821762085, 0.0005000829696655273, 0.0005191713571548462, 0.000538259744644165, 0.0005573481321334839, 0.0005764365196228027, 0.0005955249071121216, 0.0006146132946014404, 0.0006337016820907593, 0.0006527900695800781]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 8.0, 5.0, 14.0, 8.0, 18.0, 18.0, 23.0, 21.0, 29.0, 36.0, 48.0, 43.0, 51.0, 52.0, 54.0, 58.0, 51.0, 65.0, 48.0, 53.0, 39.0, 44.0, 33.0, 30.0, 28.0, 21.0, 25.0, 15.0, 25.0, 12.0, 8.0, 7.0, 4.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005545616149902344, -0.0005384311079978943, -0.0005223006010055542, -0.0005061700940132141, -0.000490039587020874, -0.00047390908002853394, -0.00045777857303619385, -0.00044164806604385376, -0.00042551755905151367, -0.0004093870520591736, -0.0003932565450668335, -0.0003771260380744934, -0.0003609955310821533, -0.00034486502408981323, -0.00032873451709747314, -0.00031260401010513306, -0.00029647350311279297, -0.0002803429961204529, -0.0002642124891281128, -0.0002480819821357727, -0.00023195147514343262, -0.00021582096815109253, -0.00019969046115875244, -0.00018355995416641235, -0.00016742944717407227, -0.00015129894018173218, -0.0001351684331893921, -0.000119037926197052, -0.00010290741920471191, -8.677691221237183e-05, -7.064640522003174e-05, -5.451589822769165e-05, -3.838539123535156e-05, -2.2254884243011475e-05, -6.124377250671387e-06, 1.0006129741668701e-05, 2.613663673400879e-05, 4.226714372634888e-05, 5.8397650718688965e-05, 7.452815771102905e-05, 9.065866470336914e-05, 0.00010678917169570923, 0.00012291967868804932, 0.0001390501856803894, 0.0001551806926727295, 0.00017131119966506958, 0.00018744170665740967, 0.00020357221364974976, 0.00021970272064208984, 0.00023583322763442993, 0.00025196373462677, 0.0002680942416191101, 0.0002842247486114502, 0.0003003552556037903, 0.00031648576259613037, 0.00033261626958847046, 0.00034874677658081055, 0.00036487728357315063, 0.0003810077905654907, 0.0003971382975578308, 0.0004132688045501709, 0.000429399311542511, 0.0004455298185348511, 0.00046166032552719116, 0.00047779083251953125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 8.0, 8.0, 15.0, 22.0, 31.0, 31.0, 62.0, 72.0, 105.0, 166.0, 213.0, 314.0, 523.0, 961.0, 1981.0, 6091.0, 41193.0, 882798.0, 98774.0, 9543.0, 2649.0, 1182.0, 646.0, 392.0, 222.0, 188.0, 105.0, 88.0, 49.0, 28.0, 24.0, 24.0, 10.0, 12.0, 5.0, 8.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8715858459472656e-05, -1.8124468624591827e-05, -1.7533078789711e-05, -1.694168895483017e-05, -1.635029911994934e-05, -1.5758909285068512e-05, -1.5167519450187683e-05, -1.4576129615306854e-05, -1.3984739780426025e-05, -1.3393349945545197e-05, -1.2801960110664368e-05, -1.2210570275783539e-05, -1.161918044090271e-05, -1.1027790606021881e-05, -1.0436400771141052e-05, -9.845010936260223e-06, -9.253621101379395e-06, -8.662231266498566e-06, -8.070841431617737e-06, -7.479451596736908e-06, -6.888061761856079e-06, -6.29667192697525e-06, -5.705282092094421e-06, -5.1138922572135925e-06, -4.522502422332764e-06, -3.931112587451935e-06, -3.339722752571106e-06, -2.748332917690277e-06, -2.1569430828094482e-06, -1.5655532479286194e-06, -9.741634130477905e-07, -3.8277357816696167e-07, 2.086162567138672e-07, 8.00006091594696e-07, 1.391395926475525e-06, 1.9827857613563538e-06, 2.5741755962371826e-06, 3.1655654311180115e-06, 3.7569552659988403e-06, 4.348345100879669e-06, 4.939734935760498e-06, 5.531124770641327e-06, 6.122514605522156e-06, 6.713904440402985e-06, 7.3052942752838135e-06, 7.896684110164642e-06, 8.488073945045471e-06, 9.0794637799263e-06, 9.670853614807129e-06, 1.0262243449687958e-05, 1.0853633284568787e-05, 1.1445023119449615e-05, 1.2036412954330444e-05, 1.2627802789211273e-05, 1.3219192624092102e-05, 1.3810582458972931e-05, 1.440197229385376e-05, 1.4993362128734589e-05, 1.5584751963615417e-05, 1.6176141798496246e-05, 1.6767531633377075e-05, 1.7358921468257904e-05, 1.7950311303138733e-05, 1.8541701138019562e-05, 1.913309097290039e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [29.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 196.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 578.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 179.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1920928955078125e-07, -1.1455267667770386e-07, -1.0989606380462646e-07, -1.0523945093154907e-07, -1.0058283805847168e-07, -9.592622518539429e-08, -9.12696123123169e-08, -8.66129994392395e-08, -8.195638656616211e-08, -7.729977369308472e-08, -7.264316082000732e-08, -6.798654794692993e-08, -6.332993507385254e-08, -5.8673322200775146e-08, -5.4016709327697754e-08, -4.936009645462036e-08, -4.470348358154297e-08, -4.0046870708465576e-08, -3.5390257835388184e-08, -3.073364496231079e-08, -2.60770320892334e-08, -2.1420419216156006e-08, -1.6763806343078613e-08, -1.210719347000122e-08, -7.450580596923828e-09, -2.7939677238464355e-09, 1.862645149230957e-09, 6.51925802230835e-09, 1.1175870895385742e-08, 1.5832483768463135e-08, 2.0489096641540527e-08, 2.514570951461792e-08, 2.9802322387695312e-08, 3.4458935260772705e-08, 3.91155481338501e-08, 4.377216100692749e-08, 4.842877388000488e-08, 5.3085386753082275e-08, 5.774199962615967e-08, 6.239861249923706e-08, 6.705522537231445e-08, 7.171183824539185e-08, 7.636845111846924e-08, 8.102506399154663e-08, 8.568167686462402e-08, 9.033828973770142e-08, 9.499490261077881e-08, 9.96515154838562e-08, 1.043081283569336e-07, 1.0896474123001099e-07, 1.1362135410308838e-07, 1.1827796697616577e-07, 1.2293457984924316e-07, 1.2759119272232056e-07, 1.3224780559539795e-07, 1.3690441846847534e-07, 1.4156103134155273e-07, 1.4621764421463013e-07, 1.5087425708770752e-07, 1.555308699607849e-07, 1.601874828338623e-07, 1.648440957069397e-07, 1.695007085800171e-07, 1.7415732145309448e-07, 1.7881393432617188e-07]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 1.0, 13.0, 8.0, 23.0, 41.0, 52.0, 97.0, 144.0, 243.0, 488.0, 977.0, 2539.0, 9456.0, 103798.0, 894730.0, 27791.0, 4850.0, 1691.0, 700.0, 403.0, 223.0, 111.0, 61.0, 33.0, 26.0, 22.0, 13.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.282857894897461e-05, -2.2162683308124542e-05, -2.1496787667274475e-05, -2.0830892026424408e-05, -2.016499638557434e-05, -1.9499100744724274e-05, -1.8833205103874207e-05, -1.816730946302414e-05, -1.7501413822174072e-05, -1.6835518181324005e-05, -1.6169622540473938e-05, -1.550372689962387e-05, -1.4837831258773804e-05, -1.4171935617923737e-05, -1.350603997707367e-05, -1.2840144336223602e-05, -1.2174248695373535e-05, -1.1508353054523468e-05, -1.0842457413673401e-05, -1.0176561772823334e-05, -9.510666131973267e-06, -8.8447704911232e-06, -8.178874850273132e-06, -7.512979209423065e-06, -6.847083568572998e-06, -6.181187927722931e-06, -5.515292286872864e-06, -4.849396646022797e-06, -4.1835010051727295e-06, -3.5176053643226624e-06, -2.8517097234725952e-06, -2.185814082622528e-06, -1.519918441772461e-06, -8.540228009223938e-07, -1.8812716007232666e-07, 4.777684807777405e-07, 1.1436641216278076e-06, 1.8095597624778748e-06, 2.475455403327942e-06, 3.141351044178009e-06, 3.807246685028076e-06, 4.473142325878143e-06, 5.1390379667282104e-06, 5.804933607578278e-06, 6.470829248428345e-06, 7.136724889278412e-06, 7.802620530128479e-06, 8.468516170978546e-06, 9.134411811828613e-06, 9.80030745267868e-06, 1.0466203093528748e-05, 1.1132098734378815e-05, 1.1797994375228882e-05, 1.2463890016078949e-05, 1.3129785656929016e-05, 1.3795681297779083e-05, 1.446157693862915e-05, 1.5127472579479218e-05, 1.5793368220329285e-05, 1.6459263861179352e-05, 1.712515950202942e-05, 1.7791055142879486e-05, 1.8456950783729553e-05, 1.912284642457962e-05, 1.9788742065429688e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 2.0, 4.0, 4.0, 7.0, 3.0, 7.0, 13.0, 11.0, 18.0, 29.0, 70.0, 107.0, 193.0, 246.0, 122.0, 56.0, 36.0, 18.0, 12.0, 15.0, 7.0, 4.0, 6.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.52346420288086e-06, -8.239410817623138e-06, -7.955357432365417e-06, -7.671304047107697e-06, -7.387250661849976e-06, -7.103197276592255e-06, -6.819143891334534e-06, -6.535090506076813e-06, -6.251037120819092e-06, -5.966983735561371e-06, -5.68293035030365e-06, -5.398876965045929e-06, -5.114823579788208e-06, -4.830770194530487e-06, -4.546716809272766e-06, -4.262663424015045e-06, -3.978610038757324e-06, -3.6945566534996033e-06, -3.4105032682418823e-06, -3.1264498829841614e-06, -2.8423964977264404e-06, -2.5583431124687195e-06, -2.2742897272109985e-06, -1.9902363419532776e-06, -1.7061829566955566e-06, -1.4221295714378357e-06, -1.1380761861801147e-06, -8.540228009223938e-07, -5.699694156646729e-07, -2.859160304069519e-07, -1.862645149230957e-09, 2.8219074010849e-07, 5.662441253662109e-07, 8.502975106239319e-07, 1.1343508958816528e-06, 1.4184042811393738e-06, 1.7024576663970947e-06, 1.9865110516548157e-06, 2.2705644369125366e-06, 2.5546178221702576e-06, 2.8386712074279785e-06, 3.1227245926856995e-06, 3.4067779779434204e-06, 3.6908313632011414e-06, 3.974884748458862e-06, 4.258938133716583e-06, 4.542991518974304e-06, 4.827044904232025e-06, 5.111098289489746e-06, 5.395151674747467e-06, 5.679205060005188e-06, 5.963258445262909e-06, 6.24731183052063e-06, 6.531365215778351e-06, 6.815418601036072e-06, 7.099471986293793e-06, 7.383525371551514e-06, 7.667578756809235e-06, 7.951632142066956e-06, 8.235685527324677e-06, 8.519738912582397e-06, 8.803792297840118e-06, 9.08784568309784e-06, 9.37189906835556e-06, 9.655952453613281e-06]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 6.0, 11.0, 9.0, 24.0, 22.0, 43.0, 52.0, 81.0, 208.0, 254.0, 99.0, 56.0, 41.0, 24.0, 17.0, 14.0, 9.0, 4.0, 5.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015356190269812942, -0.0014891847968101501, -0.001442750683054328, -0.001396316452883184, -0.0013498823391273618, -0.0013034481089562178, -0.0012570139952003956, -0.0012105797650292516, -0.0011641455348581076, -0.0011177113046869636, -0.0010712771909311414, -0.0010248429607599974, -0.0009784088470041752, -0.0009319746168330312, -0.0008855404448695481, -0.000839106272906065, -0.0007926721009425819, -0.0007462379289790988, -0.0006998037570156157, -0.0006533695850521326, -0.0006069353548809886, -0.0005605011829175055, -0.0005140670109540224, -0.00046763280988670886, -0.00042119863792322576, -0.00037476446595974267, -0.0003283302648924291, -0.000281896092928946, -0.0002354619064135477, -0.00018902771989814937, -0.00014259354793466628, -9.615934686735272e-05, -4.972517490386963e-05, -3.2909920264501125e-06, 4.3143190850969404e-05, 8.957737009041011e-05, 0.00013601155660580844, 0.00018244574312120676, 0.00022887991508468986, 0.0002753141161520034, 0.0003217482881154865, 0.0003681824600789696, 0.00041461666114628315, 0.00046105083310976624, 0.0005074850050732493, 0.0005539192352443933, 0.0006003533490002155, 0.0006467875791713595, 0.0006932217511348426, 0.0007396559230983257, 0.0007860900950618088, 0.0008325242670252919, 0.0008789584971964359, 0.000925392669159919, 0.0009718268411234021, 0.0010182610712945461, 0.0010646951850503683, 0.0011111294152215123, 0.0011575635289773345, 0.0012039977591484785, 0.0012504318729043007, 0.0012968661030754447, 0.0013433003332465887, 0.0013897344470024109, 0.001436168677173555]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 8.0, 15.0, 11.0, 14.0, 22.0, 19.0, 26.0, 26.0, 31.0, 42.0, 32.0, 43.0, 41.0, 44.0, 29.0, 58.0, 40.0, 33.0, 38.0, 43.0, 40.0, 33.0, 36.0, 35.0, 35.0, 33.0, 23.0, 19.0, 18.0, 23.0, 15.0, 11.0, 7.0, 12.0, 6.0, 9.0, 3.0, 5.0, 3.0, 3.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006491825915873051, -0.0006252751336432993, -0.0006013676174916327, -0.000577460159547627, -0.0005535526433959603, -0.0005296451854519546, -0.0005057377275079489, -0.00048183021135628223, -0.0004579227534122765, -0.0004340152663644403, -0.00041010777931660414, -0.0003862003213725984, -0.0003622928343247622, -0.00033838534727692604, -0.00031447786022908986, -0.00029057037318125367, -0.0002666628861334175, -0.0002427553990855813, -0.00021884792658966035, -0.00019494043954182416, -0.0001710329670459032, -0.00014712547999806702, -0.00012321799295023084, -9.931052045430988e-05, -7.54030334064737e-05, -5.1495553634595126e-05, -2.758807022473775e-05, -3.680586814880371e-06, 2.02268929569982e-05, 4.413437272887677e-05, 6.804185977671295e-05, 9.194933227263391e-05, 0.0001158568193204701, 0.00013976430636830628, 0.00016367177886422724, 0.00018757926591206342, 0.00021148673840798438, 0.00023539422545582056, 0.00025930171250365674, 0.00028320919955149293, 0.00030711665749549866, 0.00033102414454333484, 0.000354931631591171, 0.00037883908953517675, 0.00040274657658301294, 0.0004266540636308491, 0.0004505615506786853, 0.0004744690377265215, 0.0004983765538781881, 0.0005222840118221939, 0.0005461915279738605, 0.0005700989859178662, 0.0005940065020695329, 0.0006179139600135386, 0.0006418214179575443, 0.000665728934109211, 0.0006896363920532167, 0.0007135438499972224, 0.0007374513661488891, 0.0007613588240928948, 0.0007852663402445614, 0.0008091737981885672, 0.0008330813143402338, 0.0008569887722842395, 0.0008808962302282453]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 8.0, 8.0, 15.0, 28.0, 45.0, 82.0, 148.0, 269.0, 589.0, 1221.0, 2600.0, 5363.0, 11284.0, 24197.0, 51081.0, 105323.0, 208805.0, 407663.0, 2012684.0, 745283.0, 291628.0, 154997.0, 80988.0, 42188.0, 22457.0, 11744.0, 6283.0, 3239.0, 1792.0, 928.0, 546.0, 319.0, 180.0, 121.0, 64.0, 38.0, 22.0, 21.0, 12.0, 3.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017595291137695312, -0.00016940012574195862, -0.0001628473401069641, -0.0001562945544719696, -0.0001497417688369751, -0.0001431889832019806, -0.00013663619756698608, -0.00013008341193199158, -0.00012353062629699707, -0.00011697784066200256, -0.00011042505502700806, -0.00010387226939201355, -9.731948375701904e-05, -9.076669812202454e-05, -8.421391248703003e-05, -7.766112685203552e-05, -7.110834121704102e-05, -6.455555558204651e-05, -5.8002769947052e-05, -5.1449984312057495e-05, -4.489719867706299e-05, -3.834441304206848e-05, -3.1791627407073975e-05, -2.5238841772079468e-05, -1.868605613708496e-05, -1.2133270502090454e-05, -5.580484867095947e-06, 9.723007678985596e-07, 7.525086402893066e-06, 1.4077872037887573e-05, 2.063065767288208e-05, 2.7183443307876587e-05, 3.3736228942871094e-05, 4.02890145778656e-05, 4.684180021286011e-05, 5.3394585847854614e-05, 5.994737148284912e-05, 6.650015711784363e-05, 7.305294275283813e-05, 7.960572838783264e-05, 8.615851402282715e-05, 9.271129965782166e-05, 9.926408529281616e-05, 0.00010581687092781067, 0.00011236965656280518, 0.00011892244219779968, 0.0001254752278327942, 0.0001320280134677887, 0.0001385807991027832, 0.0001451335847377777, 0.00015168637037277222, 0.00015823915600776672, 0.00016479194164276123, 0.00017134472727775574, 0.00017789751291275024, 0.00018445029854774475, 0.00019100308418273926, 0.00019755586981773376, 0.00020410865545272827, 0.00021066144108772278, 0.00021721422672271729, 0.0002237670123577118, 0.0002303197979927063, 0.0002368725836277008, 0.0002434253692626953]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 10.0, 10.0, 8.0, 10.0, 20.0, 21.0, 20.0, 27.0, 22.0, 27.0, 28.0, 47.0, 24.0, 29.0, 45.0, 40.0, 37.0, 47.0, 55.0, 59.0, 38.0, 48.0, 33.0, 31.0, 28.0, 28.0, 26.0, 19.0, 23.0, 29.0, 20.0, 9.0, 12.0, 11.0, 10.0, 10.0, 4.0, 10.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.8417835235595703e-05, -1.783110201358795e-05, -1.72443687915802e-05, -1.665763556957245e-05, -1.6070902347564697e-05, -1.5484169125556946e-05, -1.4897435903549194e-05, -1.4310702681541443e-05, -1.3723969459533691e-05, -1.313723623752594e-05, -1.2550503015518188e-05, -1.1963769793510437e-05, -1.1377036571502686e-05, -1.0790303349494934e-05, -1.0203570127487183e-05, -9.616836905479431e-06, -9.03010368347168e-06, -8.443370461463928e-06, -7.856637239456177e-06, -7.269904017448425e-06, -6.683170795440674e-06, -6.096437573432922e-06, -5.509704351425171e-06, -4.9229711294174194e-06, -4.336237907409668e-06, -3.7495046854019165e-06, -3.162771463394165e-06, -2.5760382413864136e-06, -1.989305019378662e-06, -1.4025717973709106e-06, -8.158385753631592e-07, -2.2910535335540771e-07, 3.5762786865234375e-07, 9.443610906600952e-07, 1.5310943126678467e-06, 2.117827534675598e-06, 2.7045607566833496e-06, 3.291293978691101e-06, 3.8780272006988525e-06, 4.464760422706604e-06, 5.0514936447143555e-06, 5.638226866722107e-06, 6.224960088729858e-06, 6.81169331073761e-06, 7.398426532745361e-06, 7.985159754753113e-06, 8.571892976760864e-06, 9.158626198768616e-06, 9.745359420776367e-06, 1.0332092642784119e-05, 1.091882586479187e-05, 1.1505559086799622e-05, 1.2092292308807373e-05, 1.2679025530815125e-05, 1.3265758752822876e-05, 1.3852491974830627e-05, 1.4439225196838379e-05, 1.502595841884613e-05, 1.5612691640853882e-05, 1.6199424862861633e-05, 1.6786158084869385e-05, 1.7372891306877136e-05, 1.7959624528884888e-05, 1.854635775089264e-05, 1.913309097290039e-05]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 8.0, 14.0, 22.0, 35.0, 50.0, 100.0, 149.0, 192.0, 316.0, 730.0, 5899.0, 4167838.0, 17438.0, 666.0, 275.0, 162.0, 144.0, 88.0, 59.0, 32.0, 31.0, 10.0, 13.0, 10.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005135536193847656, -0.00048435479402542114, -0.00045515596866607666, -0.0004259571433067322, -0.0003967583179473877, -0.0003675594925880432, -0.00033836066722869873, -0.00030916184186935425, -0.00027996301651000977, -0.0002507641911506653, -0.0002215653657913208, -0.00019236654043197632, -0.00016316771507263184, -0.00013396888971328735, -0.00010477006435394287, -7.557123899459839e-05, -4.6372413635253906e-05, -1.7173588275909424e-05, 1.2025237083435059e-05, 4.122406244277954e-05, 7.042288780212402e-05, 9.96217131614685e-05, 0.000128820538520813, 0.00015801936388015747, 0.00018721818923950195, 0.00021641701459884644, 0.0002456158399581909, 0.0002748146653175354, 0.0003040134906768799, 0.00033321231603622437, 0.00036241114139556885, 0.00039160996675491333, 0.0004208087921142578, 0.0004500076174736023, 0.0004792064428329468, 0.0005084052681922913, 0.0005376040935516357, 0.0005668029189109802, 0.0005960017442703247, 0.0006252005696296692, 0.0006543993949890137, 0.0006835982203483582, 0.0007127970457077026, 0.0007419958710670471, 0.0007711946964263916, 0.0008003935217857361, 0.0008295923471450806, 0.000858791172504425, 0.0008879899978637695, 0.000917188823223114, 0.0009463876485824585, 0.000975586473941803, 0.0010047852993011475, 0.001033984124660492, 0.0010631829500198364, 0.001092381775379181, 0.0011215806007385254, 0.0011507794260978699, 0.0011799782514572144, 0.0012091770768165588, 0.0012383759021759033, 0.0012675747275352478, 0.0012967735528945923, 0.0013259723782539368, 0.0013551712036132812]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 20.0, 17.0, 36.0, 56.0, 88.0, 147.0, 174.0, 248.0, 344.0, 462.0, 895.0, 488.0, 313.0, 223.0, 164.0, 141.0, 92.0, 65.0, 31.0, 30.0, 13.0, 10.0, 9.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.0279159545898438e-05, -2.84537672996521e-05, -2.6628375053405762e-05, -2.4802982807159424e-05, -2.2977590560913086e-05, -2.1152198314666748e-05, -1.932680606842041e-05, -1.7501413822174072e-05, -1.5676021575927734e-05, -1.3850629329681396e-05, -1.2025237083435059e-05, -1.019984483718872e-05, -8.374452590942383e-06, -6.549060344696045e-06, -4.723668098449707e-06, -2.898275852203369e-06, -1.0728836059570312e-06, 7.525086402893066e-07, 2.5779008865356445e-06, 4.403293132781982e-06, 6.22868537902832e-06, 8.054077625274658e-06, 9.879469871520996e-06, 1.1704862117767334e-05, 1.3530254364013672e-05, 1.535564661026001e-05, 1.7181038856506348e-05, 1.9006431102752686e-05, 2.0831823348999023e-05, 2.265721559524536e-05, 2.44826078414917e-05, 2.6308000087738037e-05, 2.8133392333984375e-05, 2.9958784580230713e-05, 3.178417682647705e-05, 3.360956907272339e-05, 3.5434961318969727e-05, 3.7260353565216064e-05, 3.90857458114624e-05, 4.091113805770874e-05, 4.273653030395508e-05, 4.4561922550201416e-05, 4.6387314796447754e-05, 4.821270704269409e-05, 5.003809928894043e-05, 5.186349153518677e-05, 5.3688883781433105e-05, 5.551427602767944e-05, 5.733966827392578e-05, 5.916506052017212e-05, 6.099045276641846e-05, 6.28158450126648e-05, 6.464123725891113e-05, 6.646662950515747e-05, 6.829202175140381e-05, 7.011741399765015e-05, 7.194280624389648e-05, 7.376819849014282e-05, 7.559359073638916e-05, 7.74189829826355e-05, 7.924437522888184e-05, 8.106976747512817e-05, 8.289515972137451e-05, 8.472055196762085e-05, 8.654594421386719e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 15.0, 27.0, 71.0, 311.0, 468.0, 82.0, 27.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006887888303026557, -0.0006651565781794488, -0.000641524326056242, -0.0006178920157253742, -0.0005942597636021674, -0.0005706275114789605, -0.0005469952593557537, -0.0005233630072325468, -0.000499730696901679, -0.0004760984447784722, -0.0004524661635514349, -0.000428833911428228, -0.0004052016302011907, -0.00038156937807798386, -0.000357937125954777, -0.00033430487383157015, -0.0003106726217083633, -0.00028704036958515644, -0.00026340808835811913, -0.00023977583623491228, -0.0002161435695597902, -0.0001925113028846681, -0.00016887905076146126, -0.00014524678408633918, -0.0001216145174112171, -9.798225073609501e-05, -7.434999133693054e-05, -5.0717731937766075e-05, -2.7085465262643993e-05, -3.4531985875219107e-06, 2.0179053535684943e-05, 4.3811320210807025e-05, 6.744364509359002e-05, 9.10759117687121e-05, 0.00011470817116787657, 0.00013834043056704104, 0.00016197269724216312, 0.0001856049639172852, 0.00020923721604049206, 0.00023286948271561414, 0.0002565017493907362, 0.0002801340015139431, 0.0003037662827409804, 0.00032739853486418724, 0.0003510307869873941, 0.0003746630682144314, 0.00039829532033763826, 0.00042192760156467557, 0.0004455598536878824, 0.0004691921058110893, 0.0004928243579342961, 0.0005164566682651639, 0.0005400889203883708, 0.0005637211725115776, 0.0005873534246347845, 0.0006109856767579913, 0.0006346179870888591, 0.0006582502392120659, 0.0006818824913352728, 0.0007055148016661406, 0.0007291470537893474, 0.0007527793059125543, 0.0007764115580357611, 0.000800043810158968, 0.0008236760622821748]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 10.0, 7.0, 16.0, 11.0, 19.0, 21.0, 18.0, 29.0, 33.0, 36.0, 43.0, 40.0, 48.0, 51.0, 53.0, 56.0, 42.0, 52.0, 52.0, 42.0, 43.0, 43.0, 32.0, 35.0, 23.0, 31.0, 23.0, 17.0, 16.0, 14.0, 10.0, 10.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00012286388664506376, -0.00011956603702856228, -0.00011626819468801841, -0.00011297034507151693, -0.00010967249545501545, -0.00010637465311447158, -0.0001030768034979701, -9.977896115742624e-05, -9.648111154092476e-05, -9.318326192442328e-05, -8.988541958387941e-05, -8.658756996737793e-05, -8.328972035087645e-05, -7.999187801033258e-05, -7.66940283938311e-05, -7.339617877732962e-05, -7.009833643678576e-05, -6.680048682028428e-05, -6.350264447974041e-05, -6.020479486323893e-05, -5.690694888471626e-05, -5.3609102906193584e-05, -5.0311253289692104e-05, -4.701340731116943e-05, -4.371555405668914e-05, -4.041770807816647e-05, -3.711985846166499e-05, -3.3822012483142316e-05, -3.052416650461964e-05, -2.7226318707107566e-05, -2.392847090959549e-05, -2.0630624931072816e-05, -1.7332778952550143e-05, -1.4034932064532768e-05, -1.0737085176515393e-05, -7.439237379003316e-06, -4.141390490985941e-06, -8.435436029685661e-07, 2.4543041945435107e-06, 5.752150173066184e-06, 9.04999797057826e-06, 1.2347844858595636e-05, 1.564569174661301e-05, 1.8943539544125088e-05, 2.2241387341637164e-05, 2.5539233320159838e-05, 2.8837081117671914e-05, 3.213492891518399e-05, 3.5432774893706664e-05, 3.873062087222934e-05, 4.202847048873082e-05, 4.532631646725349e-05, 4.8624162445776165e-05, 5.1922012062277645e-05, 5.521985804080032e-05, 5.851770401932299e-05, 6.181555363582447e-05, 6.511340325232595e-05, 6.841124559286982e-05, 7.17090952093713e-05, 7.500694482587278e-05, 7.830478716641665e-05, 8.160263678291813e-05, 8.49004863994196e-05, 8.819832873996347e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 5.0, 12.0, 9.0, 6.0, 18.0, 20.0, 41.0, 68.0, 149.0, 346.0, 1009.0, 4138.0, 19248.0, 193707.0, 767900.0, 50344.0, 8545.0, 1934.0, 579.0, 214.0, 90.0, 58.0, 31.0, 24.0, 14.0, 7.0, 5.0, 8.0, 5.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.802776336669922e-05, -3.681052476167679e-05, -3.559328615665436e-05, -3.437604755163193e-05, -3.31588089466095e-05, -3.194157034158707e-05, -3.0724331736564636e-05, -2.9507093131542206e-05, -2.8289854526519775e-05, -2.7072615921497345e-05, -2.5855377316474915e-05, -2.4638138711452484e-05, -2.3420900106430054e-05, -2.2203661501407623e-05, -2.0986422896385193e-05, -1.9769184291362762e-05, -1.8551945686340332e-05, -1.73347070813179e-05, -1.611746847629547e-05, -1.490022987127304e-05, -1.368299126625061e-05, -1.246575266122818e-05, -1.124851405620575e-05, -1.0031275451183319e-05, -8.814036846160889e-06, -7.596798241138458e-06, -6.379559636116028e-06, -5.162321031093597e-06, -3.945082426071167e-06, -2.7278438210487366e-06, -1.5106052160263062e-06, -2.9336661100387573e-07, 9.238719940185547e-07, 2.141110599040985e-06, 3.3583492040634155e-06, 4.575587809085846e-06, 5.792826414108276e-06, 7.010065019130707e-06, 8.227303624153137e-06, 9.444542229175568e-06, 1.0661780834197998e-05, 1.1879019439220428e-05, 1.3096258044242859e-05, 1.431349664926529e-05, 1.553073525428772e-05, 1.674797385931015e-05, 1.796521246433258e-05, 1.918245106935501e-05, 2.039968967437744e-05, 2.1616928279399872e-05, 2.2834166884422302e-05, 2.4051405489444733e-05, 2.5268644094467163e-05, 2.6485882699489594e-05, 2.7703121304512024e-05, 2.8920359909534454e-05, 3.0137598514556885e-05, 3.1354837119579315e-05, 3.2572075724601746e-05, 3.3789314329624176e-05, 3.5006552934646606e-05, 3.622379153966904e-05, 3.744103014469147e-05, 3.86582687497139e-05, 3.987550735473633e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 17.0, 24.0, 34.0, 42.0, 67.0, 80.0, 91.0, 134.0, 133.0, 87.0, 75.0, 64.0, 41.0, 45.0, 26.0, 14.0, 12.0, 7.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.118152618408203e-05, -7.671304047107697e-05, -7.22445547580719e-05, -6.777606904506683e-05, -6.330758333206177e-05, -5.88390976190567e-05, -5.4370611906051636e-05, -4.990212619304657e-05, -4.5433640480041504e-05, -4.096515476703644e-05, -3.649666905403137e-05, -3.2028183341026306e-05, -2.755969762802124e-05, -2.3091211915016174e-05, -1.862272620201111e-05, -1.4154240489006042e-05, -9.685754776000977e-06, -5.217269062995911e-06, -7.487833499908447e-07, 3.719702363014221e-06, 8.188188076019287e-06, 1.2656673789024353e-05, 1.712515950202942e-05, 2.1593645215034485e-05, 2.606213092803955e-05, 3.053061664104462e-05, 3.499910235404968e-05, 3.946758806705475e-05, 4.3936073780059814e-05, 4.840455949306488e-05, 5.2873045206069946e-05, 5.734153091907501e-05, 6.181001663208008e-05, 6.627850234508514e-05, 7.074698805809021e-05, 7.521547377109528e-05, 7.968395948410034e-05, 8.415244519710541e-05, 8.862093091011047e-05, 9.308941662311554e-05, 9.75579023361206e-05, 0.00010202638804912567, 0.00010649487376213074, 0.0001109633594751358, 0.00011543184518814087, 0.00011990033090114594, 0.000124368816614151, 0.00012883730232715607, 0.00013330578804016113, 0.0001377742737531662, 0.00014224275946617126, 0.00014671124517917633, 0.0001511797308921814, 0.00015564821660518646, 0.00016011670231819153, 0.0001645851880311966, 0.00016905367374420166, 0.00017352215945720673, 0.0001779906451702118, 0.00018245913088321686, 0.00018692761659622192, 0.000191396102309227, 0.00019586458802223206, 0.00020033307373523712, 0.0002048015594482422]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 1.0, 9.0, 10.0, 15.0, 25.0, 14.0, 25.0, 45.0, 67.0, 107.0, 149.0, 229.0, 370.0, 619.0, 884.0, 1660.0, 2868.0, 5205.0, 7081.0, 15985.0, 33629.0, 75722.0, 217854.0, 443575.0, 136620.0, 53638.0, 24908.0, 12282.0, 6288.0, 3448.0, 2056.0, 949.0, 760.0, 509.0, 308.0, 193.0, 125.0, 106.0, 58.0, 47.0, 23.0, 26.0, 17.0, 10.0, 11.0, 10.0, 1.0, 3.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.881092071533203e-06, -8.587725460529327e-06, -8.294358849525452e-06, -8.000992238521576e-06, -7.7076256275177e-06, -7.4142590165138245e-06, -7.120892405509949e-06, -6.827525794506073e-06, -6.534159183502197e-06, -6.2407925724983215e-06, -5.947425961494446e-06, -5.65405935049057e-06, -5.360692739486694e-06, -5.067326128482819e-06, -4.773959517478943e-06, -4.480592906475067e-06, -4.187226295471191e-06, -3.893859684467316e-06, -3.60049307346344e-06, -3.307126462459564e-06, -3.0137598514556885e-06, -2.7203932404518127e-06, -2.427026629447937e-06, -2.1336600184440613e-06, -1.8402934074401855e-06, -1.5469267964363098e-06, -1.253560185432434e-06, -9.601935744285583e-07, -6.668269634246826e-07, -3.734603524208069e-07, -8.009374141693115e-08, 2.1327286958694458e-07, 5.066394805908203e-07, 8.00006091594696e-07, 1.0933727025985718e-06, 1.3867393136024475e-06, 1.6801059246063232e-06, 1.973472535610199e-06, 2.2668391466140747e-06, 2.5602057576179504e-06, 2.853572368621826e-06, 3.146938979625702e-06, 3.4403055906295776e-06, 3.7336722016334534e-06, 4.027038812637329e-06, 4.320405423641205e-06, 4.6137720346450806e-06, 4.907138645648956e-06, 5.200505256652832e-06, 5.493871867656708e-06, 5.7872384786605835e-06, 6.080605089664459e-06, 6.373971700668335e-06, 6.667338311672211e-06, 6.9607049226760864e-06, 7.254071533679962e-06, 7.547438144683838e-06, 7.840804755687714e-06, 8.13417136669159e-06, 8.427537977695465e-06, 8.72090458869934e-06, 9.014271199703217e-06, 9.307637810707092e-06, 9.601004421710968e-06, 9.894371032714844e-06]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 9.0, 9.0, 13.0, 15.0, 13.0, 23.0, 31.0, 23.0, 36.0, 46.0, 40.0, 49.0, 63.0, 66.0, 58.0, 56.0, 64.0, 40.0, 68.0, 49.0, 36.0, 34.0, 24.0, 32.0, 21.0, 18.0, 23.0, 12.0, 10.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010645389556884766, -0.00010175816714763641, -9.706243872642517e-05, -9.236671030521393e-05, -8.767098188400269e-05, -8.297525346279144e-05, -7.82795250415802e-05, -7.358379662036896e-05, -6.888806819915771e-05, -6.419233977794647e-05, -5.949661135673523e-05, -5.480088293552399e-05, -5.0105154514312744e-05, -4.54094260931015e-05, -4.071369767189026e-05, -3.6017969250679016e-05, -3.1322240829467773e-05, -2.662651240825653e-05, -2.1930783987045288e-05, -1.7235055565834045e-05, -1.2539327144622803e-05, -7.84359872341156e-06, -3.1478703022003174e-06, 1.5478581190109253e-06, 6.243586540222168e-06, 1.093931496143341e-05, 1.5635043382644653e-05, 2.0330771803855896e-05, 2.502650022506714e-05, 2.972222864627838e-05, 3.4417957067489624e-05, 3.911368548870087e-05, 4.380941390991211e-05, 4.850514233112335e-05, 5.3200870752334595e-05, 5.789659917354584e-05, 6.259232759475708e-05, 6.728805601596832e-05, 7.198378443717957e-05, 7.667951285839081e-05, 8.137524127960205e-05, 8.60709697008133e-05, 9.076669812202454e-05, 9.546242654323578e-05, 0.00010015815496444702, 0.00010485388338565826, 0.00010954961180686951, 0.00011424534022808075, 0.00011894106864929199, 0.00012363679707050323, 0.00012833252549171448, 0.00013302825391292572, 0.00013772398233413696, 0.0001424197107553482, 0.00014711543917655945, 0.0001518111675977707, 0.00015650689601898193, 0.00016120262444019318, 0.00016589835286140442, 0.00017059408128261566, 0.0001752898097038269, 0.00017998553812503815, 0.0001846812665462494, 0.00018937699496746063, 0.00019407272338867188]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 5.0, 5.0, 4.0, 3.0, 2.0, 10.0, 3.0, 9.0, 14.0, 6.0, 30.0, 48.0, 40.0, 95.0, 183.0, 150.0, 474.0, 933.0, 808.0, 2909.0, 2890.0, 14596.0, 100466.0, 802943.0, 99427.0, 13913.0, 2834.0, 2868.0, 1383.0, 372.0, 507.0, 175.0, 187.0, 101.0, 30.0, 40.0, 28.0, 9.0, 15.0, 6.0, 6.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9802322387695312e-06, -2.882443368434906e-06, -2.7846544981002808e-06, -2.6868656277656555e-06, -2.5890767574310303e-06, -2.491287887096405e-06, -2.3934990167617798e-06, -2.2957101464271545e-06, -2.1979212760925293e-06, -2.100132405757904e-06, -2.002343535423279e-06, -1.9045546650886536e-06, -1.8067657947540283e-06, -1.708976924419403e-06, -1.6111880540847778e-06, -1.5133991837501526e-06, -1.4156103134155273e-06, -1.317821443080902e-06, -1.2200325727462769e-06, -1.1222437024116516e-06, -1.0244548320770264e-06, -9.266659617424011e-07, -8.288770914077759e-07, -7.310882210731506e-07, -6.332993507385254e-07, -5.355104804039001e-07, -4.377216100692749e-07, -3.3993273973464966e-07, -2.421438694000244e-07, -1.4435499906539917e-07, -4.6566128730773926e-08, 5.122274160385132e-08, 1.4901161193847656e-07, 2.468004822731018e-07, 3.4458935260772705e-07, 4.423782229423523e-07, 5.401670932769775e-07, 6.379559636116028e-07, 7.35744833946228e-07, 8.335337042808533e-07, 9.313225746154785e-07, 1.0291114449501038e-06, 1.126900315284729e-06, 1.2246891856193542e-06, 1.3224780559539795e-06, 1.4202669262886047e-06, 1.51805579662323e-06, 1.6158446669578552e-06, 1.7136335372924805e-06, 1.8114224076271057e-06, 1.909211277961731e-06, 2.007000148296356e-06, 2.1047890186309814e-06, 2.2025778889656067e-06, 2.300366759300232e-06, 2.398155629634857e-06, 2.4959444999694824e-06, 2.5937333703041077e-06, 2.691522240638733e-06, 2.789311110973358e-06, 2.8870999813079834e-06, 2.9848888516426086e-06, 3.082677721977234e-06, 3.180466592311859e-06, 3.2782554626464844e-06]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.0, 0.0, 0.0, 0.0, 0.0, 0.0, 211.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 300.0, 0.0, 0.0, 0.0, 0.0, 0.0, 198.0, 0.0, 0.0, 0.0, 0.0, 0.0, 119.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.980232238769531e-07, -2.8870999813079834e-07, -2.7939677238464355e-07, -2.7008354663848877e-07, -2.60770320892334e-07, -2.514570951461792e-07, -2.421438694000244e-07, -2.3283064365386963e-07, -2.2351741790771484e-07, -2.1420419216156006e-07, -2.0489096641540527e-07, -1.955777406692505e-07, -1.862645149230957e-07, -1.7695128917694092e-07, -1.6763806343078613e-07, -1.5832483768463135e-07, -1.4901161193847656e-07, -1.3969838619232178e-07, -1.30385160446167e-07, -1.210719347000122e-07, -1.1175870895385742e-07, -1.0244548320770264e-07, -9.313225746154785e-08, -8.381903171539307e-08, -7.450580596923828e-08, -6.51925802230835e-08, -5.587935447692871e-08, -4.6566128730773926e-08, -3.725290298461914e-08, -2.7939677238464355e-08, -1.862645149230957e-08, -9.313225746154785e-09, 0.0, 9.313225746154785e-09, 1.862645149230957e-08, 2.7939677238464355e-08, 3.725290298461914e-08, 4.6566128730773926e-08, 5.587935447692871e-08, 6.51925802230835e-08, 7.450580596923828e-08, 8.381903171539307e-08, 9.313225746154785e-08, 1.0244548320770264e-07, 1.1175870895385742e-07, 1.210719347000122e-07, 1.30385160446167e-07, 1.3969838619232178e-07, 1.4901161193847656e-07, 1.5832483768463135e-07, 1.6763806343078613e-07, 1.7695128917694092e-07, 1.862645149230957e-07, 1.955777406692505e-07, 2.0489096641540527e-07, 2.1420419216156006e-07, 2.2351741790771484e-07, 2.3283064365386963e-07, 2.421438694000244e-07, 2.514570951461792e-07, 2.60770320892334e-07, 2.7008354663848877e-07, 2.7939677238464355e-07, 2.8870999813079834e-07, 2.980232238769531e-07]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 0.0, 1.0, 7.0, 3.0, 8.0, 22.0, 33.0, 77.0, 196.0, 501.0, 1232.0, 3497.0, 12548.0, 911398.0, 106235.0, 8643.0, 2531.0, 954.0, 354.0, 164.0, 70.0, 33.0, 9.0, 14.0, 1.0, 5.0, 0.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.258487701416016e-06, -6.016343832015991e-06, -5.774199962615967e-06, -5.532056093215942e-06, -5.289912223815918e-06, -5.0477683544158936e-06, -4.805624485015869e-06, -4.563480615615845e-06, -4.32133674621582e-06, -4.079192876815796e-06, -3.8370490074157715e-06, -3.594905138015747e-06, -3.3527612686157227e-06, -3.1106173992156982e-06, -2.868473529815674e-06, -2.6263296604156494e-06, -2.384185791015625e-06, -2.1420419216156006e-06, -1.8998980522155762e-06, -1.6577541828155518e-06, -1.4156103134155273e-06, -1.173466444015503e-06, -9.313225746154785e-07, -6.891787052154541e-07, -4.470348358154297e-07, -2.0489096641540527e-07, 3.725290298461914e-08, 2.7939677238464355e-07, 5.21540641784668e-07, 7.636845111846924e-07, 1.0058283805847168e-06, 1.2479722499847412e-06, 1.4901161193847656e-06, 1.73225998878479e-06, 1.9744038581848145e-06, 2.216547727584839e-06, 2.4586915969848633e-06, 2.7008354663848877e-06, 2.942979335784912e-06, 3.1851232051849365e-06, 3.427267074584961e-06, 3.6694109439849854e-06, 3.91155481338501e-06, 4.153698682785034e-06, 4.395842552185059e-06, 4.637986421585083e-06, 4.880130290985107e-06, 5.122274160385132e-06, 5.364418029785156e-06, 5.606561899185181e-06, 5.848705768585205e-06, 6.0908496379852295e-06, 6.332993507385254e-06, 6.575137376785278e-06, 6.817281246185303e-06, 7.059425115585327e-06, 7.3015689849853516e-06, 7.543712854385376e-06, 7.7858567237854e-06, 8.028000593185425e-06, 8.27014446258545e-06, 8.512288331985474e-06, 8.754432201385498e-06, 8.996576070785522e-06, 9.238719940185547e-06]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 0.0, 5.0, 0.0, 0.0, 2.0, 0.0, 11.0, 0.0, 9.0, 0.0, 40.0, 0.0, 110.0, 0.0, 637.0, 0.0, 93.0, 0.0, 0.0, 43.0, 0.0, 15.0, 0.0, 10.0, 0.0, 8.0, 0.0, 5.0, 0.0, 4.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.748603820800781e-07, -7.469207048416138e-07, -7.189810276031494e-07, -6.910413503646851e-07, -6.631016731262207e-07, -6.351619958877563e-07, -6.07222318649292e-07, -5.792826414108276e-07, -5.513429641723633e-07, -5.234032869338989e-07, -4.954636096954346e-07, -4.675239324569702e-07, -4.3958425521850586e-07, -4.116445779800415e-07, -3.8370490074157715e-07, -3.557652235031128e-07, -3.2782554626464844e-07, -2.998858690261841e-07, -2.7194619178771973e-07, -2.4400651454925537e-07, -2.1606683731079102e-07, -1.8812716007232666e-07, -1.601874828338623e-07, -1.3224780559539795e-07, -1.043081283569336e-07, -7.636845111846924e-08, -4.842877388000488e-08, -2.0489096641540527e-08, 7.450580596923828e-09, 3.5390257835388184e-08, 6.332993507385254e-08, 9.12696123123169e-08, 1.1920928955078125e-07, 1.471489667892456e-07, 1.7508864402770996e-07, 2.0302832126617432e-07, 2.3096799850463867e-07, 2.5890767574310303e-07, 2.868473529815674e-07, 3.1478703022003174e-07, 3.427267074584961e-07, 3.7066638469696045e-07, 3.986060619354248e-07, 4.2654573917388916e-07, 4.544854164123535e-07, 4.824250936508179e-07, 5.103647708892822e-07, 5.383044481277466e-07, 5.662441253662109e-07, 5.941838026046753e-07, 6.221234798431396e-07, 6.50063157081604e-07, 6.780028343200684e-07, 7.059425115585327e-07, 7.338821887969971e-07, 7.618218660354614e-07, 7.897615432739258e-07, 8.177012205123901e-07, 8.456408977508545e-07, 8.735805749893188e-07, 9.015202522277832e-07, 9.294599294662476e-07, 9.57399606704712e-07, 9.853392839431763e-07, 1.0132789611816406e-06]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 9.0, 80.0, 837.0, 87.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024290654982905835, -0.00021080153237562627, -0.00017869651492219418, -0.0001465914974687621, -0.00011448648001533002, -8.238146256189793e-05, -5.027644510846585e-05, -1.8171427655033767e-05, 1.3933589798398316e-05, 4.60386072518304e-05, 7.814362470526248e-05, 0.00011024864215869457, 0.00014235365961212665, 0.00017445867706555873, 0.00020656369451899081, 0.0002386687119724229, 0.00027077371487393975, 0.00030287873232737184, 0.0003349837497808039, 0.000367088767234236, 0.0003991937846876681, 0.00043129880214110017, 0.00046340381959453225, 0.0004955088370479643, 0.0005276138545013964, 0.0005597188719548285, 0.0005918238894082606, 0.0006239289068616927, 0.0006560339243151248, 0.0006881389417685568, 0.0007202439592219889, 0.000752348976675421, 0.0007844539359211922, 0.0008165589533746243, 0.0008486639708280563, 0.0008807689882814884, 0.0009128740057349205, 0.0009449790231883526, 0.0009770840406417847, 0.0010091890580952168, 0.0010412940755486488, 0.001073399093002081, 0.001105504110455513, 0.001137609127908945, 0.0011697141453623772, 0.0012018191628158092, 0.0012339241802692413, 0.0012660291977226734, 0.0012981342151761055, 0.0013302392326295376, 0.0013623442500829697, 0.0013944492675364017, 0.0014265542849898338, 0.001458659302443266, 0.001490764319896698, 0.00152286933735013, 0.0015549743548035622, 0.0015870793722569942, 0.0016191843897104263, 0.0016512894071638584, 0.0016833944246172905, 0.0017154994420707226, 0.0017476044595241547, 0.0017797094769775867, 0.0018118144944310188]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 17.0, 23.0, 34.0, 32.0, 53.0, 87.0, 81.0, 97.0, 109.0, 85.0, 95.0, 78.0, 65.0, 46.0, 37.0, 25.0, 17.0, 12.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.487415859941393e-05, -7.089783321134746e-05, -6.692150782328099e-05, -6.294518243521452e-05, -5.896885340916924e-05, -5.499252802110277e-05, -5.1016198995057493e-05, -4.703987360699102e-05, -4.306354821892455e-05, -3.908722283085808e-05, -3.511089744279161e-05, -3.113456841674633e-05, -2.7158243028679863e-05, -2.3181917640613392e-05, -1.9205590433557518e-05, -1.5229263226501644e-05, -1.1252937838435173e-05, -7.276611540874001e-06, -3.3002852433128282e-06, 6.760410542483442e-07, 4.6523673518095165e-06, 8.628692739875987e-06, 1.2605019946931861e-05, 1.6581347153987736e-05, 2.0557672542054206e-05, 2.4533997930120677e-05, 2.851032513717655e-05, 3.2486652344232425e-05, 3.6462977732298896e-05, 4.0439303120365366e-05, 4.4415632146410644e-05, 4.8391957534477115e-05, 5.2368282922543585e-05, 5.6344608310610056e-05, 6.0320933698676527e-05, 6.4297259086743e-05, 6.827358447480947e-05, 7.224990986287594e-05, 7.622624252690002e-05, 8.02025679149665e-05, 8.417889330303296e-05, 8.815521869109944e-05, 9.21315440791659e-05, 9.610786946723238e-05, 0.00010008420213125646, 0.00010406052751932293, 0.0001080368529073894, 0.00011201317829545587, 0.00011598950368352234, 0.00011996582907158881, 0.00012394215445965528, 0.00012791847984772176, 0.00013189480523578823, 0.0001358711306238547, 0.00013984745601192117, 0.00014382379595190287, 0.0001478001067880541, 0.00015177643217612058, 0.00015575275756418705, 0.00015972908295225352, 0.00016370540834032, 0.00016768173372838646, 0.00017165805911645293, 0.00017563439905643463, 0.0001796107244445011]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 15.0, 16.0, 8.0, 31.0, 37.0, 61.0, 94.0, 176.0, 281.0, 546.0, 963.0, 1884.0, 3509.0, 6679.0, 13690.0, 29297.0, 69126.0, 250514.0, 521882.0, 83255.0, 34306.0, 15967.0, 7606.0, 3926.0, 2161.0, 1112.0, 612.0, 296.0, 199.0, 99.0, 69.0, 33.0, 25.0, 18.0, 17.0, 9.0, 4.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.00010323524475097656, -0.00010020751506090164, -9.717978537082672e-05, -9.41520556807518e-05, -9.112432599067688e-05, -8.809659630060196e-05, -8.506886661052704e-05, -8.204113692045212e-05, -7.90134072303772e-05, -7.598567754030228e-05, -7.295794785022736e-05, -6.993021816015244e-05, -6.690248847007751e-05, -6.38747587800026e-05, -6.084702908992767e-05, -5.781929939985275e-05, -5.479156970977783e-05, -5.176384001970291e-05, -4.873611032962799e-05, -4.570838063955307e-05, -4.268065094947815e-05, -3.965292125940323e-05, -3.662519156932831e-05, -3.359746187925339e-05, -3.056973218917847e-05, -2.7542002499103546e-05, -2.4514272809028625e-05, -2.1486543118953705e-05, -1.8458813428878784e-05, -1.5431083738803864e-05, -1.2403354048728943e-05, -9.375624358654022e-06, -6.3478946685791016e-06, -3.320164978504181e-06, -2.9243528842926025e-07, 2.7352944016456604e-06, 5.763024091720581e-06, 8.790753781795502e-06, 1.1818483471870422e-05, 1.4846213161945343e-05, 1.7873942852020264e-05, 2.0901672542095184e-05, 2.3929402232170105e-05, 2.6957131922245026e-05, 2.9984861612319946e-05, 3.301259130239487e-05, 3.604032099246979e-05, 3.906805068254471e-05, 4.209578037261963e-05, 4.512351006269455e-05, 4.815123975276947e-05, 5.117896944284439e-05, 5.420669913291931e-05, 5.723442882299423e-05, 6.026215851306915e-05, 6.328988820314407e-05, 6.6317617893219e-05, 6.934534758329391e-05, 7.237307727336884e-05, 7.540080696344376e-05, 7.842853665351868e-05, 8.14562663435936e-05, 8.448399603366852e-05, 8.751172572374344e-05, 9.053945541381836e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 8.0, 6.0, 8.0, 11.0, 12.0, 10.0, 12.0, 15.0, 18.0, 26.0, 21.0, 32.0, 35.0, 35.0, 33.0, 31.0, 32.0, 56.0, 58.0, 70.0, 57.0, 42.0, 35.0, 34.0, 39.0, 28.0, 25.0, 32.0, 29.0, 18.0, 18.0, 19.0, 11.0, 14.0, 18.0, 6.0, 15.0, 10.0, 7.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0002491474151611328, -0.00024078786373138428, -0.00023242831230163574, -0.0002240687608718872, -0.00021570920944213867, -0.00020734965801239014, -0.0001989901065826416, -0.00019063055515289307, -0.00018227100372314453, -0.000173911452293396, -0.00016555190086364746, -0.00015719234943389893, -0.0001488327980041504, -0.00014047324657440186, -0.00013211369514465332, -0.00012375414371490479, -0.00011539459228515625, -0.00010703504085540771, -9.867548942565918e-05, -9.031593799591064e-05, -8.195638656616211e-05, -7.359683513641357e-05, -6.523728370666504e-05, -5.6877732276916504e-05, -4.851818084716797e-05, -4.0158629417419434e-05, -3.17990779876709e-05, -2.3439526557922363e-05, -1.5079975128173828e-05, -6.720423698425293e-06, 1.6391277313232422e-06, 9.998679161071777e-06, 1.8358230590820312e-05, 2.6717782020568848e-05, 3.507733345031738e-05, 4.343688488006592e-05, 5.179643630981445e-05, 6.015598773956299e-05, 6.851553916931152e-05, 7.687509059906006e-05, 8.52346420288086e-05, 9.359419345855713e-05, 0.00010195374488830566, 0.0001103132963180542, 0.00011867284774780273, 0.00012703239917755127, 0.0001353919506072998, 0.00014375150203704834, 0.00015211105346679688, 0.0001604706048965454, 0.00016883015632629395, 0.00017718970775604248, 0.00018554925918579102, 0.00019390881061553955, 0.00020226836204528809, 0.00021062791347503662, 0.00021898746490478516, 0.0002273470163345337, 0.00023570656776428223, 0.00024406611919403076, 0.0002524256706237793, 0.00026078522205352783, 0.00026914477348327637, 0.0002775043249130249, 0.00028586387634277344]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 2.0, 8.0, 14.0, 12.0, 18.0, 26.0, 21.0, 43.0, 38.0, 36.0, 92.0, 302.0, 32405.0, 1014586.0, 555.0, 118.0, 48.0, 45.0, 36.0, 37.0, 28.0, 17.0, 18.0, 12.0, 8.0, 4.0, 4.0, 2.0, 9.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0011873245239257812, -0.001152530312538147, -0.0011177361011505127, -0.0010829418897628784, -0.0010481476783752441, -0.0010133534669876099, -0.0009785592555999756, -0.0009437650442123413, -0.000908970832824707, -0.0008741766214370728, -0.0008393824100494385, -0.0008045881986618042, -0.0007697939872741699, -0.0007349997758865356, -0.0007002055644989014, -0.0006654113531112671, -0.0006306171417236328, -0.0005958229303359985, -0.0005610287189483643, -0.00052623450756073, -0.0004914402961730957, -0.0004566460847854614, -0.00042185187339782715, -0.00038705766201019287, -0.0003522634506225586, -0.0003174692392349243, -0.00028267502784729004, -0.00024788081645965576, -0.00021308660507202148, -0.0001782923936843872, -0.00014349818229675293, -0.00010870397090911865, -7.390975952148438e-05, -3.91155481338501e-05, -4.32133674621582e-06, 3.0472874641418457e-05, 6.526708602905273e-05, 0.00010006129741668701, 0.0001348555088043213, 0.00016964972019195557, 0.00020444393157958984, 0.00023923814296722412, 0.0002740323543548584, 0.0003088265657424927, 0.00034362077713012695, 0.00037841498851776123, 0.0004132091999053955, 0.0004480034112930298, 0.00048279762268066406, 0.0005175918340682983, 0.0005523860454559326, 0.0005871802568435669, 0.0006219744682312012, 0.0006567686796188354, 0.0006915628910064697, 0.000726357102394104, 0.0007611513137817383, 0.0007959455251693726, 0.0008307397365570068, 0.0008655339479446411, 0.0009003281593322754, 0.0009351223707199097, 0.0009699165821075439, 0.0010047107934951782, 0.0010395050048828125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 2.0, 8.0, 14.0, 11.0, 18.0, 26.0, 19.0, 45.0, 35.0, 34.0, 48.0, 60.0, 126.0, 163.0, 62.0, 59.0, 44.0, 41.0, 37.0, 37.0, 27.0, 19.0, 16.0, 13.0, 9.0, 4.0, 4.0, 2.0, 9.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0006346702575683594, -0.0006160959601402283, -0.0005975216627120972, -0.0005789473652839661, -0.000560373067855835, -0.0005417987704277039, -0.0005232244729995728, -0.0005046501755714417, -0.00048607587814331055, -0.00046750158071517944, -0.00044892728328704834, -0.00043035298585891724, -0.00041177868843078613, -0.00039320439100265503, -0.0003746300935745239, -0.0003560557961463928, -0.0003374814987182617, -0.0003189072012901306, -0.0003003329038619995, -0.0002817586064338684, -0.0002631843090057373, -0.0002446100115776062, -0.0002260357141494751, -0.000207461416721344, -0.0001888871192932129, -0.0001703128218650818, -0.00015173852443695068, -0.00013316422700881958, -0.00011458992958068848, -9.601563215255737e-05, -7.744133472442627e-05, -5.8867037296295166e-05, -4.029273986816406e-05, -2.171844244003296e-05, -3.1441450119018555e-06, 1.5430152416229248e-05, 3.400444984436035e-05, 5.2578747272491455e-05, 7.115304470062256e-05, 8.972734212875366e-05, 0.00010830163955688477, 0.00012687593698501587, 0.00014545023441314697, 0.00016402453184127808, 0.00018259882926940918, 0.00020117312669754028, 0.0002197474241256714, 0.0002383217215538025, 0.0002568960189819336, 0.0002754703164100647, 0.0002940446138381958, 0.0003126189112663269, 0.000331193208694458, 0.0003497675061225891, 0.0003683418035507202, 0.0003869161009788513, 0.0004054903984069824, 0.0004240646958351135, 0.00044263899326324463, 0.00046121329069137573, 0.00047978758811950684, 0.0004983618855476379, 0.000516936182975769, 0.0005355104804039001, 0.0005540847778320312]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 0.0, 4.0, 4.0, 4.0, 0.0, 5.0, 26.0, 31.0, 0.0, 113.0, 186.0, 580.0, 0.0, 1421.0, 5551.0, 38894.0, 0.0, 954603.0, 39118.0, 5595.0, 0.0, 1486.0, 558.0, 202.0, 0.0, 102.0, 31.0, 20.0, 0.0, 11.0, 9.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.430511474609375e-06, -1.385807991027832e-06, -1.341104507446289e-06, -1.296401023864746e-06, -1.2516975402832031e-06, -1.2069940567016602e-06, -1.1622905731201172e-06, -1.1175870895385742e-06, -1.0728836059570312e-06, -1.0281801223754883e-06, -9.834766387939453e-07, -9.387731552124023e-07, -8.940696716308594e-07, -8.493661880493164e-07, -8.046627044677734e-07, -7.599592208862305e-07, -7.152557373046875e-07, -6.705522537231445e-07, -6.258487701416016e-07, -5.811452865600586e-07, -5.364418029785156e-07, -4.917383193969727e-07, -4.470348358154297e-07, -4.023313522338867e-07, -3.5762786865234375e-07, -3.129243850708008e-07, -2.682209014892578e-07, -2.2351741790771484e-07, -1.7881393432617188e-07, -1.341104507446289e-07, -8.940696716308594e-08, -4.470348358154297e-08, 0.0, 4.470348358154297e-08, 8.940696716308594e-08, 1.341104507446289e-07, 1.7881393432617188e-07, 2.2351741790771484e-07, 2.682209014892578e-07, 3.129243850708008e-07, 3.5762786865234375e-07, 4.023313522338867e-07, 4.470348358154297e-07, 4.917383193969727e-07, 5.364418029785156e-07, 5.811452865600586e-07, 6.258487701416016e-07, 6.705522537231445e-07, 7.152557373046875e-07, 7.599592208862305e-07, 8.046627044677734e-07, 8.493661880493164e-07, 8.940696716308594e-07, 9.387731552124023e-07, 9.834766387939453e-07, 1.0281801223754883e-06, 1.0728836059570312e-06, 1.1175870895385742e-06, 1.1622905731201172e-06, 1.2069940567016602e-06, 1.2516975402832031e-06, 1.296401023864746e-06, 1.341104507446289e-06, 1.385807991027832e-06, 1.430511474609375e-06]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [86.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 863.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 6.0, 0.0, 4.0, 9.0, 0.0, 17.0, 0.0, 21.0, 52.0, 0.0, 98.0, 195.0, 0.0, 399.0, 905.0, 0.0, 2508.0, 8647.0, 0.0, 45198.0, 0.0, 933058.0, 44671.0, 0.0, 8614.0, 2439.0, 0.0, 924.0, 393.0, 0.0, 200.0, 0.0, 105.0, 50.0, 0.0, 24.0, 14.0, 0.0, 5.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0728836059570312e-06, -1.0346993803977966e-06, -9.96515154838562e-07, -9.583309292793274e-07, -9.201467037200928e-07, -8.819624781608582e-07, -8.437782526016235e-07, -8.055940270423889e-07, -7.674098014831543e-07, -7.292255759239197e-07, -6.910413503646851e-07, -6.528571248054504e-07, -6.146728992462158e-07, -5.764886736869812e-07, -5.383044481277466e-07, -5.00120222568512e-07, -4.6193599700927734e-07, -4.237517714500427e-07, -3.855675458908081e-07, -3.473833203315735e-07, -3.0919909477233887e-07, -2.7101486921310425e-07, -2.3283064365386963e-07, -1.94646418094635e-07, -1.564621925354004e-07, -1.1827796697616577e-07, -8.009374141693115e-08, -4.190951585769653e-08, -3.725290298461914e-09, 3.4458935260772705e-08, 7.264316082000732e-08, 1.1082738637924194e-07, 1.4901161193847656e-07, 1.8719583749771118e-07, 2.253800630569458e-07, 2.635642886161804e-07, 3.0174851417541504e-07, 3.3993273973464966e-07, 3.781169652938843e-07, 4.163011908531189e-07, 4.544854164123535e-07, 4.926696419715881e-07, 5.308538675308228e-07, 5.690380930900574e-07, 6.07222318649292e-07, 6.454065442085266e-07, 6.835907697677612e-07, 7.217749953269958e-07, 7.599592208862305e-07, 7.981434464454651e-07, 8.363276720046997e-07, 8.745118975639343e-07, 9.126961231231689e-07, 9.508803486824036e-07, 9.890645742416382e-07, 1.0272487998008728e-06, 1.0654330253601074e-06, 1.103617250919342e-06, 1.1418014764785767e-06, 1.1799857020378113e-06, 1.218169927597046e-06, 1.2563541531562805e-06, 1.2945383787155151e-06, 1.3327226042747498e-06, 1.3709068298339844e-06]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 10.0, 0.0, 0.0, 17.0, 0.0, 0.0, 44.0, 0.0, 0.0, 68.0, 0.0, 0.0, 729.0, 0.0, 0.0, 87.0, 0.0, 0.0, 30.0, 0.0, 0.0, 14.0, 0.0, 0.0, 7.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.364418029785156e-07, -5.168840289115906e-07, -4.973262548446655e-07, -4.777684807777405e-07, -4.5821070671081543e-07, -4.386529326438904e-07, -4.1909515857696533e-07, -3.995373845100403e-07, -3.7997961044311523e-07, -3.604218363761902e-07, -3.4086406230926514e-07, -3.213062882423401e-07, -3.0174851417541504e-07, -2.8219074010849e-07, -2.6263296604156494e-07, -2.430751919746399e-07, -2.2351741790771484e-07, -2.039596438407898e-07, -1.8440186977386475e-07, -1.648440957069397e-07, -1.4528632164001465e-07, -1.257285475730896e-07, -1.0617077350616455e-07, -8.66129994392395e-08, -6.705522537231445e-08, -4.7497451305389404e-08, -2.7939677238464355e-08, -8.381903171539307e-09, 1.1175870895385742e-08, 3.073364496231079e-08, 5.029141902923584e-08, 6.984919309616089e-08, 8.940696716308594e-08, 1.0896474123001099e-07, 1.2852251529693604e-07, 1.4808028936386108e-07, 1.6763806343078613e-07, 1.8719583749771118e-07, 2.0675361156463623e-07, 2.2631138563156128e-07, 2.4586915969848633e-07, 2.654269337654114e-07, 2.849847078323364e-07, 3.045424818992615e-07, 3.241002559661865e-07, 3.4365803003311157e-07, 3.632158041000366e-07, 3.8277357816696167e-07, 4.023313522338867e-07, 4.2188912630081177e-07, 4.414469003677368e-07, 4.6100467443466187e-07, 4.805624485015869e-07, 5.00120222568512e-07, 5.19677996635437e-07, 5.392357707023621e-07, 5.587935447692871e-07, 5.783513188362122e-07, 5.979090929031372e-07, 6.174668669700623e-07, 6.370246410369873e-07, 6.565824151039124e-07, 6.761401891708374e-07, 6.956979632377625e-07, 7.152557373046875e-07]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1020.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006957369623705745, -0.0004026503302156925, -0.00010956369806081057, 0.0001835229340940714, 0.00047660956624895334, 0.0007696961984038353, 0.0010627828305587173, 0.0013558693462982774, 0.0016489560948684812, 0.0019420427270233631, 0.002235129475593567, 0.002528215991333127, 0.002821302507072687, 0.003114389255642891, 0.0034074760042130947, 0.003700562287122011, 0.003993649035692215, 0.004286735784262419, 0.0045798225328326225, 0.004872908815741539, 0.005165995564311743, 0.0054590823128819466, 0.005752168595790863, 0.006045255344361067, 0.006338342092931271, 0.006631428841501474, 0.006924515590071678, 0.007217601872980595, 0.007510688621550798, 0.007803775370121002, 0.008096861653029919, 0.008389947935938835, 0.008683035150170326, 0.008976121433079243, 0.009269208647310734, 0.00956229493021965, 0.009855382144451141, 0.010148468427360058, 0.010441554710268974, 0.010734641924500465, 0.011027728207409382, 0.011320814490318298, 0.01161390170454979, 0.011906987987458706, 0.012200074270367622, 0.012493161484599113, 0.01278624776750803, 0.013079334050416946, 0.013372421264648438, 0.013665507547557354, 0.013958594761788845, 0.014251681044697762, 0.014544768258929253, 0.014837854541838169, 0.015130940824747086, 0.015424028038978577, 0.015717115253210068, 0.01601020246744156, 0.0163032878190279, 0.016596375033259392, 0.016889462247490883, 0.017182547599077225, 0.017475634813308716, 0.017768722027540207, 0.01806180737912655]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 3.0, 3.0, 6.0, 9.0, 5.0, 11.0, 10.0, 13.0, 16.0, 16.0, 23.0, 23.0, 31.0, 31.0, 32.0, 36.0, 42.0, 43.0, 39.0, 48.0, 46.0, 43.0, 36.0, 39.0, 34.0, 45.0, 50.0, 33.0, 33.0, 32.0, 28.0, 27.0, 16.0, 24.0, 18.0, 5.0, 6.0, 9.0, 4.0, 8.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006542268092744052, -0.0006325971917249262, -0.0006109675741754472, -0.0005893379566259682, -0.0005677083390764892, -0.0005460786633193493, -0.0005244490457698703, -0.0005028194282203913, -0.00048118981067091227, -0.00045956019312143326, -0.00043793057557195425, -0.00041630095802247524, -0.0003946713113691658, -0.00037304169381968677, -0.00035141207627020776, -0.0003297824296168983, -0.00030815284117124975, -0.00028652322362177074, -0.00026489360607229173, -0.0002432639739708975, -0.00022163434186950326, -0.00020000472432002425, -0.00017837510677054524, -0.000156745474669151, -0.000135115857119672, -0.00011348623229423538, -9.185660746879876e-05, -7.022698991931975e-05, -4.859736509388313e-05, -2.6967740268446505e-05, -5.338122718967497e-06, 1.629150938242674e-05, 3.7921126931905746e-05, 5.955075175734237e-05, 8.118037658277899e-05, 0.000102809994132258, 0.00012443962623365223, 0.00014606924378313124, 0.00016769886133261025, 0.00018932849343400449, 0.0002109581109834835, 0.0002325877285329625, 0.00025421736063435674, 0.00027584697818383574, 0.00029747659573331475, 0.00031910621328279376, 0.00034073583083227277, 0.00036236547748558223, 0.00038399509503506124, 0.00040562471258454025, 0.00042725433013401926, 0.0004488839767873287, 0.00047051359433680773, 0.0004921432118862867, 0.0005137728294357657, 0.0005354024469852448, 0.0005570320645347238, 0.0005786616820842028, 0.0006002912996336818, 0.0006219209171831608, 0.0006435505347326398, 0.0006651801522821188, 0.0006868097698315978, 0.0007084394455887377, 0.0007300690631382167]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 4.0, 7.0, 9.0, 15.0, 16.0, 17.0, 17.0, 19.0, 31.0, 30.0, 29.0, 39.0, 45.0, 71.0, 179.0, 759.0, 4180749.0, 11456.0, 309.0, 102.0, 70.0, 51.0, 47.0, 22.0, 24.0, 28.0, 24.0, 18.0, 24.0, 11.0, 7.0, 4.0, 10.0, 5.0, 5.0, 4.0, 6.0, 4.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0006632804870605469, -0.0006430372595787048, -0.0006227940320968628, -0.0006025508046150208, -0.0005823075771331787, -0.0005620643496513367, -0.0005418211221694946, -0.0005215778946876526, -0.0005013346672058105, -0.0004810914397239685, -0.00046084821224212646, -0.0004406049847602844, -0.0004203617572784424, -0.00040011852979660034, -0.0003798753023147583, -0.00035963207483291626, -0.0003393888473510742, -0.0003191456198692322, -0.00029890239238739014, -0.0002786591649055481, -0.00025841593742370605, -0.00023817270994186401, -0.00021792948246002197, -0.00019768625497817993, -0.0001774430274963379, -0.00015719980001449585, -0.0001369565725326538, -0.00011671334505081177, -9.647011756896973e-05, -7.622689008712769e-05, -5.5983662605285645e-05, -3.5740435123443604e-05, -1.5497207641601562e-05, 4.7460198402404785e-06, 2.498924732208252e-05, 4.523247480392456e-05, 6.54757022857666e-05, 8.571892976760864e-05, 0.00010596215724945068, 0.00012620538473129272, 0.00014644861221313477, 0.0001666918396949768, 0.00018693506717681885, 0.0002071782946586609, 0.00022742152214050293, 0.00024766474962234497, 0.000267907977104187, 0.00028815120458602905, 0.0003083944320678711, 0.00032863765954971313, 0.0003488808870315552, 0.0003691241145133972, 0.00038936734199523926, 0.0004096105694770813, 0.00042985379695892334, 0.0004500970244407654, 0.0004703402519226074, 0.0004905834794044495, 0.0005108267068862915, 0.0005310699343681335, 0.0005513131618499756, 0.0005715563893318176, 0.0005917996168136597, 0.0006120428442955017, 0.0006322860717773438]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 2.0, 4.0, 9.0, 13.0, 16.0, 14.0, 19.0, 23.0, 30.0, 37.0, 35.0, 40.0, 50.0, 47.0, 42.0, 89.0, 62.0, 45.0, 52.0, 50.0, 51.0, 47.0, 40.0, 40.0, 35.0, 29.0, 19.0, 18.0, 10.0, 11.0, 12.0, 0.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.59634780883789e-06, -9.219162166118622e-06, -8.841976523399353e-06, -8.464790880680084e-06, -8.087605237960815e-06, -7.710419595241547e-06, -7.333233952522278e-06, -6.956048309803009e-06, -6.57886266708374e-06, -6.2016770243644714e-06, -5.824491381645203e-06, -5.447305738925934e-06, -5.070120096206665e-06, -4.692934453487396e-06, -4.3157488107681274e-06, -3.938563168048859e-06, -3.56137752532959e-06, -3.184191882610321e-06, -2.8070062398910522e-06, -2.4298205971717834e-06, -2.0526349544525146e-06, -1.6754493117332458e-06, -1.298263669013977e-06, -9.210780262947083e-07, -5.438923835754395e-07, -1.6670674085617065e-07, 2.1047890186309814e-07, 5.876645445823669e-07, 9.648501873016357e-07, 1.3420358300209045e-06, 1.7192214727401733e-06, 2.096407115459442e-06, 2.473592758178711e-06, 2.8507784008979797e-06, 3.2279640436172485e-06, 3.6051496863365173e-06, 3.982335329055786e-06, 4.359520971775055e-06, 4.736706614494324e-06, 5.1138922572135925e-06, 5.491077899932861e-06, 5.86826354265213e-06, 6.245449185371399e-06, 6.622634828090668e-06, 6.9998204708099365e-06, 7.377006113529205e-06, 7.754191756248474e-06, 8.131377398967743e-06, 8.508563041687012e-06, 8.88574868440628e-06, 9.26293432712555e-06, 9.640119969844818e-06, 1.0017305612564087e-05, 1.0394491255283356e-05, 1.0771676898002625e-05, 1.1148862540721893e-05, 1.1526048183441162e-05, 1.1903233826160431e-05, 1.22804194688797e-05, 1.2657605111598969e-05, 1.3034790754318237e-05, 1.3411976397037506e-05, 1.3789162039756775e-05, 1.4166347682476044e-05, 1.4543533325195312e-05]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 5.0, 9.0, 9.0, 6.0, 10.0, 21.0, 28.0, 60.0, 147.0, 2306.0, 4190598.0, 834.0, 113.0, 51.0, 42.0, 22.0, 9.0, 9.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00030159950256347656, -0.00028060004115104675, -0.00025960057973861694, -0.00023860111832618713, -0.00021760165691375732, -0.00019660219550132751, -0.0001756027340888977, -0.0001546032726764679, -0.00013360381126403809, -0.00011260434985160828, -9.160488843917847e-05, -7.060542702674866e-05, -4.960596561431885e-05, -2.8606504201889038e-05, -7.6070427894592285e-06, 1.3392418622970581e-05, 3.439188003540039e-05, 5.53913414478302e-05, 7.639080286026001e-05, 9.739026427268982e-05, 0.00011838972568511963, 0.00013938918709754944, 0.00016038864850997925, 0.00018138810992240906, 0.00020238757133483887, 0.00022338703274726868, 0.0002443864941596985, 0.0002653859555721283, 0.0002863854169845581, 0.0003073848783969879, 0.0003283843398094177, 0.00034938380122184753, 0.00037038326263427734, 0.00039138272404670715, 0.00041238218545913696, 0.00043338164687156677, 0.0004543811082839966, 0.0004753805696964264, 0.0004963800311088562, 0.000517379492521286, 0.0005383789539337158, 0.0005593784153461456, 0.0005803778767585754, 0.0006013773381710052, 0.0006223767995834351, 0.0006433762609958649, 0.0006643757224082947, 0.0006853751838207245, 0.0007063746452331543, 0.0007273741066455841, 0.0007483735680580139, 0.0007693730294704437, 0.0007903724908828735, 0.0008113719522953033, 0.0008323714137077332, 0.000853370875120163, 0.0008743703365325928, 0.0008953697979450226, 0.0009163692593574524, 0.0009373687207698822, 0.000958368182182312, 0.0009793676435947418, 0.0010003671050071716, 0.0010213665664196014, 0.0010423660278320312]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 8.0, 10.0, 10.0, 15.0, 26.0, 41.0, 72.0, 183.0, 437.0, 2380.0, 603.0, 139.0, 67.0, 38.0, 17.0, 14.0, 10.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.138448715209961e-05, -1.0695308446884155e-05, -1.0006129741668701e-05, -9.316951036453247e-06, -8.627772331237793e-06, -7.938593626022339e-06, -7.249414920806885e-06, -6.560236215591431e-06, -5.8710575103759766e-06, -5.1818788051605225e-06, -4.492700099945068e-06, -3.8035213947296143e-06, -3.11434268951416e-06, -2.425163984298706e-06, -1.735985279083252e-06, -1.0468065738677979e-06, -3.5762786865234375e-07, 3.3155083656311035e-07, 1.0207295417785645e-06, 1.7099082469940186e-06, 2.3990869522094727e-06, 3.0882656574249268e-06, 3.777444362640381e-06, 4.466623067855835e-06, 5.155801773071289e-06, 5.844980478286743e-06, 6.534159183502197e-06, 7.223337888717651e-06, 7.912516593933105e-06, 8.60169529914856e-06, 9.290874004364014e-06, 9.980052709579468e-06, 1.0669231414794922e-05, 1.1358410120010376e-05, 1.204758882522583e-05, 1.2736767530441284e-05, 1.3425946235656738e-05, 1.4115124940872192e-05, 1.4804303646087646e-05, 1.54934823513031e-05, 1.6182661056518555e-05, 1.687183976173401e-05, 1.7561018466949463e-05, 1.8250197172164917e-05, 1.893937587738037e-05, 1.9628554582595825e-05, 2.031773328781128e-05, 2.1006911993026733e-05, 2.1696090698242188e-05, 2.238526940345764e-05, 2.3074448108673096e-05, 2.376362681388855e-05, 2.4452805519104004e-05, 2.5141984224319458e-05, 2.5831162929534912e-05, 2.6520341634750366e-05, 2.720952033996582e-05, 2.7898699045181274e-05, 2.858787775039673e-05, 2.9277056455612183e-05, 2.9966235160827637e-05, 3.065541386604309e-05, 3.1344592571258545e-05, 3.2033771276474e-05, 3.272294998168945e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 16.0, 12.0, 25.0, 32.0, 68.0, 119.0, 200.0, 204.0, 134.0, 82.0, 54.0, 21.0, 20.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.961693725315854e-05, -6.784372817492113e-05, -6.607051909668371e-05, -6.42973100184463e-05, -6.252410094020888e-05, -6.075088822399266e-05, -5.8977679145755246e-05, -5.7204466429539025e-05, -5.543125735130161e-05, -5.3658048273064196e-05, -5.188483919482678e-05, -5.011162647861056e-05, -4.8338417400373146e-05, -4.656520832213573e-05, -4.479199924389832e-05, -4.3018786527682096e-05, -4.124557744944468e-05, -3.947236837120727e-05, -3.769915929296985e-05, -3.592594657675363e-05, -3.415273749851622e-05, -3.23795284202788e-05, -3.060631934204139e-05, -2.883310844481457e-05, -2.705990118556656e-05, -2.5286692107329145e-05, -2.3513481210102327e-05, -2.1740272131864913e-05, -1.9967061234638095e-05, -1.819385215640068e-05, -1.6420643078163266e-05, -1.4647432180936448e-05, -1.287422128370963e-05, -1.1101011295977514e-05, -9.327801308245398e-06, -7.554591775260633e-06, -5.781381787528517e-06, -4.0081722545437515e-06, -2.2349622668116353e-06, -4.617522790795192e-07, 1.311457708652597e-06, 3.084667696384713e-06, 4.857877684116829e-06, 6.6310872171015944e-06, 8.40429675008636e-06, 1.0177506737818476e-05, 1.1950716725550592e-05, 1.3723926713282708e-05, 1.5497136701014824e-05, 1.727034577925224e-05, 1.9043556676479056e-05, 2.081676575471647e-05, 2.258997665194329e-05, 2.4363185730180703e-05, 2.613639662740752e-05, 2.7909605705644935e-05, 2.968281478388235e-05, 3.1456023862119764e-05, 3.322923294035718e-05, 3.50024456565734e-05, 3.6775654734810814e-05, 3.854886381304823e-05, 4.032207289128564e-05, 4.2095285607501864e-05, 4.386849468573928e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 7.0, 12.0, 9.0, 25.0, 23.0, 21.0, 32.0, 44.0, 44.0, 47.0, 56.0, 66.0, 52.0, 48.0, 46.0, 74.0, 58.0, 42.0, 47.0, 47.0, 45.0, 39.0, 31.0, 20.0, 19.0, 9.0, 5.0, 8.0, 10.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.645035056048073e-05, -2.5690462280181237e-05, -2.493057218089234e-05, -2.417068390059285e-05, -2.3410793801303953e-05, -2.265090552100446e-05, -2.1891015421715565e-05, -2.1131127141416073e-05, -2.0371237042127177e-05, -1.9611348761827685e-05, -1.885145866253879e-05, -1.8091570382239297e-05, -1.73316802829504e-05, -1.657179200265091e-05, -1.5811901903362013e-05, -1.5052013623062521e-05, -1.4292124433268327e-05, -1.3532235243474133e-05, -1.277234605367994e-05, -1.2012456863885745e-05, -1.1252567674091551e-05, -1.0492678484297357e-05, -9.732790203997865e-06, -8.97290010470897e-06, -8.213011824409477e-06, -7.4531226346152835e-06, -6.6932334448210895e-06, -5.9333442550268956e-06, -5.173455065232702e-06, -4.413565875438508e-06, -3.6536771403916646e-06, -2.8937879505974706e-06, -2.1338983060559258e-06, -1.3740091162617318e-06, -6.141200401543756e-07, 1.4576903595298063e-07, 9.056582257471746e-07, 1.6655474155413685e-06, 2.425436377961887e-06, 3.185325567756081e-06, 3.945214757550275e-06, 4.705103947344469e-06, 5.464993137138663e-06, 6.224881872185506e-06, 6.9847710619797e-06, 7.744660251773894e-06, 8.504549441568088e-06, 9.264438631362282e-06, 1.0024327821156476e-05, 1.078421701095067e-05, 1.1544106200744864e-05, 1.2303995390539058e-05, 1.3063884580333252e-05, 1.3823773770127445e-05, 1.4583662050426938e-05, 1.5343552149715833e-05, 1.6103440430015326e-05, 1.6863328710314818e-05, 1.7623218809603713e-05, 1.8383107089903206e-05, 1.91429971891921e-05, 1.9902885469491594e-05, 2.066277556878049e-05, 2.142266384907998e-05, 2.2182553948368877e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 1.0, 9.0, 11.0, 21.0, 17.0, 37.0, 77.0, 112.0, 156.0, 334.0, 715.0, 1797.0, 3998.0, 23451.0, 309614.0, 640540.0, 55479.0, 8190.0, 2278.0, 722.0, 444.0, 239.0, 115.0, 71.0, 48.0, 21.0, 26.0, 8.0, 8.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.357929229736328e-06, -9.075738489627838e-06, -8.793547749519348e-06, -8.511357009410858e-06, -8.229166269302368e-06, -7.946975529193878e-06, -7.664784789085388e-06, -7.382594048976898e-06, -7.100403308868408e-06, -6.818212568759918e-06, -6.536021828651428e-06, -6.253831088542938e-06, -5.971640348434448e-06, -5.689449608325958e-06, -5.407258868217468e-06, -5.125068128108978e-06, -4.842877388000488e-06, -4.560686647891998e-06, -4.278495907783508e-06, -3.996305167675018e-06, -3.7141144275665283e-06, -3.4319236874580383e-06, -3.1497329473495483e-06, -2.8675422072410583e-06, -2.5853514671325684e-06, -2.3031607270240784e-06, -2.0209699869155884e-06, -1.7387792468070984e-06, -1.4565885066986084e-06, -1.1743977665901184e-06, -8.922070264816284e-07, -6.100162863731384e-07, -3.2782554626464844e-07, -4.563480615615845e-08, 2.3655593395233154e-07, 5.187466740608215e-07, 8.009374141693115e-07, 1.0831281542778015e-06, 1.3653188943862915e-06, 1.6475096344947815e-06, 1.9297003746032715e-06, 2.2118911147117615e-06, 2.4940818548202515e-06, 2.7762725949287415e-06, 3.0584633350372314e-06, 3.3406540751457214e-06, 3.6228448152542114e-06, 3.905035555362701e-06, 4.187226295471191e-06, 4.469417035579681e-06, 4.751607775688171e-06, 5.033798515796661e-06, 5.315989255905151e-06, 5.598179996013641e-06, 5.880370736122131e-06, 6.162561476230621e-06, 6.444752216339111e-06, 6.726942956447601e-06, 7.009133696556091e-06, 7.291324436664581e-06, 7.573515176773071e-06, 7.855705916881561e-06, 8.137896656990051e-06, 8.420087397098541e-06, 8.702278137207031e-06]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 9.0, 12.0, 15.0, 21.0, 22.0, 36.0, 50.0, 41.0, 77.0, 56.0, 78.0, 81.0, 75.0, 83.0, 63.0, 63.0, 56.0, 38.0, 35.0, 29.0, 23.0, 11.0, 11.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7940998077392578e-05, -1.7248094081878662e-05, -1.6555190086364746e-05, -1.586228609085083e-05, -1.5169382095336914e-05, -1.4476478099822998e-05, -1.3783574104309082e-05, -1.3090670108795166e-05, -1.239776611328125e-05, -1.1704862117767334e-05, -1.1011958122253418e-05, -1.0319054126739502e-05, -9.626150131225586e-06, -8.93324613571167e-06, -8.240342140197754e-06, -7.547438144683838e-06, -6.854534149169922e-06, -6.161630153656006e-06, -5.46872615814209e-06, -4.775822162628174e-06, -4.082918167114258e-06, -3.390014171600342e-06, -2.6971101760864258e-06, -2.0042061805725098e-06, -1.3113021850585938e-06, -6.183981895446777e-07, 7.450580596923828e-08, 7.674098014831543e-07, 1.4603137969970703e-06, 2.1532177925109863e-06, 2.8461217880249023e-06, 3.5390257835388184e-06, 4.231929779052734e-06, 4.92483377456665e-06, 5.617737770080566e-06, 6.310641765594482e-06, 7.0035457611083984e-06, 7.696449756622314e-06, 8.38935375213623e-06, 9.082257747650146e-06, 9.775161743164062e-06, 1.0468065738677979e-05, 1.1160969734191895e-05, 1.185387372970581e-05, 1.2546777725219727e-05, 1.3239681720733643e-05, 1.3932585716247559e-05, 1.4625489711761475e-05, 1.531839370727539e-05, 1.6011297702789307e-05, 1.6704201698303223e-05, 1.739710569381714e-05, 1.8090009689331055e-05, 1.878291368484497e-05, 1.9475817680358887e-05, 2.0168721675872803e-05, 2.086162567138672e-05, 2.1554529666900635e-05, 2.224743366241455e-05, 2.2940337657928467e-05, 2.3633241653442383e-05, 2.43261456489563e-05, 2.5019049644470215e-05, 2.571195363998413e-05, 2.6404857635498047e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 17.0, 12.0, 17.0, 26.0, 33.0, 46.0, 67.0, 96.0, 155.0, 514.0, 525.0, 775.0, 1306.0, 2133.0, 3574.0, 6051.0, 10584.0, 19998.0, 117038.0, 180019.0, 360612.0, 180960.0, 78471.0, 38574.0, 20302.0, 11185.0, 6085.0, 5765.0, 1268.0, 772.0, 513.0, 342.0, 219.0, 162.0, 104.0, 55.0, 89.0, 28.0, 22.0, 14.0, 6.0, 3.0, 7.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.9669532775878906e-06, -1.9008293747901917e-06, -1.8347054719924927e-06, -1.7685815691947937e-06, -1.7024576663970947e-06, -1.6363337635993958e-06, -1.5702098608016968e-06, -1.5040859580039978e-06, -1.4379620552062988e-06, -1.3718381524085999e-06, -1.3057142496109009e-06, -1.239590346813202e-06, -1.173466444015503e-06, -1.107342541217804e-06, -1.041218638420105e-06, -9.75094735622406e-07, -9.08970832824707e-07, -8.428469300270081e-07, -7.767230272293091e-07, -7.105991244316101e-07, -6.444752216339111e-07, -5.783513188362122e-07, -5.122274160385132e-07, -4.461035132408142e-07, -3.7997961044311523e-07, -3.1385570764541626e-07, -2.477318048477173e-07, -1.816079020500183e-07, -1.1548399925231934e-07, -4.936009645462036e-08, 1.6763806343078613e-08, 8.288770914077759e-08, 1.4901161193847656e-07, 2.1513551473617554e-07, 2.812594175338745e-07, 3.473833203315735e-07, 4.1350722312927246e-07, 4.796311259269714e-07, 5.457550287246704e-07, 6.118789315223694e-07, 6.780028343200684e-07, 7.441267371177673e-07, 8.102506399154663e-07, 8.763745427131653e-07, 9.424984455108643e-07, 1.0086223483085632e-06, 1.0747462511062622e-06, 1.1408701539039612e-06, 1.2069940567016602e-06, 1.2731179594993591e-06, 1.339241862297058e-06, 1.405365765094757e-06, 1.471489667892456e-06, 1.537613570690155e-06, 1.603737473487854e-06, 1.669861376285553e-06, 1.735985279083252e-06, 1.802109181880951e-06, 1.86823308467865e-06, 1.934356987476349e-06, 2.000480890274048e-06, 2.066604793071747e-06, 2.132728695869446e-06, 2.1988525986671448e-06, 2.2649765014648438e-06]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 11.0, 1.0, 12.0, 5.0, 9.0, 18.0, 21.0, 27.0, 39.0, 33.0, 29.0, 45.0, 52.0, 56.0, 58.0, 44.0, 59.0, 51.0, 56.0, 56.0, 46.0, 42.0, 31.0, 40.0, 30.0, 24.0, 25.0, 22.0, 13.0, 7.0, 8.0, 6.0, 3.0, 7.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7954578399658203e-05, -2.6806257665157318e-05, -2.5657936930656433e-05, -2.4509616196155548e-05, -2.3361295461654663e-05, -2.2212974727153778e-05, -2.1064653992652893e-05, -1.9916333258152008e-05, -1.8768012523651123e-05, -1.7619691789150238e-05, -1.6471371054649353e-05, -1.5323050320148468e-05, -1.4174729585647583e-05, -1.3026408851146698e-05, -1.1878088116645813e-05, -1.0729767382144928e-05, -9.581446647644043e-06, -8.433125913143158e-06, -7.284805178642273e-06, -6.136484444141388e-06, -4.988163709640503e-06, -3.839842975139618e-06, -2.691522240638733e-06, -1.543201506137848e-06, -3.948807716369629e-07, 7.534399628639221e-07, 1.9017606973648071e-06, 3.050081431865692e-06, 4.198402166366577e-06, 5.346722900867462e-06, 6.495043635368347e-06, 7.643364369869232e-06, 8.791685104370117e-06, 9.940005838871002e-06, 1.1088326573371887e-05, 1.2236647307872772e-05, 1.3384968042373657e-05, 1.4533288776874542e-05, 1.5681609511375427e-05, 1.6829930245876312e-05, 1.7978250980377197e-05, 1.9126571714878082e-05, 2.0274892449378967e-05, 2.1423213183879852e-05, 2.2571533918380737e-05, 2.3719854652881622e-05, 2.4868175387382507e-05, 2.6016496121883392e-05, 2.7164816856384277e-05, 2.8313137590885162e-05, 2.9461458325386047e-05, 3.060977905988693e-05, 3.175809979438782e-05, 3.29064205288887e-05, 3.405474126338959e-05, 3.520306199789047e-05, 3.635138273239136e-05, 3.749970346689224e-05, 3.864802420139313e-05, 3.979634493589401e-05, 4.09446656703949e-05, 4.209298640489578e-05, 4.324130713939667e-05, 4.438962787389755e-05, 4.553794860839844e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 351.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11432.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024629.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11715.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 323.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-2.384185791015625e-07, -2.300366759300232e-07, -2.2165477275848389e-07, -2.1327286958694458e-07, -2.0489096641540527e-07, -1.9650906324386597e-07, -1.8812716007232666e-07, -1.7974525690078735e-07, -1.7136335372924805e-07, -1.6298145055770874e-07, -1.5459954738616943e-07, -1.4621764421463013e-07, -1.3783574104309082e-07, -1.2945383787155151e-07, -1.210719347000122e-07, -1.126900315284729e-07, -1.043081283569336e-07, -9.592622518539429e-08, -8.754432201385498e-08, -7.916241884231567e-08, -7.078051567077637e-08, -6.239861249923706e-08, -5.4016709327697754e-08, -4.563480615615845e-08, -3.725290298461914e-08, -2.8870999813079834e-08, -2.0489096641540527e-08, -1.210719347000122e-08, -3.725290298461914e-09, 4.6566128730773926e-09, 1.30385160446167e-08, 2.1420419216156006e-08, 2.9802322387695312e-08, 3.818422555923462e-08, 4.6566128730773926e-08, 5.494803190231323e-08, 6.332993507385254e-08, 7.171183824539185e-08, 8.009374141693115e-08, 8.847564458847046e-08, 9.685754776000977e-08, 1.0523945093154907e-07, 1.1362135410308838e-07, 1.2200325727462769e-07, 1.30385160446167e-07, 1.387670636177063e-07, 1.471489667892456e-07, 1.555308699607849e-07, 1.6391277313232422e-07, 1.7229467630386353e-07, 1.8067657947540283e-07, 1.8905848264694214e-07, 1.9744038581848145e-07, 2.0582228899002075e-07, 2.1420419216156006e-07, 2.2258609533309937e-07, 2.3096799850463867e-07, 2.39349901676178e-07, 2.477318048477173e-07, 2.561137080192566e-07, 2.644956111907959e-07, 2.728775143623352e-07, 2.812594175338745e-07, 2.896413207054138e-07, 2.980232238769531e-07]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 185.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 457.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 183.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07, 1.862645149230957e-07, 1.9371509552001953e-07, 2.0116567611694336e-07, 2.086162567138672e-07, 2.1606683731079102e-07, 2.2351741790771484e-07, 2.3096799850463867e-07, 2.384185791015625e-07]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [27.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 31.0, 0.0, 0.0, 201.0, 0.0, 0.0, 10835.0, 0.0, 0.0, 0.0, 1026362.0, 0.0, 0.0, 10799.0, 0.0, 0.0, 205.0, 0.0, 0.0, 27.0, 0.0, 0.0, 31.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.0], "bins": [-5.960464477539062e-07, -5.774199962615967e-07, -5.587935447692871e-07, -5.401670932769775e-07, -5.21540641784668e-07, -5.029141902923584e-07, -4.842877388000488e-07, -4.6566128730773926e-07, -4.470348358154297e-07, -4.284083843231201e-07, -4.0978193283081055e-07, -3.91155481338501e-07, -3.725290298461914e-07, -3.5390257835388184e-07, -3.3527612686157227e-07, -3.166496753692627e-07, -2.980232238769531e-07, -2.7939677238464355e-07, -2.60770320892334e-07, -2.421438694000244e-07, -2.2351741790771484e-07, -2.0489096641540527e-07, -1.862645149230957e-07, -1.6763806343078613e-07, -1.4901161193847656e-07, -1.30385160446167e-07, -1.1175870895385742e-07, -9.313225746154785e-08, -7.450580596923828e-08, -5.587935447692871e-08, -3.725290298461914e-08, -1.862645149230957e-08, 0.0, 1.862645149230957e-08, 3.725290298461914e-08, 5.587935447692871e-08, 7.450580596923828e-08, 9.313225746154785e-08, 1.1175870895385742e-07, 1.30385160446167e-07, 1.4901161193847656e-07, 1.6763806343078613e-07, 1.862645149230957e-07, 2.0489096641540527e-07, 2.2351741790771484e-07, 2.421438694000244e-07, 2.60770320892334e-07, 2.7939677238464355e-07, 2.980232238769531e-07, 3.166496753692627e-07, 3.3527612686157227e-07, 3.5390257835388184e-07, 3.725290298461914e-07, 3.91155481338501e-07, 4.0978193283081055e-07, 4.284083843231201e-07, 4.470348358154297e-07, 4.6566128730773926e-07, 4.842877388000488e-07, 5.029141902923584e-07, 5.21540641784668e-07, 5.401670932769775e-07, 5.587935447692871e-07, 5.774199962615967e-07, 5.960464477539062e-07]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [27.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 966.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 18.0, 94.0, 625.0, 230.0, 39.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017511485202703625, -0.00017100990226026624, -0.00016690495249349624, -0.00016280000272672623, -0.00015869505295995623, -0.00015459011774510145, -0.00015048516797833145, -0.00014638021821156144, -0.00014227526844479144, -0.00013817031867802143, -0.00013406536891125143, -0.00012996041914448142, -0.00012585546937771142, -0.00012175052688689902, -0.00011764557712012902, -0.00011354062735335901, -0.00010943567758658901, -0.000105330727819819, -0.000101225778053049, -9.712083556223661e-05, -9.30158857954666e-05, -8.89109360286966e-05, -8.480598626192659e-05, -8.070103649515659e-05, -7.659608672838658e-05, -7.249113696161658e-05, -6.838618719484657e-05, -6.428123742807657e-05, -6.0176294937264174e-05, -5.607134517049417e-05, -5.1966395403724164e-05, -4.786144563695416e-05, -4.375650314614177e-05, -3.965155337937176e-05, -3.5546607250580564e-05, -3.144165748381056e-05, -2.7336709536029957e-05, -2.3231761588249356e-05, -1.912681182147935e-05, -1.5021863873698749e-05, -1.0916915925918147e-05, -6.811967523390194e-06, -2.707019120862242e-06, 1.3979297364130616e-06, 5.502877684193663e-06, 9.607825631974265e-06, 1.371277539874427e-05, 1.7817723346524872e-05, 2.1922671294305474e-05, 2.6027619242086075e-05, 3.0132567189866677e-05, 3.423751695663668e-05, 3.834246308542788e-05, 4.2447412852197886e-05, 4.655236261896789e-05, 5.0657312385737896e-05, 5.4762258514529094e-05, 5.88672082812991e-05, 6.29721544100903e-05, 6.70771041768603e-05, 7.118205394363031e-05, 7.52869964344427e-05, 7.93919462012127e-05, 8.349689596798271e-05, 8.760184573475271e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 9.0, 18.0, 22.0, 25.0, 38.0, 35.0, 58.0, 80.0, 75.0, 80.0, 60.0, 77.0, 78.0, 74.0, 57.0, 53.0, 45.0, 36.0, 29.0, 14.0, 13.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.053537536994554e-05, -1.984487425943371e-05, -1.9154373148921877e-05, -1.846387385739945e-05, -1.7773372746887617e-05, -1.7082871636375785e-05, -1.6392370525863953e-05, -1.570186941535212e-05, -1.5011368304840289e-05, -1.4320867194328457e-05, -1.3630366993311327e-05, -1.2939865882799495e-05, -1.2249364772287663e-05, -1.1558864571270533e-05, -1.0868363460758701e-05, -1.0177862350246869e-05, -9.487362149229739e-06, -8.796861038717907e-06, -8.106360837700777e-06, -7.415859727188945e-06, -6.725358616677113e-06, -6.034857960912632e-06, -5.344357305148151e-06, -4.653856194636319e-06, -3.963355538871838e-06, -3.2728546557336813e-06, -2.5823537725955248e-06, -1.8918531168310437e-06, -1.2013522336928872e-06, -5.108513505547307e-07, 1.796493052097503e-07, 8.701504157215822e-07, 1.5606510714860633e-06, 2.25115195462422e-06, 2.9416528377623763e-06, 3.6321534935268573e-06, 4.322654604038689e-06, 5.01315525980317e-06, 5.703655915567651e-06, 6.394157026079483e-06, 7.084657681843964e-06, 7.775158337608445e-06, 8.465659448120277e-06, 9.156159649137408e-06, 9.84666075964924e-06, 1.0537161870161071e-05, 1.1227662980672903e-05, 1.1918164091184735e-05, 1.2608664292201865e-05, 1.3299165402713697e-05, 1.3989665603730828e-05, 1.468016671424266e-05, 1.537066782475449e-05, 1.6061168935266323e-05, 1.6751670045778155e-05, 1.7442169337300584e-05, 1.8132670447812416e-05, 1.8823171558324248e-05, 1.951367266883608e-05, 2.020417377934791e-05, 2.089467307087034e-05, 2.1585174181382172e-05, 2.2275675291894004e-05, 2.2966176402405836e-05, 2.3656677512917668e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 7.0, 10.0, 9.0, 15.0, 16.0, 21.0, 25.0, 34.0, 53.0, 83.0, 227.0, 539.0, 1728.0, 7634.0, 41137.0, 701925.0, 260283.0, 27532.0, 5080.0, 1361.0, 377.0, 149.0, 95.0, 56.0, 31.0, 24.0, 17.0, 14.0, 13.0, 20.0, 4.0, 9.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.832578659057617e-05, -3.722682595252991e-05, -3.612786531448364e-05, -3.502890467643738e-05, -3.392994403839111e-05, -3.283098340034485e-05, -3.1732022762298584e-05, -3.063306212425232e-05, -2.9534101486206055e-05, -2.843514084815979e-05, -2.7336180210113525e-05, -2.623721957206726e-05, -2.5138258934020996e-05, -2.403929829597473e-05, -2.2940337657928467e-05, -2.1841377019882202e-05, -2.0742416381835938e-05, -1.9643455743789673e-05, -1.8544495105743408e-05, -1.7445534467697144e-05, -1.634657382965088e-05, -1.5247613191604614e-05, -1.414865255355835e-05, -1.3049691915512085e-05, -1.195073127746582e-05, -1.0851770639419556e-05, -9.752810001373291e-06, -8.653849363327026e-06, -7.554888725280762e-06, -6.455928087234497e-06, -5.356967449188232e-06, -4.258006811141968e-06, -3.159046173095703e-06, -2.0600855350494385e-06, -9.611248970031738e-07, 1.3783574104309082e-07, 1.2367963790893555e-06, 2.33575701713562e-06, 3.4347176551818848e-06, 4.533678293228149e-06, 5.632638931274414e-06, 6.731599569320679e-06, 7.830560207366943e-06, 8.929520845413208e-06, 1.0028481483459473e-05, 1.1127442121505737e-05, 1.2226402759552002e-05, 1.3325363397598267e-05, 1.4424324035644531e-05, 1.5523284673690796e-05, 1.662224531173706e-05, 1.7721205949783325e-05, 1.882016658782959e-05, 1.9919127225875854e-05, 2.101808786392212e-05, 2.2117048501968384e-05, 2.321600914001465e-05, 2.4314969778060913e-05, 2.5413930416107178e-05, 2.6512891054153442e-05, 2.7611851692199707e-05, 2.871081233024597e-05, 2.9809772968292236e-05, 3.09087336063385e-05, 3.2007694244384766e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 7.0, 10.0, 8.0, 16.0, 15.0, 19.0, 26.0, 22.0, 31.0, 37.0, 43.0, 39.0, 44.0, 39.0, 54.0, 75.0, 69.0, 51.0, 53.0, 52.0, 28.0, 37.0, 43.0, 34.0, 26.0, 24.0, 14.0, 14.0, 12.0, 21.0, 5.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.319450378417969e-05, -7.109809666872025e-05, -6.90016895532608e-05, -6.690528243780136e-05, -6.480887532234192e-05, -6.271246820688248e-05, -6.0616061091423035e-05, -5.851965397596359e-05, -5.642324686050415e-05, -5.432683974504471e-05, -5.2230432629585266e-05, -5.0134025514125824e-05, -4.803761839866638e-05, -4.594121128320694e-05, -4.38448041677475e-05, -4.1748397052288055e-05, -3.965198993682861e-05, -3.755558282136917e-05, -3.545917570590973e-05, -3.336276859045029e-05, -3.1266361474990845e-05, -2.9169954359531403e-05, -2.707354724407196e-05, -2.497714012861252e-05, -2.2880733013153076e-05, -2.0784325897693634e-05, -1.8687918782234192e-05, -1.659151166677475e-05, -1.4495104551315308e-05, -1.2398697435855865e-05, -1.0302290320396423e-05, -8.205883204936981e-06, -6.109476089477539e-06, -4.013068974018097e-06, -1.9166618585586548e-06, 1.7974525690078735e-07, 2.2761523723602295e-06, 4.372559487819672e-06, 6.468966603279114e-06, 8.565373718738556e-06, 1.0661780834197998e-05, 1.275818794965744e-05, 1.4854595065116882e-05, 1.6951002180576324e-05, 1.9047409296035767e-05, 2.114381641149521e-05, 2.324022352695465e-05, 2.5336630642414093e-05, 2.7433037757873535e-05, 2.9529444873332977e-05, 3.162585198879242e-05, 3.372225910425186e-05, 3.5818666219711304e-05, 3.7915073335170746e-05, 4.001148045063019e-05, 4.210788756608963e-05, 4.420429468154907e-05, 4.6300701797008514e-05, 4.8397108912467957e-05, 5.04935160279274e-05, 5.258992314338684e-05, 5.468633025884628e-05, 5.6782737374305725e-05, 5.887914448976517e-05, 6.097555160522461e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 6.0, 3.0, 4.0, 7.0, 6.0, 10.0, 13.0, 18.0, 16.0, 17.0, 37.0, 43.0, 67.0, 85.0, 211.0, 573.0, 926811.0, 119732.0, 469.0, 165.0, 74.0, 35.0, 31.0, 30.0, 25.0, 15.0, 17.0, 9.0, 6.0, 5.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00029659271240234375, -0.00028759613633155823, -0.0002785995602607727, -0.0002696029841899872, -0.00026060640811920166, -0.00025160983204841614, -0.00024261325597763062, -0.0002336166799068451, -0.00022462010383605957, -0.00021562352776527405, -0.00020662695169448853, -0.000197630375623703, -0.00018863379955291748, -0.00017963722348213196, -0.00017064064741134644, -0.0001616440713405609, -0.0001526474952697754, -0.00014365091919898987, -0.00013465434312820435, -0.00012565776705741882, -0.0001166611909866333, -0.00010766461491584778, -9.866803884506226e-05, -8.967146277427673e-05, -8.067488670349121e-05, -7.167831063270569e-05, -6.268173456192017e-05, -5.3685158491134644e-05, -4.468858242034912e-05, -3.56920063495636e-05, -2.6695430278778076e-05, -1.7698854207992554e-05, -8.702278137207031e-06, 2.942979335784912e-07, 9.290874004364014e-06, 1.8287450075149536e-05, 2.728402614593506e-05, 3.628060221672058e-05, 4.5277178287506104e-05, 5.4273754358291626e-05, 6.327033042907715e-05, 7.226690649986267e-05, 8.12634825706482e-05, 9.026005864143372e-05, 9.925663471221924e-05, 0.00010825321078300476, 0.00011724978685379028, 0.0001262463629245758, 0.00013524293899536133, 0.00014423951506614685, 0.00015323609113693237, 0.0001622326672077179, 0.00017122924327850342, 0.00018022581934928894, 0.00018922239542007446, 0.00019821897149085999, 0.0002072155475616455, 0.00021621212363243103, 0.00022520869970321655, 0.00023420527577400208, 0.0002432018518447876, 0.0002521984279155731, 0.00026119500398635864, 0.00027019158005714417, 0.0002791881561279297]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 6.0, 3.0, 6.0, 5.0, 7.0, 9.0, 12.0, 19.0, 18.0, 14.0, 33.0, 37.0, 49.0, 47.0, 82.0, 79.0, 110.0, 89.0, 75.0, 73.0, 49.0, 29.0, 32.0, 28.0, 26.0, 14.0, 17.0, 9.0, 5.0, 6.0, 9.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001442432403564453, -0.00013986602425575256, -0.00013548880815505981, -0.00013111159205436707, -0.00012673437595367432, -0.00012235715985298157, -0.00011797994375228882, -0.00011360272765159607, -0.00010922551155090332, -0.00010484829545021057, -0.00010047107934951782, -9.609386324882507e-05, -9.171664714813232e-05, -8.733943104743958e-05, -8.296221494674683e-05, -7.858499884605408e-05, -7.420778274536133e-05, -6.983056664466858e-05, -6.545335054397583e-05, -6.107613444328308e-05, -5.669891834259033e-05, -5.232170224189758e-05, -4.7944486141204834e-05, -4.3567270040512085e-05, -3.9190053939819336e-05, -3.481283783912659e-05, -3.0435621738433838e-05, -2.605840563774109e-05, -2.168118953704834e-05, -1.730397343635559e-05, -1.2926757335662842e-05, -8.549541234970093e-06, -4.172325134277344e-06, 2.0489096641540527e-07, 4.582107067108154e-06, 8.959323167800903e-06, 1.3336539268493652e-05, 1.77137553691864e-05, 2.209097146987915e-05, 2.64681875705719e-05, 3.084540367126465e-05, 3.52226197719574e-05, 3.9599835872650146e-05, 4.3977051973342896e-05, 4.8354268074035645e-05, 5.2731484174728394e-05, 5.710870027542114e-05, 6.148591637611389e-05, 6.586313247680664e-05, 7.024034857749939e-05, 7.461756467819214e-05, 7.899478077888489e-05, 8.337199687957764e-05, 8.774921298027039e-05, 9.212642908096313e-05, 9.650364518165588e-05, 0.00010088086128234863, 0.00010525807738304138, 0.00010963529348373413, 0.00011401250958442688, 0.00011838972568511963, 0.00012276694178581238, 0.00012714415788650513, 0.00013152137398719788, 0.00013589859008789062]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 5.0, 0.0, 3.0, 8.0, 12.0, 16.0, 14.0, 28.0, 24.0, 66.0, 87.0, 144.0, 262.0, 492.0, 970.0, 2409.0, 7246.0, 46212.0, 932665.0, 45744.0, 7465.0, 2576.0, 1015.0, 498.0, 257.0, 128.0, 68.0, 34.0, 22.0, 28.0, 4.0, 6.0, 9.0, 7.0, 4.0, 2.0, 2.0, 5.0, 2.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.8477439880371094e-06, -1.7872080206871033e-06, -1.7266720533370972e-06, -1.666136085987091e-06, -1.605600118637085e-06, -1.5450641512870789e-06, -1.4845281839370728e-06, -1.4239922165870667e-06, -1.3634562492370605e-06, -1.3029202818870544e-06, -1.2423843145370483e-06, -1.1818483471870422e-06, -1.1213123798370361e-06, -1.06077641248703e-06, -1.000240445137024e-06, -9.397044777870178e-07, -8.791685104370117e-07, -8.186325430870056e-07, -7.580965757369995e-07, -6.975606083869934e-07, -6.370246410369873e-07, -5.764886736869812e-07, -5.159527063369751e-07, -4.55416738986969e-07, -3.948807716369629e-07, -3.343448042869568e-07, -2.738088369369507e-07, -2.1327286958694458e-07, -1.5273690223693848e-07, -9.220093488693237e-08, -3.166496753692627e-08, 2.8870999813079834e-08, 8.940696716308594e-08, 1.4994293451309204e-07, 2.1047890186309814e-07, 2.7101486921310425e-07, 3.3155083656311035e-07, 3.9208680391311646e-07, 4.5262277126312256e-07, 5.131587386131287e-07, 5.736947059631348e-07, 6.342306733131409e-07, 6.94766640663147e-07, 7.553026080131531e-07, 8.158385753631592e-07, 8.763745427131653e-07, 9.369105100631714e-07, 9.974464774131775e-07, 1.0579824447631836e-06, 1.1185184121131897e-06, 1.1790543794631958e-06, 1.239590346813202e-06, 1.300126314163208e-06, 1.3606622815132141e-06, 1.4211982488632202e-06, 1.4817342162132263e-06, 1.5422701835632324e-06, 1.6028061509132385e-06, 1.6633421182632446e-06, 1.7238780856132507e-06, 1.7844140529632568e-06, 1.844950020313263e-06, 1.905485987663269e-06, 1.966021955013275e-06, 2.0265579223632812e-06]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 807.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 111.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 2.0, 8.0, 11.0, 14.0, 33.0, 24.0, 71.0, 71.0, 146.0, 200.0, 728.0, 1326.0, 4479.0, 49942.0, 984362.0, 4246.0, 1399.0, 645.0, 418.0, 140.0, 105.0, 53.0, 52.0, 21.0, 14.0, 15.0, 11.0, 2.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.827976226806641e-06, -4.693865776062012e-06, -4.559755325317383e-06, -4.425644874572754e-06, -4.291534423828125e-06, -4.157423973083496e-06, -4.023313522338867e-06, -3.889203071594238e-06, -3.7550926208496094e-06, -3.6209821701049805e-06, -3.4868717193603516e-06, -3.3527612686157227e-06, -3.2186508178710938e-06, -3.084540367126465e-06, -2.950429916381836e-06, -2.816319465637207e-06, -2.682209014892578e-06, -2.5480985641479492e-06, -2.4139881134033203e-06, -2.2798776626586914e-06, -2.1457672119140625e-06, -2.0116567611694336e-06, -1.8775463104248047e-06, -1.7434358596801758e-06, -1.6093254089355469e-06, -1.475214958190918e-06, -1.341104507446289e-06, -1.2069940567016602e-06, -1.0728836059570312e-06, -9.387731552124023e-07, -8.046627044677734e-07, -6.705522537231445e-07, -5.364418029785156e-07, -4.023313522338867e-07, -2.682209014892578e-07, -1.341104507446289e-07, 0.0, 1.341104507446289e-07, 2.682209014892578e-07, 4.023313522338867e-07, 5.364418029785156e-07, 6.705522537231445e-07, 8.046627044677734e-07, 9.387731552124023e-07, 1.0728836059570312e-06, 1.2069940567016602e-06, 1.341104507446289e-06, 1.475214958190918e-06, 1.6093254089355469e-06, 1.7434358596801758e-06, 1.8775463104248047e-06, 2.0116567611694336e-06, 2.1457672119140625e-06, 2.2798776626586914e-06, 2.4139881134033203e-06, 2.5480985641479492e-06, 2.682209014892578e-06, 2.816319465637207e-06, 2.950429916381836e-06, 3.084540367126465e-06, 3.2186508178710938e-06, 3.3527612686157227e-06, 3.4868717193603516e-06, 3.6209821701049805e-06, 3.7550926208496094e-06]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 7.0, 22.0, 0.0, 38.0, 74.0, 718.0, 0.0, 85.0, 35.0, 7.0, 0.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-07, -9.099021553993225e-07, -8.66129994392395e-07, -8.223578333854675e-07, -7.7858567237854e-07, -7.348135113716125e-07, -6.910413503646851e-07, -6.472691893577576e-07, -6.034970283508301e-07, -5.597248673439026e-07, -5.159527063369751e-07, -4.721805453300476e-07, -4.284083843231201e-07, -3.8463622331619263e-07, -3.4086406230926514e-07, -2.9709190130233765e-07, -2.5331974029541016e-07, -2.0954757928848267e-07, -1.6577541828155518e-07, -1.2200325727462769e-07, -7.82310962677002e-08, -3.4458935260772705e-08, 9.313225746154785e-09, 5.3085386753082275e-08, 9.685754776000977e-08, 1.4062970876693726e-07, 1.8440186977386475e-07, 2.2817403078079224e-07, 2.7194619178771973e-07, 3.157183527946472e-07, 3.594905138015747e-07, 4.032626748085022e-07, 4.470348358154297e-07, 4.908069968223572e-07, 5.345791578292847e-07, 5.783513188362122e-07, 6.221234798431396e-07, 6.658956408500671e-07, 7.096678018569946e-07, 7.534399628639221e-07, 7.972121238708496e-07, 8.409842848777771e-07, 8.847564458847046e-07, 9.285286068916321e-07, 9.723007678985596e-07, 1.016072928905487e-06, 1.0598450899124146e-06, 1.103617250919342e-06, 1.1473894119262695e-06, 1.191161572933197e-06, 1.2349337339401245e-06, 1.278705894947052e-06, 1.3224780559539795e-06, 1.366250216960907e-06, 1.4100223779678345e-06, 1.453794538974762e-06, 1.4975666999816895e-06, 1.541338860988617e-06, 1.5851110219955444e-06, 1.628883183002472e-06, 1.6726553440093994e-06, 1.716427505016327e-06, 1.7601996660232544e-06, 1.8039718270301819e-06, 1.8477439880371094e-06]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 18.0, 977.0, 23.0, 1.0], "bins": [-0.0011164582101628184, -0.0010983212850987911, -0.001080184243619442, -0.0010620473185554147, -0.0010439102770760655, -0.0010257733520120382, -0.001007636426948011, -0.0009894993854686618, -0.0009713624604046345, -0.0009532254771329463, -0.000935088493861258, -0.0009169515687972307, -0.0008988145855255425, -0.0008806776022538543, -0.000862540618982166, -0.0008444036357104778, -0.0008262666524387896, -0.0008081296691671014, -0.0007899926858954132, -0.0007718557608313859, -0.0007537187775596976, -0.0007355817942880094, -0.0007174448110163212, -0.000699307827744633, -0.0006811708444729447, -0.0006630338612012565, -0.0006448968779295683, -0.000626759952865541, -0.0006086229695938528, -0.0005904859863221645, -0.0005723490030504763, -0.0005542120197787881, -0.0005360750947147608, -0.0005179381114430726, -0.0004998011281713843, -0.00048166417400352657, -0.0004635272198356688, -0.0004453902365639806, -0.00042725325329229236, -0.00040911627002060413, -0.0003909793449565768, -0.0003728423616848886, -0.00035470540751703084, -0.0003365684242453426, -0.00031843147007748485, -0.0003002944868057966, -0.0002821575035341084, -0.0002640205202624202, -0.0002458835660945624, -0.00022774659737478942, -0.00020960962865501642, -0.0001914726453833282, -0.0001733356766635552, -0.0001551987079437822, -0.000137061724672094, -0.00011892475595232099, -0.00010078777268063277, -8.265080396085978e-05, -6.451382796512917e-05, -4.6376855607377365e-05, -2.8239883249625564e-05, -1.0102914529852569e-05, 8.03406146587804e-06, 2.6171037461608648e-05, 4.4308002543402836e-05]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 9.0, 8.0, 7.0, 12.0, 9.0, 14.0, 11.0, 14.0, 17.0, 24.0, 28.0, 27.0, 30.0, 42.0, 29.0, 38.0, 40.0, 53.0, 37.0, 52.0, 32.0, 45.0, 40.0, 32.0, 36.0, 33.0, 38.0, 32.0, 31.0, 30.0, 25.0, 18.0, 16.0, 18.0, 12.0, 15.0, 9.0, 8.0, 6.0, 4.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00014231508248485625, -0.00013800666783936322, -0.00013369826774578542, -0.0001293898676522076, -0.00012508145300671458, -0.00012077304563717917, -0.00011646463826764375, -0.00011215623089810833, -0.00010784782352857292, -0.0001035394161590375, -9.923100878950208e-05, -9.492260141996667e-05, -9.061419405043125e-05, -8.630578668089584e-05, -8.199737931136042e-05, -7.7688971941825e-05, -7.338056457228959e-05, -6.907215720275417e-05, -6.476374983321875e-05, -6.045534246368334e-05, -5.614693509414792e-05, -5.1838527724612504e-05, -4.753012035507709e-05, -4.322171298554167e-05, -3.8913305616006255e-05, -3.460489824647084e-05, -3.0296490876935422e-05, -2.5988083507400006e-05, -2.167967613786459e-05, -1.7371268768329173e-05, -1.3062861398793757e-05, -8.75445402925834e-06, -4.446032107807696e-06, -1.376247382722795e-07, 4.170782631263137e-06, 8.479190000798553e-06, 1.278759737033397e-05, 1.7096004739869386e-05, 2.1404412109404802e-05, 2.571281947894022e-05, 3.0021226848475635e-05, 3.432963421801105e-05, 3.863804158754647e-05, 4.2946448957081884e-05, 4.72548563266173e-05, 5.156326369615272e-05, 5.587167106568813e-05, 6.018007843522355e-05, 6.448848580475897e-05, 6.879689317429438e-05, 7.31053005438298e-05, 7.741370791336522e-05, 8.172211528290063e-05, 8.603052265243605e-05, 9.033893002197146e-05, 9.464733739150688e-05, 9.89557447610423e-05, 0.00010326415213057771, 0.00010757255950011313, 0.00011188096686964855, 0.00011618937423918396, 0.00012049778160871938, 0.0001248061889782548, 0.00012911460362374783, 0.00013342300371732563]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 7.0, 0.0, 6.0, 20.0, 5.0, 8.0, 25.0, 10.0, 53.0, 22.0, 20.0, 81.0, 52.0, 191.0, 82.0, 316.0, 526.0, 2354.0, 58859.0, 4123546.0, 6071.0, 963.0, 383.0, 95.0, 237.0, 32.0, 85.0, 67.0, 24.0, 54.0, 25.0, 8.0, 22.0, 10.0, 5.0, 18.0, 1.0, 2.0, 5.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30752944946289e-05, -7.029063999652863e-05, -6.750598549842834e-05, -6.472133100032806e-05, -6.193667650222778e-05, -5.91520220041275e-05, -5.636736750602722e-05, -5.358271300792694e-05, -5.079805850982666e-05, -4.801340401172638e-05, -4.52287495136261e-05, -4.244409501552582e-05, -3.965944051742554e-05, -3.6874786019325256e-05, -3.4090131521224976e-05, -3.1305477023124695e-05, -2.8520822525024414e-05, -2.5736168026924133e-05, -2.2951513528823853e-05, -2.0166859030723572e-05, -1.738220453262329e-05, -1.459755003452301e-05, -1.181289553642273e-05, -9.028241038322449e-06, -6.243586540222168e-06, -3.458932042121887e-06, -6.742775440216064e-07, 2.1103769540786743e-06, 4.895031452178955e-06, 7.679685950279236e-06, 1.0464340448379517e-05, 1.3248994946479797e-05, 1.6033649444580078e-05, 1.881830394268036e-05, 2.160295844078064e-05, 2.438761293888092e-05, 2.71722674369812e-05, 2.9956921935081482e-05, 3.274157643318176e-05, 3.5526230931282043e-05, 3.8310885429382324e-05, 4.1095539927482605e-05, 4.3880194425582886e-05, 4.6664848923683167e-05, 4.944950342178345e-05, 5.223415791988373e-05, 5.501881241798401e-05, 5.780346691608429e-05, 6.058812141418457e-05, 6.337277591228485e-05, 6.615743041038513e-05, 6.894208490848541e-05, 7.17267394065857e-05, 7.451139390468597e-05, 7.729604840278625e-05, 8.008070290088654e-05, 8.286535739898682e-05, 8.56500118970871e-05, 8.843466639518738e-05, 9.121932089328766e-05, 9.400397539138794e-05, 9.678862988948822e-05, 9.95732843875885e-05, 0.00010235793888568878, 0.00010514259338378906]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 5.0, 7.0, 12.0, 14.0, 15.0, 17.0, 26.0, 29.0, 35.0, 47.0, 66.0, 75.0, 72.0, 64.0, 79.0, 60.0, 57.0, 51.0, 59.0, 43.0, 49.0, 38.0, 15.0, 21.0, 9.0, 5.0, 9.0, 5.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.043081283569336e-05, -1.0058283805847168e-05, -9.685754776000977e-06, -9.313225746154785e-06, -8.940696716308594e-06, -8.568167686462402e-06, -8.195638656616211e-06, -7.82310962677002e-06, -7.450580596923828e-06, -7.078051567077637e-06, -6.705522537231445e-06, -6.332993507385254e-06, -5.9604644775390625e-06, -5.587935447692871e-06, -5.21540641784668e-06, -4.842877388000488e-06, -4.470348358154297e-06, -4.0978193283081055e-06, -3.725290298461914e-06, -3.3527612686157227e-06, -2.9802322387695312e-06, -2.60770320892334e-06, -2.2351741790771484e-06, -1.862645149230957e-06, -1.4901161193847656e-06, -1.1175870895385742e-06, -7.450580596923828e-07, -3.725290298461914e-07, 0.0, 3.725290298461914e-07, 7.450580596923828e-07, 1.1175870895385742e-06, 1.4901161193847656e-06, 1.862645149230957e-06, 2.2351741790771484e-06, 2.60770320892334e-06, 2.9802322387695312e-06, 3.3527612686157227e-06, 3.725290298461914e-06, 4.0978193283081055e-06, 4.470348358154297e-06, 4.842877388000488e-06, 5.21540641784668e-06, 5.587935447692871e-06, 5.9604644775390625e-06, 6.332993507385254e-06, 6.705522537231445e-06, 7.078051567077637e-06, 7.450580596923828e-06, 7.82310962677002e-06, 8.195638656616211e-06, 8.568167686462402e-06, 8.940696716308594e-06, 9.313225746154785e-06, 9.685754776000977e-06, 1.0058283805847168e-05, 1.043081283569336e-05, 1.080334186553955e-05, 1.1175870895385742e-05, 1.1548399925231934e-05, 1.1920928955078125e-05, 1.2293457984924316e-05, 1.2665987014770508e-05, 1.30385160446167e-05, 1.341104507446289e-05]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 2.0, 2.0, 11.0, 16.0, 13.0, 27.0, 36.0, 60.0, 105.0, 260.0, 515.0, 1396.0, 4159.0, 15807.0, 189990.0, 3930173.0, 40469.0, 7383.0, 2250.0, 854.0, 354.0, 148.0, 66.0, 44.0, 45.0, 25.0, 19.0, 10.0, 8.0, 10.0, 3.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6106834411621094e-05, -2.5029294192790985e-05, -2.3951753973960876e-05, -2.2874213755130768e-05, -2.179667353630066e-05, -2.071913331747055e-05, -1.9641593098640442e-05, -1.8564052879810333e-05, -1.7486512660980225e-05, -1.6408972442150116e-05, -1.5331432223320007e-05, -1.4253892004489899e-05, -1.317635178565979e-05, -1.2098811566829681e-05, -1.1021271347999573e-05, -9.943731129169464e-06, -8.866190910339355e-06, -7.788650691509247e-06, -6.711110472679138e-06, -5.6335702538490295e-06, -4.556030035018921e-06, -3.4784898161888123e-06, -2.4009495973587036e-06, -1.323409378528595e-06, -2.4586915969848633e-07, 8.316710591316223e-07, 1.909211277961731e-06, 2.9867514967918396e-06, 4.064291715621948e-06, 5.141831934452057e-06, 6.2193721532821655e-06, 7.296912372112274e-06, 8.374452590942383e-06, 9.451992809772491e-06, 1.05295330286026e-05, 1.1607073247432709e-05, 1.2684613466262817e-05, 1.3762153685092926e-05, 1.4839693903923035e-05, 1.5917234122753143e-05, 1.6994774341583252e-05, 1.807231456041336e-05, 1.914985477924347e-05, 2.0227394998073578e-05, 2.1304935216903687e-05, 2.2382475435733795e-05, 2.3460015654563904e-05, 2.4537555873394012e-05, 2.561509609222412e-05, 2.669263631105423e-05, 2.777017652988434e-05, 2.8847716748714447e-05, 2.9925256967544556e-05, 3.1002797186374664e-05, 3.208033740520477e-05, 3.315787762403488e-05, 3.423541784286499e-05, 3.53129580616951e-05, 3.639049828052521e-05, 3.7468038499355316e-05, 3.8545578718185425e-05, 3.9623118937015533e-05, 4.070065915584564e-05, 4.177819937467575e-05, 4.285573959350586e-05]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 4.0, 9.0, 4.0, 7.0, 10.0, 2.0, 14.0, 13.0, 18.0, 24.0, 33.0, 78.0, 113.0, 401.0, 1556.0, 968.0, 457.0, 124.0, 86.0, 43.0, 15.0, 22.0, 13.0, 11.0, 8.0, 2.0, 6.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.271766662597656e-06, -7.057562470436096e-06, -6.843358278274536e-06, -6.629154086112976e-06, -6.414949893951416e-06, -6.200745701789856e-06, -5.986541509628296e-06, -5.772337317466736e-06, -5.558133125305176e-06, -5.343928933143616e-06, -5.129724740982056e-06, -4.915520548820496e-06, -4.7013163566589355e-06, -4.4871121644973755e-06, -4.2729079723358154e-06, -4.058703780174255e-06, -3.844499588012695e-06, -3.6302953958511353e-06, -3.416091203689575e-06, -3.201887011528015e-06, -2.987682819366455e-06, -2.773478627204895e-06, -2.559274435043335e-06, -2.345070242881775e-06, -2.130866050720215e-06, -1.9166618585586548e-06, -1.7024576663970947e-06, -1.4882534742355347e-06, -1.2740492820739746e-06, -1.0598450899124146e-06, -8.456408977508545e-07, -6.314367055892944e-07, -4.172325134277344e-07, -2.0302832126617432e-07, 1.1175870895385742e-08, 2.253800630569458e-07, 4.3958425521850586e-07, 6.537884473800659e-07, 8.67992639541626e-07, 1.082196831703186e-06, 1.296401023864746e-06, 1.5106052160263062e-06, 1.7248094081878662e-06, 1.9390136003494263e-06, 2.1532177925109863e-06, 2.3674219846725464e-06, 2.5816261768341064e-06, 2.7958303689956665e-06, 3.0100345611572266e-06, 3.2242387533187866e-06, 3.4384429454803467e-06, 3.6526471376419067e-06, 3.866851329803467e-06, 4.081055521965027e-06, 4.295259714126587e-06, 4.509463906288147e-06, 4.723668098449707e-06, 4.937872290611267e-06, 5.152076482772827e-06, 5.366280674934387e-06, 5.580484867095947e-06, 5.794689059257507e-06, 6.008893251419067e-06, 6.2230974435806274e-06, 6.4373016357421875e-06]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 12.0, 12.0, 17.0, 31.0, 41.0, 88.0, 100.0, 169.0, 182.0, 137.0, 75.0, 47.0, 27.0, 27.0, 10.0, 7.0, 6.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.908163176267408e-05, -1.828828862926457e-05, -1.7494947314844467e-05, -1.670160418143496e-05, -1.590826104802545e-05, -1.5114918824110646e-05, -1.432157660019584e-05, -1.3528233466786332e-05, -1.2734890333376825e-05, -1.1941548109462019e-05, -1.1148204976052511e-05, -1.0354862752137706e-05, -9.561519618728198e-06, -8.768177394813392e-06, -7.974835170898587e-06, -7.181492037489079e-06, -6.388149813574273e-06, -5.5948071349121165e-06, -4.80146445624996e-06, -4.008122232335154e-06, -3.214779326299322e-06, -2.4214368750108406e-06, -1.628094196348684e-06, -8.347515176865272e-07, -4.1408839024370536e-08, 7.519337827943673e-07, 1.5452764046131051e-06, 2.338618969588424e-06, 3.1319616482505808e-06, 3.925304099539062e-06, 4.718646778201219e-06, 5.511989456863375e-06, 6.305332135525532e-06, 7.098674814187689e-06, 7.892017492849845e-06, 8.685359716764651e-06, 9.478702850174159e-06, 1.0272045074088965e-05, 1.106538729800377e-05, 1.1858730431413278e-05, 1.2652073564822786e-05, 1.3445415788737591e-05, 1.4238758922147099e-05, 1.5032101146061905e-05, 1.5825444279471412e-05, 1.6618785593891516e-05, 1.7412128727301024e-05, 1.820547186071053e-05, 1.8998813175130635e-05, 1.9792156308540143e-05, 2.0585497622960247e-05, 2.1378840756369755e-05, 2.2172183889779262e-05, 2.296552702318877e-05, 2.3758868337608874e-05, 2.455221147101838e-05, 2.534555460442789e-05, 2.6138897737837397e-05, 2.69322390522575e-05, 2.7725582185667008e-05, 2.8518925319076516e-05, 2.9312268452486023e-05, 3.0105609766906127e-05, 3.089895471930504e-05, 3.169229603372514e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 2.0, 6.0, 5.0, 5.0, 7.0, 13.0, 12.0, 13.0, 23.0, 14.0, 20.0, 26.0, 19.0, 27.0, 33.0, 37.0, 43.0, 26.0, 39.0, 37.0, 30.0, 47.0, 46.0, 42.0, 42.0, 34.0, 44.0, 27.0, 36.0, 32.0, 25.0, 28.0, 19.0, 15.0, 22.0, 15.0, 14.0, 12.0, 10.0, 12.0, 1.0, 7.0, 7.0, 8.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.579733730584849e-06, -8.296617124869954e-06, -8.013500519155059e-06, -7.730383913440164e-06, -7.44726776247262e-06, -7.164151156757725e-06, -6.8810350057901815e-06, -6.597918400075287e-06, -6.314801794360392e-06, -6.031685188645497e-06, -5.748568582930602e-06, -5.465452431963058e-06, -5.182335826248163e-06, -4.8992192205332685e-06, -4.616103069565725e-06, -4.33298646385083e-06, -4.049869858135935e-06, -3.76675325242104e-06, -3.4836368740798207e-06, -3.2005204957386013e-06, -2.9174038900237065e-06, -2.6342872843088116e-06, -2.3511709059675923e-06, -2.068054527626373e-06, -1.784937921911478e-06, -1.501821429883421e-06, -1.2187049378553638e-06, -9.355884458273067e-07, -6.524719537992496e-07, -3.693554617711925e-07, -8.623896974313539e-08, 1.96877408598084e-07, 4.799940143129788e-07, 7.631105063410359e-07, 1.046226998369093e-06, 1.3293434903971502e-06, 1.6124599824252073e-06, 1.8955764744532644e-06, 2.1786929664813215e-06, 2.461809344822541e-06, 2.7449259505374357e-06, 3.0280425562523305e-06, 3.31115893459355e-06, 3.5942753129347693e-06, 3.877391918649664e-06, 4.160508524364559e-06, 4.443624675332103e-06, 4.726741281046998e-06, 5.009857886761893e-06, 5.292974492476787e-06, 5.576091098191682e-06, 5.859207249159226e-06, 6.142323854874121e-06, 6.425440460589016e-06, 6.70855661155656e-06, 6.991673217271455e-06, 7.2747898229863495e-06, 7.557906428701244e-06, 7.841023034416139e-06, 8.124139640131034e-06, 8.407256245845929e-06, 8.690371942066122e-06, 8.973488547781017e-06, 9.256605153495912e-06, 9.539721759210806e-06]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 8.0, 8.0, 9.0, 10.0, 26.0, 16.0, 17.0, 31.0, 44.0, 164.0, 137.0, 180.0, 325.0, 1230.0, 1269.0, 2263.0, 4172.0, 26284.0, 45761.0, 153474.0, 577725.0, 199325.0, 17973.0, 8176.0, 4126.0, 2301.0, 2046.0, 480.0, 308.0, 201.0, 215.0, 69.0, 45.0, 22.0, 31.0, 22.0, 16.0, 12.0, 12.0, 11.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.086162567138672e-06, -2.012588083744049e-06, -1.9390136003494263e-06, -1.8654391169548035e-06, -1.7918646335601807e-06, -1.7182901501655579e-06, -1.644715666770935e-06, -1.5711411833763123e-06, -1.4975666999816895e-06, -1.4239922165870667e-06, -1.3504177331924438e-06, -1.276843249797821e-06, -1.2032687664031982e-06, -1.1296942830085754e-06, -1.0561197996139526e-06, -9.825453162193298e-07, -9.08970832824707e-07, -8.353963494300842e-07, -7.618218660354614e-07, -6.882473826408386e-07, -6.146728992462158e-07, -5.41098415851593e-07, -4.675239324569702e-07, -3.939494490623474e-07, -3.203749656677246e-07, -2.468004822731018e-07, -1.73225998878479e-07, -9.96515154838562e-08, -2.60770320892334e-08, 4.7497451305389404e-08, 1.210719347000122e-07, 1.94646418094635e-07, 2.682209014892578e-07, 3.417953848838806e-07, 4.153698682785034e-07, 4.889443516731262e-07, 5.62518835067749e-07, 6.360933184623718e-07, 7.096678018569946e-07, 7.832422852516174e-07, 8.568167686462402e-07, 9.30391252040863e-07, 1.0039657354354858e-06, 1.0775402188301086e-06, 1.1511147022247314e-06, 1.2246891856193542e-06, 1.298263669013977e-06, 1.3718381524085999e-06, 1.4454126358032227e-06, 1.5189871191978455e-06, 1.5925616025924683e-06, 1.666136085987091e-06, 1.7397105693817139e-06, 1.8132850527763367e-06, 1.8868595361709595e-06, 1.9604340195655823e-06, 2.034008502960205e-06, 2.107582986354828e-06, 2.1811574697494507e-06, 2.2547319531440735e-06, 2.3283064365386963e-06, 2.401880919933319e-06, 2.475455403327942e-06, 2.5490298867225647e-06, 2.6226043701171875e-06]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 4.0, 5.0, 4.0, 9.0, 7.0, 14.0, 13.0, 15.0, 24.0, 18.0, 20.0, 38.0, 32.0, 41.0, 32.0, 60.0, 33.0, 49.0, 45.0, 69.0, 63.0, 39.0, 59.0, 31.0, 45.0, 30.0, 33.0, 23.0, 26.0, 17.0, 21.0, 17.0, 6.0, 10.0, 10.0, 2.0, 3.0, 11.0, 7.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-06, -6.346963346004486e-06, -6.137415766716003e-06, -5.927868187427521e-06, -5.718320608139038e-06, -5.508773028850555e-06, -5.299225449562073e-06, -5.08967787027359e-06, -4.880130290985107e-06, -4.670582711696625e-06, -4.461035132408142e-06, -4.2514875531196594e-06, -4.041939973831177e-06, -3.832392394542694e-06, -3.6228448152542114e-06, -3.4132972359657288e-06, -3.203749656677246e-06, -2.9942020773887634e-06, -2.7846544981002808e-06, -2.575106918811798e-06, -2.3655593395233154e-06, -2.1560117602348328e-06, -1.94646418094635e-06, -1.7369166016578674e-06, -1.5273690223693848e-06, -1.317821443080902e-06, -1.1082738637924194e-06, -8.987262845039368e-07, -6.891787052154541e-07, -4.796311259269714e-07, -2.7008354663848877e-07, -6.05359673500061e-08, 1.4901161193847656e-07, 3.5855919122695923e-07, 5.681067705154419e-07, 7.776543498039246e-07, 9.872019290924072e-07, 1.1967495083808899e-06, 1.4062970876693726e-06, 1.6158446669578552e-06, 1.8253922462463379e-06, 2.0349398255348206e-06, 2.2444874048233032e-06, 2.454034984111786e-06, 2.6635825634002686e-06, 2.8731301426887512e-06, 3.082677721977234e-06, 3.2922253012657166e-06, 3.5017728805541992e-06, 3.711320459842682e-06, 3.9208680391311646e-06, 4.130415618419647e-06, 4.33996319770813e-06, 4.5495107769966125e-06, 4.759058356285095e-06, 4.968605935573578e-06, 5.1781535148620605e-06, 5.387701094150543e-06, 5.597248673439026e-06, 5.8067962527275085e-06, 6.016343832015991e-06, 6.225891411304474e-06, 6.4354389905929565e-06, 6.644986569881439e-06, 6.854534149169922e-06]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 5.0, 0.0, 18.0, 0.0, 37.0, 0.0, 0.0, 60.0, 0.0, 183.0, 0.0, 482.0, 0.0, 1214.0, 0.0, 0.0, 3577.0, 0.0, 10584.0, 0.0, 35893.0, 0.0, 0.0, 153599.0, 0.0, 639548.0, 0.0, 152931.0, 0.0, 35202.0, 0.0, 0.0, 10163.0, 0.0, 3277.0, 0.0, 1123.0, 0.0, 0.0, 427.0, 0.0, 142.0, 0.0, 64.0, 0.0, 21.0, 0.0, 0.0, 10.0, 0.0, 5.0, 0.0, 2.0, 0.0, 2.0], "bins": [-8.940696716308594e-07, -8.67992639541626e-07, -8.419156074523926e-07, -8.158385753631592e-07, -7.897615432739258e-07, -7.636845111846924e-07, -7.37607479095459e-07, -7.115304470062256e-07, -6.854534149169922e-07, -6.593763828277588e-07, -6.332993507385254e-07, -6.07222318649292e-07, -5.811452865600586e-07, -5.550682544708252e-07, -5.289912223815918e-07, -5.029141902923584e-07, -4.76837158203125e-07, -4.507601261138916e-07, -4.246830940246582e-07, -3.986060619354248e-07, -3.725290298461914e-07, -3.46451997756958e-07, -3.203749656677246e-07, -2.942979335784912e-07, -2.682209014892578e-07, -2.421438694000244e-07, -2.1606683731079102e-07, -1.8998980522155762e-07, -1.6391277313232422e-07, -1.3783574104309082e-07, -1.1175870895385742e-07, -8.568167686462402e-08, -5.960464477539063e-08, -3.3527612686157227e-08, -7.450580596923828e-09, 1.862645149230957e-08, 4.470348358154297e-08, 7.078051567077637e-08, 9.685754776000977e-08, 1.2293457984924316e-07, 1.4901161193847656e-07, 1.7508864402770996e-07, 2.0116567611694336e-07, 2.2724270820617676e-07, 2.5331974029541016e-07, 2.7939677238464355e-07, 3.0547380447387695e-07, 3.3155083656311035e-07, 3.5762786865234375e-07, 3.8370490074157715e-07, 4.0978193283081055e-07, 4.3585896492004395e-07, 4.6193599700927734e-07, 4.880130290985107e-07, 5.140900611877441e-07, 5.401670932769775e-07, 5.662441253662109e-07, 5.923211574554443e-07, 6.183981895446777e-07, 6.444752216339111e-07, 6.705522537231445e-07, 6.966292858123779e-07, 7.227063179016113e-07, 7.487833499908447e-07, 7.748603820800781e-07]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 1.0, 7.0, 4.0, 5.0, 8.0, 8.0, 10.0, 10.0, 19.0, 19.0, 20.0, 23.0, 23.0, 25.0, 22.0, 40.0, 36.0, 33.0, 49.0, 60.0, 53.0, 38.0, 53.0, 44.0, 46.0, 60.0, 45.0, 31.0, 26.0, 25.0, 20.0, 27.0, 22.0, 13.0, 14.0, 10.0, 8.0, 14.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.4781951904296875e-05, -1.4355406165122986e-05, -1.3928860425949097e-05, -1.3502314686775208e-05, -1.3075768947601318e-05, -1.264922320842743e-05, -1.222267746925354e-05, -1.1796131730079651e-05, -1.1369585990905762e-05, -1.0943040251731873e-05, -1.0516494512557983e-05, -1.0089948773384094e-05, -9.663403034210205e-06, -9.236857295036316e-06, -8.810311555862427e-06, -8.383765816688538e-06, -7.957220077514648e-06, -7.530674338340759e-06, -7.10412859916687e-06, -6.677582859992981e-06, -6.251037120819092e-06, -5.824491381645203e-06, -5.3979456424713135e-06, -4.971399903297424e-06, -4.544854164123535e-06, -4.118308424949646e-06, -3.691762685775757e-06, -3.2652169466018677e-06, -2.8386712074279785e-06, -2.4121254682540894e-06, -1.9855797290802e-06, -1.559033989906311e-06, -1.1324882507324219e-06, -7.059425115585327e-07, -2.7939677238464355e-07, 1.471489667892456e-07, 5.736947059631348e-07, 1.000240445137024e-06, 1.426786184310913e-06, 1.8533319234848022e-06, 2.2798776626586914e-06, 2.7064234018325806e-06, 3.1329691410064697e-06, 3.559514880180359e-06, 3.986060619354248e-06, 4.412606358528137e-06, 4.839152097702026e-06, 5.2656978368759155e-06, 5.692243576049805e-06, 6.118789315223694e-06, 6.545335054397583e-06, 6.971880793571472e-06, 7.398426532745361e-06, 7.82497227191925e-06, 8.25151801109314e-06, 8.678063750267029e-06, 9.104609489440918e-06, 9.531155228614807e-06, 9.957700967788696e-06, 1.0384246706962585e-05, 1.0810792446136475e-05, 1.1237338185310364e-05, 1.1663883924484253e-05, 1.2090429663658142e-05, 1.2516975402832031e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 557.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1047360.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 646.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-07, -1.1455267667770386e-07, -1.0989606380462646e-07, -1.0523945093154907e-07, -1.0058283805847168e-07, -9.592622518539429e-08, -9.12696123123169e-08, -8.66129994392395e-08, -8.195638656616211e-08, -7.729977369308472e-08, -7.264316082000732e-08, -6.798654794692993e-08, -6.332993507385254e-08, -5.8673322200775146e-08, -5.4016709327697754e-08, -4.936009645462036e-08, -4.470348358154297e-08, -4.0046870708465576e-08, -3.5390257835388184e-08, -3.073364496231079e-08, -2.60770320892334e-08, -2.1420419216156006e-08, -1.6763806343078613e-08, -1.210719347000122e-08, -7.450580596923828e-09, -2.7939677238464355e-09, 1.862645149230957e-09, 6.51925802230835e-09, 1.1175870895385742e-08, 1.5832483768463135e-08, 2.0489096641540527e-08, 2.514570951461792e-08, 2.9802322387695312e-08, 3.4458935260772705e-08, 3.91155481338501e-08, 4.377216100692749e-08, 4.842877388000488e-08, 5.3085386753082275e-08, 5.774199962615967e-08, 6.239861249923706e-08, 6.705522537231445e-08, 7.171183824539185e-08, 7.636845111846924e-08, 8.102506399154663e-08, 8.568167686462402e-08, 9.033828973770142e-08, 9.499490261077881e-08, 9.96515154838562e-08, 1.043081283569336e-07, 1.0896474123001099e-07, 1.1362135410308838e-07, 1.1827796697616577e-07, 1.2293457984924316e-07, 1.2759119272232056e-07, 1.3224780559539795e-07, 1.3690441846847534e-07, 1.4156103134155273e-07, 1.4621764421463013e-07, 1.5087425708770752e-07, 1.555308699607849e-07, 1.601874828338623e-07, 1.648440957069397e-07, 1.695007085800171e-07, 1.7415732145309448e-07, 1.7881393432617188e-07]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 193.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 499.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 212.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07, 1.862645149230957e-07, 1.9371509552001953e-07, 2.0116567611694336e-07, 2.086162567138672e-07, 2.1606683731079102e-07, 2.2351741790771484e-07, 2.3096799850463867e-07, 2.384185791015625e-07]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 10.0, 30.0, 46.0, 116.0, 262.0, 292.0, 140.0, 66.0, 25.0, 12.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.911319466482382e-06, -9.097376278077718e-06, -8.283433999167755e-06, -7.469490810763091e-06, -6.655548531853128e-06, -5.841605343448464e-06, -5.02766260979115e-06, -4.213719876133837e-06, -3.3997771424765233e-06, -2.5858344088192098e-06, -1.7718915614750586e-06, -9.579487141309073e-07, -1.440059804735938e-07, 6.699369805573951e-07, 1.4838797142147087e-06, 2.297822447872022e-06, 3.1117651815293357e-06, 3.925707915186649e-06, 4.739650648843963e-06, 5.553593837248627e-06, 6.36753611615859e-06, 7.181479304563254e-06, 7.995422492967919e-06, 8.809364771877881e-06, 9.623307050787844e-06, 1.0437250239192508e-05, 1.125119251810247e-05, 1.2065135706507135e-05, 1.2879077985417098e-05, 1.3693021173821762e-05, 1.4506964362226427e-05, 1.532090755063109e-05, 1.6134848920046352e-05, 1.6948792108451016e-05, 1.776273529685568e-05, 1.857667666627094e-05, 1.9390619854675606e-05, 2.020456304308027e-05, 2.1018506231484935e-05, 2.18324494198896e-05, 2.264639078930486e-05, 2.3460333977709524e-05, 2.427427716611419e-05, 2.508821853552945e-05, 2.5902161723934114e-05, 2.671610491233878e-05, 2.7530048100743443e-05, 2.8343991289148107e-05, 2.915793447755277e-05, 2.9971877665957436e-05, 3.07858208543621e-05, 3.1599764042766765e-05, 3.241370723117143e-05, 3.3227646781597286e-05, 3.404158997000195e-05, 3.4855533158406615e-05, 3.566947634681128e-05, 3.6483419535215944e-05, 3.729736272362061e-05, 3.811130591202527e-05, 3.892524910042994e-05, 3.97391922888346e-05, 4.055313183926046e-05, 4.136707502766512e-05, 4.218101821606979e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 6.0, 8.0, 8.0, 20.0, 16.0, 33.0, 28.0, 32.0, 38.0, 47.0, 56.0, 50.0, 48.0, 55.0, 65.0, 63.0, 59.0, 56.0, 49.0, 45.0, 35.0, 28.0, 27.0, 22.0, 26.0, 18.0, 9.0, 6.0, 8.0, 12.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.957397206657333e-06, -5.723979029426118e-06, -5.490560852194903e-06, -5.2571426749636885e-06, -5.0237244977324735e-06, -4.790306320501259e-06, -4.556887688522693e-06, -4.323469511291478e-06, -4.090051334060263e-06, -3.856633156829048e-06, -3.623214979597833e-06, -3.389796802366618e-06, -3.156378625135403e-06, -2.922960447904188e-06, -2.689542043299298e-06, -2.456123866068083e-06, -2.2227059162105434e-06, -1.9892877389793284e-06, -1.7558695617481135e-06, -1.5224512708300608e-06, -1.2890330935988459e-06, -1.055614916367631e-06, -8.221966254495783e-07, -5.887784482183633e-07, -3.553602709871484e-07, -1.2194206533422403e-07, 1.1147614031870035e-07, 3.4489437439333415e-07, 5.783125516245491e-07, 8.11730728855764e-07, 1.0451490197738167e-06, 1.2785671970050316e-06, 1.5119849194888957e-06, 1.7454030967201106e-06, 1.9788212739513256e-06, 2.2122394511825405e-06, 2.4456576284137554e-06, 2.6790758056449704e-06, 2.9124942102498608e-06, 3.1459123874810757e-06, 3.3793305647122907e-06, 3.6127487419435056e-06, 3.846167146548396e-06, 4.079585323779611e-06, 4.313003501010826e-06, 4.546421678242041e-06, 4.779839855473256e-06, 5.013258032704471e-06, 5.246676209935686e-06, 5.4800943871669006e-06, 5.7135125643981155e-06, 5.9469307416293304e-06, 6.180348918860545e-06, 6.41376709609176e-06, 6.647185728070326e-06, 6.880603905301541e-06, 7.114022082532756e-06, 7.347440259763971e-06, 7.580858436995186e-06, 7.814276614226401e-06, 8.047694791457616e-06, 8.28111296868883e-06, 8.514531145920046e-06, 8.74794932315126e-06, 8.981367500382476e-06]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 13.0, 12.0, 17.0, 34.0, 52.0, 88.0, 121.0, 261.0, 378.0, 1001.0, 2422.0, 16639.0, 162756.0, 797449.0, 58604.0, 5582.0, 1714.0, 599.0, 292.0, 204.0, 86.0, 87.0, 38.0, 30.0, 24.0, 15.0, 13.0, 6.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-06, -6.233341991901398e-06, -5.910173058509827e-06, -5.587004125118256e-06, -5.2638351917266846e-06, -4.9406662583351135e-06, -4.6174973249435425e-06, -4.2943283915519714e-06, -3.9711594581604e-06, -3.6479905247688293e-06, -3.3248215913772583e-06, -3.0016526579856873e-06, -2.678483724594116e-06, -2.355314791202545e-06, -2.032145857810974e-06, -1.708976924419403e-06, -1.385807991027832e-06, -1.062639057636261e-06, -7.394701242446899e-07, -4.163011908531189e-07, -9.313225746154785e-08, 2.300366759300232e-07, 5.532056093215942e-07, 8.763745427131653e-07, 1.1995434761047363e-06, 1.5227124094963074e-06, 1.8458813428878784e-06, 2.1690502762794495e-06, 2.4922192096710205e-06, 2.8153881430625916e-06, 3.1385570764541626e-06, 3.4617260098457336e-06, 3.7848949432373047e-06, 4.108063876628876e-06, 4.431232810020447e-06, 4.754401743412018e-06, 5.077570676803589e-06, 5.40073961019516e-06, 5.723908543586731e-06, 6.047077476978302e-06, 6.370246410369873e-06, 6.693415343761444e-06, 7.016584277153015e-06, 7.339753210544586e-06, 7.662922143936157e-06, 7.986091077327728e-06, 8.3092600107193e-06, 8.63242894411087e-06, 8.955597877502441e-06, 9.278766810894012e-06, 9.601935744285583e-06, 9.925104677677155e-06, 1.0248273611068726e-05, 1.0571442544460297e-05, 1.0894611477851868e-05, 1.1217780411243439e-05, 1.154094934463501e-05, 1.186411827802658e-05, 1.2187287211418152e-05, 1.2510456144809723e-05, 1.2833625078201294e-05, 1.3156794011592865e-05, 1.3479962944984436e-05, 1.3803131878376007e-05, 1.4126300811767578e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 11.0, 2.0, 10.0, 15.0, 15.0, 38.0, 34.0, 40.0, 51.0, 55.0, 60.0, 81.0, 78.0, 77.0, 81.0, 63.0, 50.0, 63.0, 48.0, 32.0, 20.0, 22.0, 15.0, 14.0, 10.0, 11.0, 1.0, 7.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8417835235595703e-05, -1.7547979950904846e-05, -1.667812466621399e-05, -1.5808269381523132e-05, -1.4938414096832275e-05, -1.4068558812141418e-05, -1.3198703527450562e-05, -1.2328848242759705e-05, -1.1458992958068848e-05, -1.058913767337799e-05, -9.719282388687134e-06, -8.849427103996277e-06, -7.97957181930542e-06, -7.109716534614563e-06, -6.239861249923706e-06, -5.370005965232849e-06, -4.500150680541992e-06, -3.6302953958511353e-06, -2.7604401111602783e-06, -1.8905848264694214e-06, -1.0207295417785645e-06, -1.5087425708770752e-07, 7.189810276031494e-07, 1.5888363122940063e-06, 2.4586915969848633e-06, 3.3285468816757202e-06, 4.198402166366577e-06, 5.068257451057434e-06, 5.938112735748291e-06, 6.807968020439148e-06, 7.677823305130005e-06, 8.547678589820862e-06, 9.417533874511719e-06, 1.0287389159202576e-05, 1.1157244443893433e-05, 1.202709972858429e-05, 1.2896955013275146e-05, 1.3766810297966003e-05, 1.463666558265686e-05, 1.5506520867347717e-05, 1.6376376152038574e-05, 1.724623143672943e-05, 1.8116086721420288e-05, 1.8985942006111145e-05, 1.9855797290802002e-05, 2.072565257549286e-05, 2.1595507860183716e-05, 2.2465363144874573e-05, 2.333521842956543e-05, 2.4205073714256287e-05, 2.5074928998947144e-05, 2.5944784283638e-05, 2.6814639568328857e-05, 2.7684494853019714e-05, 2.855435013771057e-05, 2.9424205422401428e-05, 3.0294060707092285e-05, 3.116391599178314e-05, 3.2033771276474e-05, 3.2903626561164856e-05, 3.377348184585571e-05, 3.464333713054657e-05, 3.551319241523743e-05, 3.6383047699928284e-05, 3.725290298461914e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 11.0, 16.0, 21.0, 35.0, 43.0, 76.0, 131.0, 223.0, 706.0, 7065.0, 1036990.0, 2271.0, 479.0, 204.0, 106.0, 60.0, 44.0, 25.0, 18.0, 13.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.547834396362305e-05, -4.4072046875953674e-05, -4.26657497882843e-05, -4.125945270061493e-05, -3.985315561294556e-05, -3.8446858525276184e-05, -3.704056143760681e-05, -3.563426434993744e-05, -3.4227967262268066e-05, -3.2821670174598694e-05, -3.141537308692932e-05, -3.000907599925995e-05, -2.8602778911590576e-05, -2.7196481823921204e-05, -2.579018473625183e-05, -2.438388764858246e-05, -2.2977590560913086e-05, -2.1571293473243713e-05, -2.016499638557434e-05, -1.8758699297904968e-05, -1.7352402210235596e-05, -1.5946105122566223e-05, -1.453980803489685e-05, -1.3133510947227478e-05, -1.1727213859558105e-05, -1.0320916771888733e-05, -8.91461968421936e-06, -7.508322596549988e-06, -6.102025508880615e-06, -4.695728421211243e-06, -3.28943133354187e-06, -1.8831342458724976e-06, -4.76837158203125e-07, 9.294599294662476e-07, 2.33575701713562e-06, 3.7420541048049927e-06, 5.148351192474365e-06, 6.554648280143738e-06, 7.96094536781311e-06, 9.367242455482483e-06, 1.0773539543151855e-05, 1.2179836630821228e-05, 1.35861337184906e-05, 1.4992430806159973e-05, 1.6398727893829346e-05, 1.7805024981498718e-05, 1.921132206916809e-05, 2.0617619156837463e-05, 2.2023916244506836e-05, 2.343021333217621e-05, 2.483651041984558e-05, 2.6242807507514954e-05, 2.7649104595184326e-05, 2.90554016828537e-05, 3.046169877052307e-05, 3.1867995858192444e-05, 3.3274292945861816e-05, 3.468059003353119e-05, 3.608688712120056e-05, 3.7493184208869934e-05, 3.889948129653931e-05, 4.030577838420868e-05, 4.171207547187805e-05, 4.3118372559547424e-05, 4.45246696472168e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 10.0, 10.0, 21.0, 22.0, 19.0, 42.0, 54.0, 88.0, 113.0, 135.0, 131.0, 107.0, 80.0, 65.0, 33.0, 19.0, 20.0, 8.0, 14.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.239248275756836e-05, -5.074404180049896e-05, -4.9095600843429565e-05, -4.744715988636017e-05, -4.579871892929077e-05, -4.4150277972221375e-05, -4.250183701515198e-05, -4.085339605808258e-05, -3.9204955101013184e-05, -3.755651414394379e-05, -3.590807318687439e-05, -3.425963222980499e-05, -3.2611191272735596e-05, -3.09627503156662e-05, -2.9314309358596802e-05, -2.7665868401527405e-05, -2.6017427444458008e-05, -2.436898648738861e-05, -2.2720545530319214e-05, -2.1072104573249817e-05, -1.942366361618042e-05, -1.7775222659111023e-05, -1.6126781702041626e-05, -1.4478340744972229e-05, -1.2829899787902832e-05, -1.1181458830833435e-05, -9.533017873764038e-06, -7.884576916694641e-06, -6.236135959625244e-06, -4.587695002555847e-06, -2.93925404548645e-06, -1.2908130884170532e-06, 3.5762786865234375e-07, 2.0060688257217407e-06, 3.6545097827911377e-06, 5.302950739860535e-06, 6.951391696929932e-06, 8.599832653999329e-06, 1.0248273611068726e-05, 1.1896714568138123e-05, 1.354515552520752e-05, 1.5193596482276917e-05, 1.6842037439346313e-05, 1.849047839641571e-05, 2.0138919353485107e-05, 2.1787360310554504e-05, 2.34358012676239e-05, 2.50842422246933e-05, 2.6732683181762695e-05, 2.8381124138832092e-05, 3.002956509590149e-05, 3.1678006052970886e-05, 3.332644701004028e-05, 3.497488796710968e-05, 3.662332892417908e-05, 3.8271769881248474e-05, 3.992021083831787e-05, 4.156865179538727e-05, 4.3217092752456665e-05, 4.486553370952606e-05, 4.651397466659546e-05, 4.8162415623664856e-05, 4.981085658073425e-05, 5.145929753780365e-05, 5.310773849487305e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 14.0, 6.0, 4.0, 16.0, 61.0, 70.0, 102.0, 147.0, 260.0, 562.0, 2901.0, 4158.0, 10089.0, 53521.0, 904629.0, 53623.0, 10017.0, 6152.0, 975.0, 508.0, 296.0, 172.0, 107.0, 73.0, 22.0, 18.0, 11.0, 8.0, 5.0, 3.0, 4.0, 1.0, 4.0, 5.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.0265579223632812e-06, -1.957640051841736e-06, -1.8887221813201904e-06, -1.819804310798645e-06, -1.7508864402770996e-06, -1.6819685697555542e-06, -1.6130506992340088e-06, -1.5441328287124634e-06, -1.475214958190918e-06, -1.4062970876693726e-06, -1.3373792171478271e-06, -1.2684613466262817e-06, -1.1995434761047363e-06, -1.130625605583191e-06, -1.0617077350616455e-06, -9.927898645401e-07, -9.238719940185547e-07, -8.549541234970093e-07, -7.860362529754639e-07, -7.171183824539185e-07, -6.48200511932373e-07, -5.792826414108276e-07, -5.103647708892822e-07, -4.414469003677368e-07, -3.725290298461914e-07, -3.03611159324646e-07, -2.3469328880310059e-07, -1.6577541828155518e-07, -9.685754776000977e-08, -2.7939677238464355e-08, 4.0978193283081055e-08, 1.0989606380462646e-07, 1.7881393432617188e-07, 2.477318048477173e-07, 3.166496753692627e-07, 3.855675458908081e-07, 4.544854164123535e-07, 5.234032869338989e-07, 5.923211574554443e-07, 6.612390279769897e-07, 7.301568984985352e-07, 7.990747690200806e-07, 8.67992639541626e-07, 9.369105100631714e-07, 1.0058283805847168e-06, 1.0747462511062622e-06, 1.1436641216278076e-06, 1.212581992149353e-06, 1.2814998626708984e-06, 1.3504177331924438e-06, 1.4193356037139893e-06, 1.4882534742355347e-06, 1.55717134475708e-06, 1.6260892152786255e-06, 1.695007085800171e-06, 1.7639249563217163e-06, 1.8328428268432617e-06, 1.9017606973648071e-06, 1.9706785678863525e-06, 2.039596438407898e-06, 2.1085143089294434e-06, 2.1774321794509888e-06, 2.246350049972534e-06, 2.3152679204940796e-06, 2.384185791015625e-06]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [84.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 849.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 4.0, 7.0, 22.0, 20.0, 48.0, 47.0, 118.0, 163.0, 211.0, 879.0, 1816.0, 19155.0, 945158.0, 75348.0, 4023.0, 690.0, 391.0, 163.0, 117.0, 50.0, 56.0, 41.0, 11.0, 11.0, 2.0, 1.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.708766937255859e-06, -4.555098712444305e-06, -4.4014304876327515e-06, -4.2477622628211975e-06, -4.0940940380096436e-06, -3.94042581319809e-06, -3.7867575883865356e-06, -3.6330893635749817e-06, -3.4794211387634277e-06, -3.3257529139518738e-06, -3.17208468914032e-06, -3.018416464328766e-06, -2.864748239517212e-06, -2.711080014705658e-06, -2.557411789894104e-06, -2.40374356508255e-06, -2.250075340270996e-06, -2.096407115459442e-06, -1.942738890647888e-06, -1.7890706658363342e-06, -1.6354024410247803e-06, -1.4817342162132263e-06, -1.3280659914016724e-06, -1.1743977665901184e-06, -1.0207295417785645e-06, -8.670613169670105e-07, -7.133930921554565e-07, -5.597248673439026e-07, -4.0605664253234863e-07, -2.523884177207947e-07, -9.872019290924072e-08, 5.494803190231323e-08, 2.086162567138672e-07, 3.6228448152542114e-07, 5.159527063369751e-07, 6.69620931148529e-07, 8.23289155960083e-07, 9.76957380771637e-07, 1.130625605583191e-06, 1.2842938303947449e-06, 1.4379620552062988e-06, 1.5916302800178528e-06, 1.7452985048294067e-06, 1.8989667296409607e-06, 2.0526349544525146e-06, 2.2063031792640686e-06, 2.3599714040756226e-06, 2.5136396288871765e-06, 2.6673078536987305e-06, 2.8209760785102844e-06, 2.9746443033218384e-06, 3.1283125281333923e-06, 3.2819807529449463e-06, 3.4356489777565002e-06, 3.589317202568054e-06, 3.742985427379608e-06, 3.896653652191162e-06, 4.050321877002716e-06, 4.20399010181427e-06, 4.357658326625824e-06, 4.511326551437378e-06, 4.664994776248932e-06, 4.818663001060486e-06, 4.97233122587204e-06, 5.125999450683594e-06]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 17.0, 14.0, 48.0, 86.0, 648.0, 88.0, 51.0, 21.0, 6.0, 9.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9669532775878906e-06, -1.9082799553871155e-06, -1.8496066331863403e-06, -1.7909333109855652e-06, -1.73225998878479e-06, -1.6735866665840149e-06, -1.6149133443832397e-06, -1.5562400221824646e-06, -1.4975666999816895e-06, -1.4388933777809143e-06, -1.3802200555801392e-06, -1.321546733379364e-06, -1.2628734111785889e-06, -1.2042000889778137e-06, -1.1455267667770386e-06, -1.0868534445762634e-06, -1.0281801223754883e-06, -9.695068001747131e-07, -9.10833477973938e-07, -8.521601557731628e-07, -7.934868335723877e-07, -7.348135113716125e-07, -6.761401891708374e-07, -6.174668669700623e-07, -5.587935447692871e-07, -5.00120222568512e-07, -4.414469003677368e-07, -3.8277357816696167e-07, -3.241002559661865e-07, -2.654269337654114e-07, -2.0675361156463623e-07, -1.4808028936386108e-07, -8.940696716308594e-08, -3.073364496231079e-08, 2.7939677238464355e-08, 8.66129994392395e-08, 1.4528632164001465e-07, 2.039596438407898e-07, 2.6263296604156494e-07, 3.213062882423401e-07, 3.7997961044311523e-07, 4.386529326438904e-07, 4.973262548446655e-07, 5.559995770454407e-07, 6.146728992462158e-07, 6.73346221446991e-07, 7.320195436477661e-07, 7.906928658485413e-07, 8.493661880493164e-07, 9.080395102500916e-07, 9.667128324508667e-07, 1.0253861546516418e-06, 1.084059476852417e-06, 1.1427327990531921e-06, 1.2014061212539673e-06, 1.2600794434547424e-06, 1.3187527656555176e-06, 1.3774260878562927e-06, 1.4360994100570679e-06, 1.494772732257843e-06, 1.5534460544586182e-06, 1.6121193766593933e-06, 1.6707926988601685e-06, 1.7294660210609436e-06, 1.7881393432617188e-06]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 75.0, 908.0, 29.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036680864286608994, -0.00035724983899854124, -0.000347691064234823, -0.0003381322603672743, -0.0003285734564997256, -0.0003190146526321769, -0.00030945587786845863, -0.0002998970740009099, -0.0002903382992371917, -0.000280779495369643, -0.0002712207206059247, -0.000261661916738376, -0.0002521031128708273, -0.00024254432355519384, -0.00023298553423956037, -0.00022342673037201166, -0.00021386792650446296, -0.00020430913718882948, -0.00019475033332128078, -0.0001851915440056473, -0.0001756327401380986, -0.00016607395082246512, -0.00015651516150683165, -0.00014695635763928294, -0.00013739756832364947, -0.000127838779008016, -0.00011827997514046729, -0.00010872118582483381, -9.916238923324272e-05, -8.960359264165163e-05, -8.004480332601815e-05, -7.048600673442706e-05, -6.092723924666643e-05, -5.136844265507534e-05, -4.180964970146306e-05, -3.2250856747850776e-05, -2.2692060156259686e-05, -1.3133263564668596e-05, -3.574470611056313e-06, 5.98432234255597e-06, 1.554311893414706e-05, 2.5101913706748746e-05, 3.466070847935043e-05, 4.4219501432962716e-05, 5.3778298024553806e-05, 6.33370946161449e-05, 7.289588393177837e-05, 8.245468052336946e-05, 9.201347711496055e-05, 0.00010157227370655164, 0.00011113107029814273, 0.00012068985961377621, 0.0001302486634813249, 0.0001398074527969584, 0.00014936624211259186, 0.00015892504598014057, 0.00016848383529577404, 0.00017804262461140752, 0.00018760142847895622, 0.0001971602177945897, 0.00020671900711022317, 0.00021627781097777188, 0.00022583660029340535, 0.00023539538960903883, 0.00024495419347658753]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 0.0, 4.0, 5.0, 3.0, 5.0, 10.0, 12.0, 8.0, 10.0, 18.0, 22.0, 26.0, 36.0, 31.0, 38.0, 39.0, 36.0, 41.0, 38.0, 37.0, 51.0, 46.0, 48.0, 42.0, 38.0, 45.0, 47.0, 34.0, 24.0, 30.0, 21.0, 22.0, 23.0, 22.0, 29.0, 14.0, 9.0, 10.0, 7.0, 4.0, 4.0, 5.0, 5.0, 1.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.586768434615806e-05, -3.480196392047219e-05, -3.3736239856807515e-05, -3.267051943112165e-05, -3.160479536745697e-05, -3.0539074941771105e-05, -2.9473352697095834e-05, -2.8407630452420563e-05, -2.734190820774529e-05, -2.627618596307002e-05, -2.521046371839475e-05, -2.4144741473719478e-05, -2.307902104803361e-05, -2.2013296984368935e-05, -2.0947576558683068e-05, -1.9881854314007796e-05, -1.8816132069332525e-05, -1.7750409824657254e-05, -1.6684687579981983e-05, -1.561896533530671e-05, -1.4553244000126142e-05, -1.348752175545087e-05, -1.2421800420270301e-05, -1.135607817559503e-05, -1.0290355930919759e-05, -9.224633686244488e-06, -8.158911441569217e-06, -7.093190106388647e-06, -6.027467861713376e-06, -4.961745617038105e-06, -3.896023827110184e-06, -2.830302037182264e-06, -1.7645761545281857e-06, -6.9885413722659e-07, 3.668678800750058e-07, 1.4325898973766016e-06, 2.4983119146781974e-06, 3.5640341593534686e-06, 4.629755949281389e-06, 5.695477739209309e-06, 6.7611999838845804e-06, 7.826922228559852e-06, 8.892644473235123e-06, 9.958365808415692e-06, 1.1024088053090964e-05, 1.2089810297766235e-05, 1.3155531632946804e-05, 1.4221253877622075e-05, 1.5286976122297347e-05, 1.6352698366972618e-05, 1.741842061164789e-05, 1.848414285632316e-05, 1.954986510099843e-05, 2.06155855266843e-05, 2.168130777135957e-05, 2.274703001603484e-05, 2.3812752260710113e-05, 2.4878474505385384e-05, 2.5944196750060655e-05, 2.7009918994735926e-05, 2.8075639420421794e-05, 2.914136348408647e-05, 3.0207083909772336e-05, 3.127280797343701e-05, 3.233852839912288e-05]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 10.0, 2.0, 1.0, 3.0, 5.0, 7.0, 32.0, 5.0, 20.0, 14.0, 20.0, 125.0, 66.0, 67.0, 96.0, 176.0, 461.0, 650.0, 1224.0, 3199.0, 11797.0, 900515.0, 3251607.0, 16863.0, 3834.0, 1519.0, 763.0, 470.0, 221.0, 117.0, 78.0, 68.0, 120.0, 24.0, 16.0, 15.0, 13.0, 37.0, 12.0, 4.0, 2.0, 2.0, 4.0, 11.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580881118774414e-05, -2.4856068193912506e-05, -2.390332520008087e-05, -2.2950582206249237e-05, -2.1997839212417603e-05, -2.1045096218585968e-05, -2.0092353224754333e-05, -1.91396102309227e-05, -1.8186867237091064e-05, -1.723412424325943e-05, -1.6281381249427795e-05, -1.532863825559616e-05, -1.4375895261764526e-05, -1.3423152267932892e-05, -1.2470409274101257e-05, -1.1517666280269623e-05, -1.0564923286437988e-05, -9.612180292606354e-06, -8.65943729877472e-06, -7.706694304943085e-06, -6.75395131111145e-06, -5.801208317279816e-06, -4.848465323448181e-06, -3.895722329616547e-06, -2.942979335784912e-06, -1.9902363419532776e-06, -1.037493348121643e-06, -8.475035429000854e-08, 8.67992639541626e-07, 1.8207356333732605e-06, 2.773478627204895e-06, 3.7262216210365295e-06, 4.678964614868164e-06, 5.631707608699799e-06, 6.584450602531433e-06, 7.537193596363068e-06, 8.489936590194702e-06, 9.442679584026337e-06, 1.0395422577857971e-05, 1.1348165571689606e-05, 1.230090856552124e-05, 1.3253651559352875e-05, 1.420639455318451e-05, 1.5159137547016144e-05, 1.611188054084778e-05, 1.7064623534679413e-05, 1.8017366528511047e-05, 1.8970109522342682e-05, 1.9922852516174316e-05, 2.087559551000595e-05, 2.1828338503837585e-05, 2.278108149766922e-05, 2.3733824491500854e-05, 2.468656748533249e-05, 2.5639310479164124e-05, 2.6592053472995758e-05, 2.7544796466827393e-05, 2.8497539460659027e-05, 2.945028245449066e-05, 3.0403025448322296e-05, 3.135576844215393e-05, 3.2308511435985565e-05, 3.32612544298172e-05, 3.4213997423648834e-05, 3.516674041748047e-05]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 5.0, 8.0, 6.0, 4.0, 9.0, 18.0, 16.0, 17.0, 38.0, 32.0, 33.0, 42.0, 37.0, 62.0, 45.0, 48.0, 74.0, 62.0, 30.0, 58.0, 41.0, 37.0, 50.0, 37.0, 34.0, 24.0, 23.0, 23.0, 12.0, 18.0, 15.0, 4.0, 7.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.258487701416016e-06, -6.058253347873688e-06, -5.85801899433136e-06, -5.657784640789032e-06, -5.457550287246704e-06, -5.257315933704376e-06, -5.057081580162048e-06, -4.8568472266197205e-06, -4.656612873077393e-06, -4.456378519535065e-06, -4.256144165992737e-06, -4.055909812450409e-06, -3.855675458908081e-06, -3.655441105365753e-06, -3.4552067518234253e-06, -3.2549723982810974e-06, -3.0547380447387695e-06, -2.8545036911964417e-06, -2.6542693376541138e-06, -2.454034984111786e-06, -2.253800630569458e-06, -2.05356627702713e-06, -1.8533319234848022e-06, -1.6530975699424744e-06, -1.4528632164001465e-06, -1.2526288628578186e-06, -1.0523945093154907e-06, -8.521601557731628e-07, -6.51925802230835e-07, -4.516914486885071e-07, -2.514570951461792e-07, -5.122274160385132e-08, 1.4901161193847656e-07, 3.4924596548080444e-07, 5.494803190231323e-07, 7.497146725654602e-07, 9.499490261077881e-07, 1.150183379650116e-06, 1.3504177331924438e-06, 1.5506520867347717e-06, 1.7508864402770996e-06, 1.9511207938194275e-06, 2.1513551473617554e-06, 2.3515895009040833e-06, 2.551823854446411e-06, 2.752058207988739e-06, 2.952292561531067e-06, 3.1525269150733948e-06, 3.3527612686157227e-06, 3.5529956221580505e-06, 3.7532299757003784e-06, 3.953464329242706e-06, 4.153698682785034e-06, 4.353933036327362e-06, 4.55416738986969e-06, 4.754401743412018e-06, 4.954636096954346e-06, 5.154870450496674e-06, 5.3551048040390015e-06, 5.555339157581329e-06, 5.755573511123657e-06, 5.955807864665985e-06, 6.156042218208313e-06, 6.356276571750641e-06, 6.556510925292969e-06]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 4.0, 10.0, 11.0, 19.0, 23.0, 33.0, 60.0, 87.0, 215.0, 715.0, 2243.0, 11912.0, 156387.0, 3989093.0, 26780.0, 4794.0, 1162.0, 414.0, 139.0, 68.0, 39.0, 16.0, 15.0, 8.0, 5.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.123283386230469e-05, -3.01264226436615e-05, -2.902001142501831e-05, -2.7913600206375122e-05, -2.6807188987731934e-05, -2.5700777769088745e-05, -2.4594366550445557e-05, -2.3487955331802368e-05, -2.238154411315918e-05, -2.127513289451599e-05, -2.0168721675872803e-05, -1.9062310457229614e-05, -1.7955899238586426e-05, -1.6849488019943237e-05, -1.574307680130005e-05, -1.463666558265686e-05, -1.3530254364013672e-05, -1.2423843145370483e-05, -1.1317431926727295e-05, -1.0211020708084106e-05, -9.104609489440918e-06, -7.99819827079773e-06, -6.891787052154541e-06, -5.7853758335113525e-06, -4.678964614868164e-06, -3.5725533962249756e-06, -2.466142177581787e-06, -1.3597309589385986e-06, -2.5331974029541016e-07, 8.530914783477783e-07, 1.959502696990967e-06, 3.0659139156341553e-06, 4.172325134277344e-06, 5.278736352920532e-06, 6.385147571563721e-06, 7.491558790206909e-06, 8.597970008850098e-06, 9.704381227493286e-06, 1.0810792446136475e-05, 1.1917203664779663e-05, 1.3023614883422852e-05, 1.413002610206604e-05, 1.5236437320709229e-05, 1.6342848539352417e-05, 1.7449259757995605e-05, 1.8555670976638794e-05, 1.9662082195281982e-05, 2.076849341392517e-05, 2.187490463256836e-05, 2.2981315851211548e-05, 2.4087727069854736e-05, 2.5194138288497925e-05, 2.6300549507141113e-05, 2.7406960725784302e-05, 2.851337194442749e-05, 2.961978316307068e-05, 3.072619438171387e-05, 3.1832605600357056e-05, 3.2939016819000244e-05, 3.404542803764343e-05, 3.515183925628662e-05, 3.625825047492981e-05, 3.7364661693573e-05, 3.8471072912216187e-05, 3.9577484130859375e-05]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 4.0, 4.0, 6.0, 5.0, 8.0, 10.0, 17.0, 22.0, 34.0, 63.0, 108.0, 465.0, 1011.0, 1629.0, 353.0, 148.0, 53.0, 34.0, 14.0, 16.0, 7.0, 14.0, 21.0, 6.0, 7.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.212162017822266e-06, -7.006339728832245e-06, -6.800517439842224e-06, -6.594695150852203e-06, -6.388872861862183e-06, -6.183050572872162e-06, -5.977228283882141e-06, -5.77140599489212e-06, -5.5655837059021e-06, -5.359761416912079e-06, -5.153939127922058e-06, -4.948116838932037e-06, -4.742294549942017e-06, -4.536472260951996e-06, -4.330649971961975e-06, -4.124827682971954e-06, -3.919005393981934e-06, -3.713183104991913e-06, -3.507360816001892e-06, -3.3015385270118713e-06, -3.0957162380218506e-06, -2.88989394903183e-06, -2.684071660041809e-06, -2.4782493710517883e-06, -2.2724270820617676e-06, -2.066604793071747e-06, -1.860782504081726e-06, -1.6549602150917053e-06, -1.4491379261016846e-06, -1.2433156371116638e-06, -1.037493348121643e-06, -8.316710591316223e-07, -6.258487701416016e-07, -4.200264811515808e-07, -2.1420419216156006e-07, -8.381903171539307e-09, 1.9744038581848145e-07, 4.032626748085022e-07, 6.09084963798523e-07, 8.149072527885437e-07, 1.0207295417785645e-06, 1.2265518307685852e-06, 1.432374119758606e-06, 1.6381964087486267e-06, 1.8440186977386475e-06, 2.0498409867286682e-06, 2.255663275718689e-06, 2.4614855647087097e-06, 2.6673078536987305e-06, 2.8731301426887512e-06, 3.078952431678772e-06, 3.2847747206687927e-06, 3.4905970096588135e-06, 3.6964192986488342e-06, 3.902241587638855e-06, 4.108063876628876e-06, 4.3138861656188965e-06, 4.519708454608917e-06, 4.725530743598938e-06, 4.931353032588959e-06, 5.1371753215789795e-06, 5.342997610569e-06, 5.548819899559021e-06, 5.754642188549042e-06, 5.9604644775390625e-06]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 3.0, 8.0, 9.0, 6.0, 9.0, 13.0, 17.0, 12.0, 35.0, 32.0, 55.0, 65.0, 81.0, 99.0, 116.0, 90.0, 76.0, 56.0, 38.0, 36.0, 37.0, 19.0, 14.0, 13.0, 15.0, 9.0, 7.0, 5.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.024055018206127e-05, -9.891364243230782e-06, -9.542178304400295e-06, -9.192992365569808e-06, -8.84380642673932e-06, -8.494620487908833e-06, -8.145434549078345e-06, -7.796248610247858e-06, -7.447063126164721e-06, -7.097877187334234e-06, -6.7486912485037465e-06, -6.39950576442061e-06, -6.0503198255901225e-06, -5.701133886759635e-06, -5.351947947929148e-06, -5.00276200909866e-06, -4.653576070268173e-06, -4.304390131437685e-06, -3.955204192607198e-06, -3.606018481150386e-06, -3.2568325423198985e-06, -2.907646603489411e-06, -2.558460892032599e-06, -2.2092749532021116e-06, -1.8600890143716242e-06, -1.5109030755411368e-06, -1.161717250397487e-06, -8.125314252538374e-07, -4.6334548642334994e-07, -1.1415954759286251e-07, 2.3502616386394948e-07, 5.842121026944369e-07, 9.333989510196261e-07, 1.2825848898501135e-06, 1.6317707149937632e-06, 1.980956540137413e-06, 2.3301424789679004e-06, 2.679328417798388e-06, 3.0285141292552e-06, 3.3777000680856872e-06, 3.7268860069161747e-06, 4.076071945746662e-06, 4.4252578845771495e-06, 4.774443368660286e-06, 5.1236293074907735e-06, 5.472815246321261e-06, 5.822001185151748e-06, 6.171187123982236e-06, 6.520373062812723e-06, 6.869559001643211e-06, 7.218744940473698e-06, 7.5679308793041855e-06, 7.917116818134673e-06, 8.26630275696516e-06, 8.615488695795648e-06, 8.964674634626135e-06, 9.313860573456623e-06, 9.66304651228711e-06, 1.0012232451117598e-05, 1.0361418389948085e-05, 1.0710604328778572e-05, 1.105979026760906e-05, 1.1408976206439547e-05, 1.1758162145270035e-05, 1.210734717460582e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 5.0, 3.0, 2.0, 4.0, 3.0, 7.0, 7.0, 10.0, 15.0, 12.0, 20.0, 11.0, 23.0, 31.0, 19.0, 22.0, 31.0, 32.0, 38.0, 38.0, 40.0, 48.0, 46.0, 37.0, 41.0, 43.0, 35.0, 42.0, 34.0, 31.0, 37.0, 25.0, 32.0, 26.0, 19.0, 31.0, 16.0, 12.0, 11.0, 13.0, 14.0, 9.0, 9.0, 3.0, 4.0, 7.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.260255304368911e-06, -6.040001153451158e-06, -5.819747457280755e-06, -5.5994933063630015e-06, -5.379239155445248e-06, -5.158985004527494e-06, -4.938731308357092e-06, -4.718477157439338e-06, -4.498223461268935e-06, -4.277969310351182e-06, -4.057715614180779e-06, -3.8374614632630255e-06, -3.617207312345272e-06, -3.396953388801194e-06, -3.1766994652571157e-06, -2.956445314339362e-06, -2.7361911634216085e-06, -2.5159372398775304e-06, -2.295683088959777e-06, -2.0754291654156987e-06, -1.8551751281847828e-06, -1.634921090953867e-06, -1.4146671674097888e-06, -1.194413130178873e-06, -9.741590929479571e-07, -7.539050557170413e-07, -5.336510753295443e-07, -3.1339709494204726e-07, -9.31430577111314e-08, 1.2711097951978445e-07, 3.473649030638626e-07, 5.676189402947784e-07, 7.878734322730452e-07, 1.008127469503961e-06, 1.2283815067348769e-06, 1.448635430278955e-06, 1.6688894675098709e-06, 1.8891435047407867e-06, 2.109397428284865e-06, 2.3296515792026184e-06, 2.5499055027466966e-06, 2.7701594262907747e-06, 2.9904135772085283e-06, 3.2106675007526064e-06, 3.4309214242966846e-06, 3.651175575214438e-06, 3.871429726132192e-06, 4.091683422302594e-06, 4.311937573220348e-06, 4.5321917241381016e-06, 4.752445420308504e-06, 4.972699571226258e-06, 5.192953722144011e-06, 5.413207873061765e-06, 5.633461569232168e-06, 5.853715720149921e-06, 6.073969416320324e-06, 6.2942235672380775e-06, 6.51447726340848e-06, 6.734731414326234e-06, 6.954985565243987e-06, 7.17523926141439e-06, 7.395493412332144e-06, 7.615747563249897e-06, 7.83600171416765e-06]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 5.0, 3.0, 5.0, 6.0, 4.0, 24.0, 23.0, 11.0, 31.0, 40.0, 66.0, 59.0, 108.0, 211.0, 147.0, 465.0, 1181.0, 4971.0, 9692.0, 181924.0, 799195.0, 33311.0, 13214.0, 2226.0, 427.0, 468.0, 269.0, 158.0, 42.0, 82.0, 64.0, 21.0, 26.0, 16.0, 14.0, 18.0, 11.0, 7.0, 1.0, 2.0, 6.0, 1.0, 1.0, 3.0, 1.0], "bins": [-3.993511199951172e-06, -3.891997039318085e-06, -3.7904828786849976e-06, -3.6889687180519104e-06, -3.5874545574188232e-06, -3.485940396785736e-06, -3.384426236152649e-06, -3.2829120755195618e-06, -3.1813979148864746e-06, -3.0798837542533875e-06, -2.9783695936203003e-06, -2.876855432987213e-06, -2.775341272354126e-06, -2.673827111721039e-06, -2.5723129510879517e-06, -2.4707987904548645e-06, -2.3692846298217773e-06, -2.26777046918869e-06, -2.166256308555603e-06, -2.064742147922516e-06, -1.9632279872894287e-06, -1.8617138266563416e-06, -1.7601996660232544e-06, -1.6586855053901672e-06, -1.55717134475708e-06, -1.455657184123993e-06, -1.3541430234909058e-06, -1.2526288628578186e-06, -1.1511147022247314e-06, -1.0496005415916443e-06, -9.480863809585571e-07, -8.4657222032547e-07, -7.450580596923828e-07, -6.435438990592957e-07, -5.420297384262085e-07, -4.4051557779312134e-07, -3.390014171600342e-07, -2.3748725652694702e-07, -1.3597309589385986e-07, -3.4458935260772705e-08, 6.705522537231445e-08, 1.685693860054016e-07, 2.7008354663848877e-07, 3.7159770727157593e-07, 4.731118679046631e-07, 5.746260285377502e-07, 6.761401891708374e-07, 7.776543498039246e-07, 8.791685104370117e-07, 9.806826710700989e-07, 1.082196831703186e-06, 1.1837109923362732e-06, 1.2852251529693604e-06, 1.3867393136024475e-06, 1.4882534742355347e-06, 1.5897676348686218e-06, 1.691281795501709e-06, 1.7927959561347961e-06, 1.8943101167678833e-06, 1.9958242774009705e-06, 2.0973384380340576e-06, 2.1988525986671448e-06, 2.300366759300232e-06, 2.401880919933319e-06, 2.5033950805664062e-06]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 9.0, 11.0, 12.0, 7.0, 16.0, 17.0, 25.0, 24.0, 17.0, 34.0, 40.0, 35.0, 54.0, 51.0, 29.0, 58.0, 47.0, 59.0, 57.0, 28.0, 47.0, 47.0, 44.0, 30.0, 23.0, 31.0, 28.0, 30.0, 13.0, 11.0, 14.0, 8.0, 17.0, 7.0, 3.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0531158447265625e-06, -3.885477781295776e-06, -3.7178397178649902e-06, -3.550201654434204e-06, -3.382563591003418e-06, -3.214925527572632e-06, -3.0472874641418457e-06, -2.8796494007110596e-06, -2.7120113372802734e-06, -2.5443732738494873e-06, -2.376735210418701e-06, -2.209097146987915e-06, -2.041459083557129e-06, -1.8738210201263428e-06, -1.7061829566955566e-06, -1.5385448932647705e-06, -1.3709068298339844e-06, -1.2032687664031982e-06, -1.0356307029724121e-06, -8.67992639541626e-07, -7.003545761108398e-07, -5.327165126800537e-07, -3.650784492492676e-07, -1.9744038581848145e-07, -2.9802322387695312e-08, 1.3783574104309082e-07, 3.0547380447387695e-07, 4.731118679046631e-07, 6.407499313354492e-07, 8.083879947662354e-07, 9.760260581970215e-07, 1.1436641216278076e-06, 1.3113021850585938e-06, 1.4789402484893799e-06, 1.646578311920166e-06, 1.8142163753509521e-06, 1.9818544387817383e-06, 2.1494925022125244e-06, 2.3171305656433105e-06, 2.4847686290740967e-06, 2.652406692504883e-06, 2.820044755935669e-06, 2.987682819366455e-06, 3.155320882797241e-06, 3.3229589462280273e-06, 3.4905970096588135e-06, 3.6582350730895996e-06, 3.825873136520386e-06, 3.993511199951172e-06, 4.161149263381958e-06, 4.328787326812744e-06, 4.49642539024353e-06, 4.664063453674316e-06, 4.8317015171051025e-06, 4.999339580535889e-06, 5.166977643966675e-06, 5.334615707397461e-06, 5.502253770828247e-06, 5.669891834259033e-06, 5.837529897689819e-06, 6.0051679611206055e-06, 6.172806024551392e-06, 6.340444087982178e-06, 6.508082151412964e-06, 6.67572021484375e-06]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 10.0, 0.0, 18.0, 0.0, 0.0, 82.0, 0.0, 0.0, 205.0, 0.0, 629.0, 0.0, 0.0, 1994.0, 0.0, 0.0, 7125.0, 0.0, 29230.0, 0.0, 0.0, 145795.0, 0.0, 0.0, 679746.0, 0.0, 144602.0, 0.0, 0.0, 29058.0, 0.0, 0.0, 7110.0, 0.0, 2029.0, 0.0, 0.0, 617.0, 0.0, 0.0, 193.0, 0.0, 82.0, 0.0, 0.0, 23.0, 0.0, 0.0, 10.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-7.152557373046875e-07, -6.92903995513916e-07, -6.705522537231445e-07, -6.48200511932373e-07, -6.258487701416016e-07, -6.034970283508301e-07, -5.811452865600586e-07, -5.587935447692871e-07, -5.364418029785156e-07, -5.140900611877441e-07, -4.917383193969727e-07, -4.6938657760620117e-07, -4.470348358154297e-07, -4.246830940246582e-07, -4.023313522338867e-07, -3.7997961044311523e-07, -3.5762786865234375e-07, -3.3527612686157227e-07, -3.129243850708008e-07, -2.905726432800293e-07, -2.682209014892578e-07, -2.4586915969848633e-07, -2.2351741790771484e-07, -2.0116567611694336e-07, -1.7881393432617188e-07, -1.564621925354004e-07, -1.341104507446289e-07, -1.1175870895385742e-07, -8.940696716308594e-08, -6.705522537231445e-08, -4.470348358154297e-08, -2.2351741790771484e-08, 0.0, 2.2351741790771484e-08, 4.470348358154297e-08, 6.705522537231445e-08, 8.940696716308594e-08, 1.1175870895385742e-07, 1.341104507446289e-07, 1.564621925354004e-07, 1.7881393432617188e-07, 2.0116567611694336e-07, 2.2351741790771484e-07, 2.4586915969848633e-07, 2.682209014892578e-07, 2.905726432800293e-07, 3.129243850708008e-07, 3.3527612686157227e-07, 3.5762786865234375e-07, 3.7997961044311523e-07, 4.023313522338867e-07, 4.246830940246582e-07, 4.470348358154297e-07, 4.6938657760620117e-07, 4.917383193969727e-07, 5.140900611877441e-07, 5.364418029785156e-07, 5.587935447692871e-07, 5.811452865600586e-07, 6.034970283508301e-07, 6.258487701416016e-07, 6.48200511932373e-07, 6.705522537231445e-07, 6.92903995513916e-07, 7.152557373046875e-07]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 0.0, 7.0, 9.0, 7.0, 11.0, 10.0, 20.0, 23.0, 27.0, 20.0, 22.0, 37.0, 44.0, 28.0, 35.0, 44.0, 35.0, 50.0, 42.0, 48.0, 49.0, 44.0, 36.0, 46.0, 32.0, 33.0, 32.0, 27.0, 24.0, 21.0, 20.0, 23.0, 14.0, 14.0, 10.0, 11.0, 8.0, 4.0, 10.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.1324882507324219e-05, -1.096632331609726e-05, -1.06077641248703e-05, -1.0249204933643341e-05, -9.890645742416382e-06, -9.532086551189423e-06, -9.173527359962463e-06, -8.814968168735504e-06, -8.456408977508545e-06, -8.097849786281586e-06, -7.739290595054626e-06, -7.380731403827667e-06, -7.022172212600708e-06, -6.663613021373749e-06, -6.3050538301467896e-06, -5.94649463891983e-06, -5.587935447692871e-06, -5.229376256465912e-06, -4.870817065238953e-06, -4.512257874011993e-06, -4.153698682785034e-06, -3.795139491558075e-06, -3.4365803003311157e-06, -3.0780211091041565e-06, -2.7194619178771973e-06, -2.360902726650238e-06, -2.002343535423279e-06, -1.6437843441963196e-06, -1.2852251529693604e-06, -9.266659617424011e-07, -5.681067705154419e-07, -2.0954757928848267e-07, 1.4901161193847656e-07, 5.075708031654358e-07, 8.66129994392395e-07, 1.2246891856193542e-06, 1.5832483768463135e-06, 1.9418075680732727e-06, 2.300366759300232e-06, 2.658925950527191e-06, 3.0174851417541504e-06, 3.3760443329811096e-06, 3.734603524208069e-06, 4.093162715435028e-06, 4.451721906661987e-06, 4.8102810978889465e-06, 5.168840289115906e-06, 5.527399480342865e-06, 5.885958671569824e-06, 6.2445178627967834e-06, 6.603077054023743e-06, 6.961636245250702e-06, 7.320195436477661e-06, 7.67875462770462e-06, 8.03731381893158e-06, 8.395873010158539e-06, 8.754432201385498e-06, 9.112991392612457e-06, 9.471550583839417e-06, 9.830109775066376e-06, 1.0188668966293335e-05, 1.0547228157520294e-05, 1.0905787348747253e-05, 1.1264346539974213e-05, 1.1622905731201172e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [33.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048480.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [46.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 217.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 528.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 196.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-07, -1.1362135410308838e-07, -1.0803341865539551e-07, -1.0244548320770264e-07, -9.685754776000977e-08, -9.12696123123169e-08, -8.568167686462402e-08, -8.009374141693115e-08, -7.450580596923828e-08, -6.891787052154541e-08, -6.332993507385254e-08, -5.774199962615967e-08, -5.21540641784668e-08, -4.6566128730773926e-08, -4.0978193283081055e-08, -3.5390257835388184e-08, -2.9802322387695312e-08, -2.421438694000244e-08, -1.862645149230957e-08, -1.30385160446167e-08, -7.450580596923828e-09, -1.862645149230957e-09, 3.725290298461914e-09, 9.313225746154785e-09, 1.4901161193847656e-08, 2.0489096641540527e-08, 2.60770320892334e-08, 3.166496753692627e-08, 3.725290298461914e-08, 4.284083843231201e-08, 4.842877388000488e-08, 5.4016709327697754e-08, 5.960464477539063e-08, 6.51925802230835e-08, 7.078051567077637e-08, 7.636845111846924e-08, 8.195638656616211e-08, 8.754432201385498e-08, 9.313225746154785e-08, 9.872019290924072e-08, 1.043081283569336e-07, 1.0989606380462646e-07, 1.1548399925231934e-07, 1.210719347000122e-07, 1.2665987014770508e-07, 1.3224780559539795e-07, 1.3783574104309082e-07, 1.434236764907837e-07, 1.4901161193847656e-07, 1.5459954738616943e-07, 1.601874828338623e-07, 1.6577541828155518e-07, 1.7136335372924805e-07, 1.7695128917694092e-07, 1.825392246246338e-07, 1.8812716007232666e-07, 1.9371509552001953e-07, 1.993030309677124e-07, 2.0489096641540527e-07, 2.1047890186309814e-07, 2.1606683731079102e-07, 2.2165477275848389e-07, 2.2724270820617676e-07, 2.3283064365386963e-07, 2.384185791015625e-07]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 5.0, 5.0, 17.0, 13.0, 29.0, 33.0, 43.0, 74.0, 104.0, 124.0, 159.0, 120.0, 62.0, 59.0, 37.0, 28.0, 21.0, 19.0, 12.0, 5.0, 8.0, 4.0, 5.0, 1.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.551963906531455e-06, -6.270994163060095e-06, -5.990024419588735e-06, -5.7090546761173755e-06, -5.428084932646016e-06, -5.147115189174656e-06, -4.866145445703296e-06, -4.585175702231936e-06, -4.304205958760576e-06, -4.0232362152892165e-06, -3.7422664718178567e-06, -3.461296728346497e-06, -3.180326984875137e-06, -2.899357241403777e-06, -2.6183874979324173e-06, -2.3374177544610575e-06, -2.0564480109896977e-06, -1.7754782675183378e-06, -1.494508524046978e-06, -1.2135387805756181e-06, -9.325690371042583e-07, -6.515992936328985e-07, -3.7062955016153865e-07, -8.965980669017881e-08, 1.9130993678118102e-07, 4.7227968025254086e-07, 7.532494237239007e-07, 1.0342191671952605e-06, 1.3151889106666204e-06, 1.5961586541379802e-06, 1.87712839760934e-06, 2.1580981410807e-06, 2.439067429804709e-06, 2.7200371732760686e-06, 3.0010069167474285e-06, 3.2819766602187883e-06, 3.562946403690148e-06, 3.843916147161508e-06, 4.124885890632868e-06, 4.405855634104228e-06, 4.6868253775755875e-06, 4.967795121046947e-06, 5.248764864518307e-06, 5.529734607989667e-06, 5.810704351461027e-06, 6.091674094932387e-06, 6.3726438384037465e-06, 6.653613581875106e-06, 6.934583325346466e-06, 7.215553068817826e-06, 7.496522812289186e-06, 7.777493010507897e-06, 8.058462299231905e-06, 8.339431587955914e-06, 8.620401786174625e-06, 8.901371984393336e-06, 9.182341273117345e-06, 9.463310561841354e-06, 9.744280760060064e-06, 1.0025250958278775e-05, 1.0306220247002784e-05, 1.0587189535726793e-05, 1.0868159733945504e-05, 1.1149129932164215e-05, 1.1430099220888223e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [5.0, 5.0, 1.0, 2.0, 6.0, 1.0, 3.0, 10.0, 12.0, 13.0, 13.0, 15.0, 23.0, 27.0, 29.0, 25.0, 30.0, 35.0, 46.0, 36.0, 52.0, 46.0, 54.0, 36.0, 60.0, 42.0, 40.0, 41.0, 36.0, 39.0, 27.0, 34.0, 27.0, 29.0, 20.0, 12.0, 18.0, 17.0, 7.0, 12.0, 5.0, 5.0, 10.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.628075546657783e-06, -3.4758527363010217e-06, -3.3236299259442603e-06, -3.171407115587499e-06, -3.0191840778570622e-06, -2.866961267500301e-06, -2.7147384571435396e-06, -2.562515419413103e-06, -2.410292836430017e-06, -2.2580700260732556e-06, -2.1058472157164942e-06, -1.9536241779860575e-06, -1.8014013676292961e-06, -1.6491785572725348e-06, -1.4969557469157735e-06, -1.3447328228721744e-06, -1.1925098988285754e-06, -1.040287088471814e-06, -8.88064164428215e-07, -7.358413540714537e-07, -5.836184868712735e-07, -4.313956196710933e-07, -2.7917280931433197e-07, -1.2694988527073292e-07, 2.5272925086028408e-08, 1.7749577807535388e-07, 3.2971863106467936e-07, 4.819414698431501e-07, 6.341643370433303e-07, 7.863872042435105e-07, 9.386100146002718e-07, 1.0908329386438709e-06, 1.2430555216269568e-06, 1.395278331983718e-06, 1.5475012560273171e-06, 1.6997240663840785e-06, 1.8519469904276775e-06, 2.004169800784439e-06, 2.1563926111412e-06, 2.3086154214979615e-06, 2.4608384592283983e-06, 2.6130612695851596e-06, 2.765284079941921e-06, 2.9175071176723577e-06, 3.069729928029119e-06, 3.2219527383858804e-06, 3.3741755487426417e-06, 3.526398359099403e-06, 3.6786211694561644e-06, 3.830843979812926e-06, 3.9830670175433625e-06, 4.135289600526448e-06, 4.287512638256885e-06, 4.439735675987322e-06, 4.591958258970408e-06, 4.7441812967008445e-06, 4.8964038796839304e-06, 5.048626917414367e-06, 5.200849500397453e-06, 5.35307253812789e-06, 5.505295121110976e-06, 5.6575181588414125e-06, 5.809741196571849e-06, 5.961963779554935e-06, 6.114186817285372e-06]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 5.0, 10.0, 11.0, 13.0, 18.0, 40.0, 49.0, 87.0, 117.0, 213.0, 264.0, 403.0, 816.0, 1258.0, 2708.0, 4183.0, 7532.0, 19981.0, 42010.0, 210763.0, 586758.0, 113333.0, 28967.0, 13124.0, 7682.0, 3365.0, 2150.0, 1027.0, 667.0, 378.0, 201.0, 167.0, 87.0, 52.0, 29.0, 18.0, 24.0, 8.0, 16.0, 10.0, 6.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.47713851928711e-06, -9.153969585895538e-06, -8.830800652503967e-06, -8.507631719112396e-06, -8.184462785720825e-06, -7.861293852329254e-06, -7.538124918937683e-06, -7.214955985546112e-06, -6.891787052154541e-06, -6.56861811876297e-06, -6.245449185371399e-06, -5.922280251979828e-06, -5.599111318588257e-06, -5.275942385196686e-06, -4.952773451805115e-06, -4.629604518413544e-06, -4.306435585021973e-06, -3.983266651630402e-06, -3.6600977182388306e-06, -3.3369287848472595e-06, -3.0137598514556885e-06, -2.6905909180641174e-06, -2.3674219846725464e-06, -2.0442530512809753e-06, -1.7210841178894043e-06, -1.3979151844978333e-06, -1.0747462511062622e-06, -7.515773177146912e-07, -4.284083843231201e-07, -1.0523945093154907e-07, 2.1792948246002197e-07, 5.41098415851593e-07, 8.642673492431641e-07, 1.1874362826347351e-06, 1.5106052160263062e-06, 1.8337741494178772e-06, 2.1569430828094482e-06, 2.4801120162010193e-06, 2.8032809495925903e-06, 3.1264498829841614e-06, 3.4496188163757324e-06, 3.7727877497673035e-06, 4.0959566831588745e-06, 4.4191256165504456e-06, 4.742294549942017e-06, 5.065463483333588e-06, 5.388632416725159e-06, 5.71180135011673e-06, 6.034970283508301e-06, 6.358139216899872e-06, 6.681308150291443e-06, 7.004477083683014e-06, 7.327646017074585e-06, 7.650814950466156e-06, 7.973983883857727e-06, 8.297152817249298e-06, 8.620321750640869e-06, 8.94349068403244e-06, 9.266659617424011e-06, 9.589828550815582e-06, 9.912997484207153e-06, 1.0236166417598724e-05, 1.0559335350990295e-05, 1.0882504284381866e-05, 1.1205673217773438e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 6.0, 3.0, 5.0, 8.0, 8.0, 13.0, 12.0, 23.0, 23.0, 25.0, 42.0, 39.0, 39.0, 53.0, 57.0, 59.0, 51.0, 77.0, 67.0, 47.0, 50.0, 46.0, 41.0, 32.0, 34.0, 33.0, 15.0, 17.0, 12.0, 15.0, 5.0, 16.0, 9.0, 6.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.761882781982422e-06, -8.45547765493393e-06, -8.149072527885437e-06, -7.842667400836945e-06, -7.536262273788452e-06, -7.22985714673996e-06, -6.923452019691467e-06, -6.617046892642975e-06, -6.310641765594482e-06, -6.00423663854599e-06, -5.6978315114974976e-06, -5.391426384449005e-06, -5.085021257400513e-06, -4.77861613035202e-06, -4.472211003303528e-06, -4.165805876255035e-06, -3.859400749206543e-06, -3.5529956221580505e-06, -3.246590495109558e-06, -2.9401853680610657e-06, -2.6337802410125732e-06, -2.327375113964081e-06, -2.0209699869155884e-06, -1.714564859867096e-06, -1.4081597328186035e-06, -1.101754605770111e-06, -7.953494787216187e-07, -4.889443516731262e-07, -1.825392246246338e-07, 1.2386590242385864e-07, 4.302710294723511e-07, 7.366761565208435e-07, 1.043081283569336e-06, 1.3494864106178284e-06, 1.6558915376663208e-06, 1.9622966647148132e-06, 2.2687017917633057e-06, 2.575106918811798e-06, 2.8815120458602905e-06, 3.187917172908783e-06, 3.4943222999572754e-06, 3.800727427005768e-06, 4.10713255405426e-06, 4.413537681102753e-06, 4.719942808151245e-06, 5.0263479351997375e-06, 5.33275306224823e-06, 5.639158189296722e-06, 5.945563316345215e-06, 6.251968443393707e-06, 6.5583735704422e-06, 6.864778697490692e-06, 7.1711838245391846e-06, 7.477588951587677e-06, 7.78399407863617e-06, 8.090399205684662e-06, 8.396804332733154e-06, 8.703209459781647e-06, 9.00961458683014e-06, 9.316019713878632e-06, 9.622424840927124e-06, 9.928829967975616e-06, 1.0235235095024109e-05, 1.0541640222072601e-05, 1.0848045349121094e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 7.0, 10.0, 18.0, 25.0, 25.0, 33.0, 56.0, 83.0, 108.0, 161.0, 205.0, 313.0, 598.0, 694.0, 1106.0, 1660.0, 2717.0, 5616.0, 8842.0, 17999.0, 48741.0, 205405.0, 586794.0, 113847.0, 25826.0, 11420.0, 6074.0, 3617.0, 2566.0, 1295.0, 848.0, 533.0, 396.0, 293.0, 162.0, 142.0, 83.0, 64.0, 47.0, 39.0, 30.0, 15.0, 12.0, 10.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.655952453613281e-06, -9.346753358840942e-06, -9.037554264068604e-06, -8.728355169296265e-06, -8.419156074523926e-06, -8.109956979751587e-06, -7.800757884979248e-06, -7.491558790206909e-06, -7.18235969543457e-06, -6.8731606006622314e-06, -6.563961505889893e-06, -6.254762411117554e-06, -5.945563316345215e-06, -5.636364221572876e-06, -5.327165126800537e-06, -5.017966032028198e-06, -4.708766937255859e-06, -4.3995678424835205e-06, -4.090368747711182e-06, -3.7811696529388428e-06, -3.471970558166504e-06, -3.162771463394165e-06, -2.853572368621826e-06, -2.5443732738494873e-06, -2.2351741790771484e-06, -1.9259750843048096e-06, -1.6167759895324707e-06, -1.3075768947601318e-06, -9.98377799987793e-07, -6.891787052154541e-07, -3.7997961044311523e-07, -7.078051567077637e-08, 2.384185791015625e-07, 5.476176738739014e-07, 8.568167686462402e-07, 1.166015863418579e-06, 1.475214958190918e-06, 1.7844140529632568e-06, 2.0936131477355957e-06, 2.4028122425079346e-06, 2.7120113372802734e-06, 3.0212104320526123e-06, 3.330409526824951e-06, 3.63960862159729e-06, 3.948807716369629e-06, 4.258006811141968e-06, 4.567205905914307e-06, 4.8764050006866455e-06, 5.185604095458984e-06, 5.494803190231323e-06, 5.804002285003662e-06, 6.113201379776001e-06, 6.42240047454834e-06, 6.731599569320679e-06, 7.040798664093018e-06, 7.3499977588653564e-06, 7.659196853637695e-06, 7.968395948410034e-06, 8.277595043182373e-06, 8.586794137954712e-06, 8.89599323272705e-06, 9.20519232749939e-06, 9.514391422271729e-06, 9.823590517044067e-06, 1.0132789611816406e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 6.0, 5.0, 12.0, 17.0, 15.0, 18.0, 22.0, 16.0, 27.0, 46.0, 33.0, 52.0, 36.0, 56.0, 34.0, 48.0, 69.0, 66.0, 44.0, 45.0, 47.0, 58.0, 29.0, 29.0, 26.0, 23.0, 16.0, 20.0, 10.0, 7.0, 16.0, 6.0, 2.0, 10.0, 6.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.0669231414794922e-05, -1.0359100997447968e-05, -1.0048970580101013e-05, -9.738840162754059e-06, -9.428709745407104e-06, -9.11857932806015e-06, -8.808448910713196e-06, -8.498318493366241e-06, -8.188188076019287e-06, -7.878057658672333e-06, -7.567927241325378e-06, -7.257796823978424e-06, -6.94766640663147e-06, -6.637535989284515e-06, -6.327405571937561e-06, -6.017275154590607e-06, -5.707144737243652e-06, -5.397014319896698e-06, -5.086883902549744e-06, -4.776753485202789e-06, -4.466623067855835e-06, -4.156492650508881e-06, -3.846362233161926e-06, -3.536231815814972e-06, -3.2261013984680176e-06, -2.9159709811210632e-06, -2.605840563774109e-06, -2.2957101464271545e-06, -1.9855797290802e-06, -1.6754493117332458e-06, -1.3653188943862915e-06, -1.0551884770393372e-06, -7.450580596923828e-07, -4.3492764234542847e-07, -1.2479722499847412e-07, 1.8533319234848022e-07, 4.954636096954346e-07, 8.055940270423889e-07, 1.1157244443893433e-06, 1.4258548617362976e-06, 1.735985279083252e-06, 2.0461156964302063e-06, 2.3562461137771606e-06, 2.666376531124115e-06, 2.9765069484710693e-06, 3.2866373658180237e-06, 3.596767783164978e-06, 3.906898200511932e-06, 4.217028617858887e-06, 4.527159035205841e-06, 4.837289452552795e-06, 5.14741986989975e-06, 5.457550287246704e-06, 5.7676807045936584e-06, 6.077811121940613e-06, 6.387941539287567e-06, 6.6980719566345215e-06, 7.008202373981476e-06, 7.31833279132843e-06, 7.6284632086753845e-06, 7.938593626022339e-06, 8.248724043369293e-06, 8.558854460716248e-06, 8.868984878063202e-06, 9.179115295410156e-06]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 3.0, 8.0, 17.0, 13.0, 22.0, 28.0, 42.0, 52.0, 96.0, 327.0, 306.0, 427.0, 643.0, 1080.0, 1814.0, 2985.0, 20842.0, 83657.0, 824379.0, 83295.0, 14970.0, 5761.0, 3028.0, 2729.0, 687.0, 413.0, 293.0, 220.0, 122.0, 92.0, 104.0, 34.0, 19.0, 8.0, 22.0, 3.0, 2.0, 10.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.562999725341797e-06, -2.495013177394867e-06, -2.427026629447937e-06, -2.359040081501007e-06, -2.291053533554077e-06, -2.2230669856071472e-06, -2.1550804376602173e-06, -2.0870938897132874e-06, -2.0191073417663574e-06, -1.9511207938194275e-06, -1.8831342458724976e-06, -1.8151476979255676e-06, -1.7471611499786377e-06, -1.6791746020317078e-06, -1.6111880540847778e-06, -1.543201506137848e-06, -1.475214958190918e-06, -1.407228410243988e-06, -1.339241862297058e-06, -1.2712553143501282e-06, -1.2032687664031982e-06, -1.1352822184562683e-06, -1.0672956705093384e-06, -9.993091225624084e-07, -9.313225746154785e-07, -8.633360266685486e-07, -7.953494787216187e-07, -7.273629307746887e-07, -6.593763828277588e-07, -5.913898348808289e-07, -5.234032869338989e-07, -4.55416738986969e-07, -3.8743019104003906e-07, -3.1944364309310913e-07, -2.514570951461792e-07, -1.8347054719924927e-07, -1.1548399925231934e-07, -4.7497451305389404e-08, 2.0489096641540527e-08, 8.847564458847046e-08, 1.564621925354004e-07, 2.2444874048233032e-07, 2.9243528842926025e-07, 3.604218363761902e-07, 4.284083843231201e-07, 4.9639493227005e-07, 5.6438148021698e-07, 6.323680281639099e-07, 7.003545761108398e-07, 7.683411240577698e-07, 8.363276720046997e-07, 9.043142199516296e-07, 9.723007678985596e-07, 1.0402873158454895e-06, 1.1082738637924194e-06, 1.1762604117393494e-06, 1.2442469596862793e-06, 1.3122335076332092e-06, 1.3802200555801392e-06, 1.448206603527069e-06, 1.516193151473999e-06, 1.584179699420929e-06, 1.6521662473678589e-06, 1.7201527953147888e-06, 1.7881393432617188e-06]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [106.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 824.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 5.0, 6.0, 2.0, 8.0, 19.0, 17.0, 19.0, 15.0, 45.0, 46.0, 59.0, 84.0, 49.0, 131.0, 206.0, 369.0, 623.0, 522.0, 1853.0, 4131.0, 10296.0, 35949.0, 94250.0, 845598.0, 35629.0, 10444.0, 4130.0, 1108.0, 1285.0, 603.0, 333.0, 211.0, 67.0, 115.0, 74.0, 69.0, 47.0, 16.0, 31.0, 27.0, 15.0, 16.0, 3.0, 11.0, 6.0, 7.0, 3.0, 0.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.2186508178710938e-06, -3.1115487217903137e-06, -3.0044466257095337e-06, -2.8973445296287537e-06, -2.7902424335479736e-06, -2.6831403374671936e-06, -2.5760382413864136e-06, -2.4689361453056335e-06, -2.3618340492248535e-06, -2.2547319531440735e-06, -2.1476298570632935e-06, -2.0405277609825134e-06, -1.9334256649017334e-06, -1.8263235688209534e-06, -1.7192214727401733e-06, -1.6121193766593933e-06, -1.5050172805786133e-06, -1.3979151844978333e-06, -1.2908130884170532e-06, -1.1837109923362732e-06, -1.0766088962554932e-06, -9.695068001747131e-07, -8.624047040939331e-07, -7.553026080131531e-07, -6.48200511932373e-07, -5.41098415851593e-07, -4.33996319770813e-07, -3.2689422369003296e-07, -2.1979212760925293e-07, -1.126900315284729e-07, -5.587935447692871e-09, 1.0151416063308716e-07, 2.086162567138672e-07, 3.157183527946472e-07, 4.2282044887542725e-07, 5.299225449562073e-07, 6.370246410369873e-07, 7.441267371177673e-07, 8.512288331985474e-07, 9.583309292793274e-07, 1.0654330253601074e-06, 1.1725351214408875e-06, 1.2796372175216675e-06, 1.3867393136024475e-06, 1.4938414096832275e-06, 1.6009435057640076e-06, 1.7080456018447876e-06, 1.8151476979255676e-06, 1.9222497940063477e-06, 2.0293518900871277e-06, 2.1364539861679077e-06, 2.2435560822486877e-06, 2.3506581783294678e-06, 2.457760274410248e-06, 2.564862370491028e-06, 2.671964466571808e-06, 2.779066562652588e-06, 2.886168658733368e-06, 2.993270754814148e-06, 3.100372850894928e-06, 3.207474946975708e-06, 3.314577043056488e-06, 3.421679139137268e-06, 3.528781235218048e-06, 3.635883331298828e-06]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 7.0, 3.0, 3.0, 9.0, 13.0, 14.0, 5.0, 21.0, 35.0, 62.0, 131.0, 546.0, 46.0, 22.0, 16.0, 20.0, 11.0, 7.0, 7.0, 5.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3709068298339844e-06, -1.3057142496109009e-06, -1.2405216693878174e-06, -1.1753290891647339e-06, -1.1101365089416504e-06, -1.044943928718567e-06, -9.797513484954834e-07, -9.145587682723999e-07, -8.493661880493164e-07, -7.841736078262329e-07, -7.189810276031494e-07, -6.537884473800659e-07, -5.885958671569824e-07, -5.234032869338989e-07, -4.5821070671081543e-07, -3.9301812648773193e-07, -3.2782554626464844e-07, -2.6263296604156494e-07, -1.9744038581848145e-07, -1.3224780559539795e-07, -6.705522537231445e-08, -1.862645149230957e-09, 6.332993507385254e-08, 1.2852251529693604e-07, 1.9371509552001953e-07, 2.5890767574310303e-07, 3.241002559661865e-07, 3.8929283618927e-07, 4.544854164123535e-07, 5.19677996635437e-07, 5.848705768585205e-07, 6.50063157081604e-07, 7.152557373046875e-07, 7.80448317527771e-07, 8.456408977508545e-07, 9.10833477973938e-07, 9.760260581970215e-07, 1.041218638420105e-06, 1.1064112186431885e-06, 1.171603798866272e-06, 1.2367963790893555e-06, 1.301988959312439e-06, 1.3671815395355225e-06, 1.432374119758606e-06, 1.4975666999816895e-06, 1.562759280204773e-06, 1.6279518604278564e-06, 1.69314444065094e-06, 1.7583370208740234e-06, 1.823529601097107e-06, 1.8887221813201904e-06, 1.953914761543274e-06, 2.0191073417663574e-06, 2.084299921989441e-06, 2.1494925022125244e-06, 2.214685082435608e-06, 2.2798776626586914e-06, 2.345070242881775e-06, 2.4102628231048584e-06, 2.475455403327942e-06, 2.5406479835510254e-06, 2.605840563774109e-06, 2.6710331439971924e-06, 2.736225724220276e-06, 2.8014183044433594e-06]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 7.0, 11.0, 14.0, 44.0, 95.0, 252.0, 329.0, 153.0, 56.0, 30.0, 11.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.629663842730224e-05, -3.4856657293858007e-05, -3.341667616041377e-05, -3.197669502696954e-05, -3.05367138935253e-05, -2.9096732760081068e-05, -2.765674980764743e-05, -2.6216768674203195e-05, -2.477678754075896e-05, -2.3336806407314725e-05, -2.189682527387049e-05, -2.0456842321436852e-05, -1.9016861187992617e-05, -1.7576880054548383e-05, -1.6136898921104148e-05, -1.4696917787659913e-05, -1.3256936654215679e-05, -1.1816955520771444e-05, -1.0376974387327209e-05, -8.936992344388273e-06, -7.497011210944038e-06, -6.057030077499803e-06, -4.617048034560867e-06, -3.177066901116632e-06, -1.7370857676723972e-06, -2.97104406854487e-07, 1.1428769539634231e-06, 2.5828585421550088e-06, 4.0228396755992435e-06, 5.462820809043478e-06, 6.902802851982415e-06, 8.34278398542665e-06, 9.782761480892077e-06, 1.1222742614336312e-05, 1.2662723747780547e-05, 1.4102705790719483e-05, 1.5542686014669016e-05, 1.698266714811325e-05, 1.842265010054689e-05, 1.9862631233991124e-05, 2.130261236743536e-05, 2.2742593500879593e-05, 2.4182574634323828e-05, 2.5622557586757466e-05, 2.70625387202017e-05, 2.8502519853645936e-05, 2.994250098709017e-05, 3.1382482120534405e-05, 3.282246325397864e-05, 3.4262444387422875e-05, 3.570242552086711e-05, 3.7142406654311344e-05, 3.858238778775558e-05, 4.0022368921199813e-05, 4.146235005464405e-05, 4.290233482606709e-05, 4.434231232153252e-05, 4.578229345497675e-05, 4.722227458842099e-05, 4.866225572186522e-05, 5.0102236855309457e-05, 5.154221798875369e-05, 5.2982199122197926e-05, 5.442218389362097e-05, 5.58621650270652e-05]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 7.0, 10.0, 6.0, 10.0, 21.0, 12.0, 22.0, 28.0, 29.0, 29.0, 39.0, 34.0, 49.0, 34.0, 52.0, 46.0, 59.0, 50.0, 48.0, 49.0, 38.0, 36.0, 36.0, 30.0, 28.0, 34.0, 22.0, 27.0, 24.0, 22.0, 11.0, 13.0, 7.0, 7.0, 10.0, 8.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.7583648514118977e-05, -1.7083897546399385e-05, -1.6584146578679793e-05, -1.60843956109602e-05, -1.5584644643240608e-05, -1.5084893675521016e-05, -1.4585141798306722e-05, -1.408539083058713e-05, -1.3585639862867538e-05, -1.3085888895147946e-05, -1.2586137927428354e-05, -1.2086386959708761e-05, -1.1586635082494467e-05, -1.1086884114774875e-05, -1.0587133147055283e-05, -1.0087382179335691e-05, -9.587631211616099e-06, -9.087880243896507e-06, -8.588129276176915e-06, -8.088378308457322e-06, -7.588626885990379e-06, -7.088875918270787e-06, -6.589124495803844e-06, -6.089373528084252e-06, -5.58962256036466e-06, -5.089871592645068e-06, -4.5901206249254756e-06, -4.0903692024585325e-06, -3.5906182347389404e-06, -3.0908672670193482e-06, -2.5911160719260806e-06, -2.091364876832813e-06, -1.5916148186079226e-06, -1.0918637372014928e-06, -5.921126557950629e-07, -9.236157438863302e-08, 4.0738950701779686e-07, 9.07140474737389e-07, 1.4068916698306566e-06, 1.9066428649239242e-06, 2.4063938326435164e-06, 2.9061448003631085e-06, 3.405895995456376e-06, 3.905647190549644e-06, 4.405398158269236e-06, 4.905149125988828e-06, 5.404900548455771e-06, 5.904651516175363e-06, 6.404402483894955e-06, 6.9041534516145475e-06, 7.40390441933414e-06, 7.903655387053732e-06, 8.403407264268026e-06, 8.903158231987618e-06, 9.40290919970721e-06, 9.902660167426802e-06, 1.0402411135146394e-05, 1.0902162102865987e-05, 1.1401913070585579e-05, 1.190166403830517e-05, 1.2401415006024763e-05, 1.2901165973744355e-05, 1.3400917850958649e-05, 1.3900668818678241e-05, 1.4400419786397833e-05]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 11.0, 11.0, 13.0, 22.0, 19.0, 31.0, 32.0, 41.0, 77.0, 83.0, 105.0, 164.0, 155.0, 249.0, 372.0, 1047318.0, 579.0, 328.0, 228.0, 161.0, 118.0, 113.0, 75.0, 64.0, 40.0, 37.0, 36.0, 30.0, 18.0, 13.0, 13.0, 7.0, 7.0, 6.0, 3.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7612808228004724e-05, -3.6504519812297076e-05, -3.539622775861062e-05, -3.4287935704924166e-05, -3.317964728921652e-05, -3.207135887350887e-05, -3.0963066819822416e-05, -2.9854776585125364e-05, -2.8746486350428313e-05, -2.763819611573126e-05, -2.652990588103421e-05, -2.542161564633716e-05, -2.4313325411640108e-05, -2.3205035176943056e-05, -2.2096744942246005e-05, -2.0988454707548954e-05, -1.9880164472851902e-05, -1.877187423815485e-05, -1.76635840034578e-05, -1.6555293768760748e-05, -1.5447003534063697e-05, -1.4338713299366646e-05, -1.3230423064669594e-05, -1.2122132829972543e-05, -1.1013842595275491e-05, -9.90555236057844e-06, -8.797262125881389e-06, -7.688971891184337e-06, -6.580681656487286e-06, -5.472391421790235e-06, -4.364101187093183e-06, -3.255810952396132e-06, -2.1475207176990807e-06, -1.0392304830020294e-06, 6.905975169502199e-08, 1.1773499863920733e-06, 2.2856402210891247e-06, 3.393930455786176e-06, 4.502220690483227e-06, 5.610510925180279e-06, 6.71880115987733e-06, 7.827091394574381e-06, 8.935381629271433e-06, 1.0043671863968484e-05, 1.1151962098665535e-05, 1.2260252333362587e-05, 1.3368542568059638e-05, 1.447683280275669e-05, 1.558512303745374e-05, 1.6693413272150792e-05, 1.7801703506847844e-05, 1.8909993741544895e-05, 2.0018283976241946e-05, 2.1126574210938998e-05, 2.223486444563605e-05, 2.33431546803331e-05, 2.445144491503015e-05, 2.5559735149727203e-05, 2.6668025384424254e-05, 2.7776315619121306e-05, 2.8884605853818357e-05, 2.999289608851541e-05, 3.110118632321246e-05, 3.2209478376898915e-05, 3.331776679260656e-05]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 20.0, 51.0, 104.0, 341.0, 982.0, 3040.0, 51459924.0, 3342.0, 1803.0, 997.0, 435.0, 159.0, 62.0, 26.0, 11.0, 13.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.851563453674316, -9.595887184143066, -9.340210914611816, -9.084534645080566, -8.828858375549316, -8.573182106018066, -8.317505836486816, -8.061829566955566, -7.806153297424316, -7.550477027893066, -7.294800758361816, -7.039124488830566, -6.783448219299316, -6.527771949768066, -6.272095680236816, -6.016419410705566, -5.760743141174316, -5.505066871643066, -5.249390602111816, -4.993714332580566, -4.738038063049316, -4.482361793518066, -4.226685523986816, -3.9710092544555664, -3.7153329849243164, -3.4596567153930664, -3.2039804458618164, -2.9483041763305664, -2.6926279067993164, -2.4369516372680664, -2.1812753677368164, -1.9255990982055664, -1.669921875, -1.41424560546875, -1.1585693359375, -0.90289306640625, -0.647216796875, -0.39154052734375, -0.1358642578125, 0.11981201171875, 0.37548828125, 0.63116455078125, 0.8868408203125, 1.14251708984375, 1.398193359375, 1.65386962890625, 1.9095458984375, 2.16522216796875, 2.4208984375, 2.67657470703125, 2.9322509765625, 3.18792724609375, 3.443603515625, 3.69927978515625, 3.9549560546875, 4.21063232421875, 4.46630859375, 4.72198486328125, 4.9776611328125, 5.23333740234375, 5.489013671875, 5.74468994140625, 6.0003662109375, 6.25604248046875, 6.51171875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 16.0, 33.0, 54.0, 63.0, 99.0, 152.0, 244.0, 372.0, 523.0, 863.0, 1253.0, 1836.0, 2908.0, 4260.0, 6285.0, 9306.0, 13701.0, 20782.0, 31121.0, 46499.0, 73075.0, 115872.0, 193398.0, 349789.0, 880165.0, 3610301.0, 376262.0, 205808.0, 121862.0, 76615.0, 49810.0, 32508.0, 21390.0, 14663.0, 9970.0, 6540.0, 4383.0, 2850.0, 1946.0, 1362.0, 885.0, 559.0, 371.0, 248.0, 157.0, 102.0, 61.0, 38.0, 29.0, 15.0, 13.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1082763671875, -0.10478973388671875, -0.1013031005859375, -0.09781646728515625, -0.094329833984375, -0.09084320068359375, -0.0873565673828125, -0.08386993408203125, -0.08038330078125, -0.07689666748046875, -0.0734100341796875, -0.06992340087890625, -0.066436767578125, -0.06295013427734375, -0.0594635009765625, -0.05597686767578125, -0.052490234375, -0.04900360107421875, -0.0455169677734375, -0.04203033447265625, -0.038543701171875, -0.03505706787109375, -0.0315704345703125, -0.02808380126953125, -0.02459716796875, -0.02111053466796875, -0.0176239013671875, -0.01413726806640625, -0.010650634765625, -0.00716400146484375, -0.0036773681640625, -0.00019073486328125, 0.0032958984375, 0.00678253173828125, 0.0102691650390625, 0.01375579833984375, 0.017242431640625, 0.02072906494140625, 0.0242156982421875, 0.02770233154296875, 0.03118896484375, 0.03467559814453125, 0.0381622314453125, 0.04164886474609375, 0.045135498046875, 0.04862213134765625, 0.0521087646484375, 0.05559539794921875, 0.05908203125, 0.06256866455078125, 0.0660552978515625, 0.06954193115234375, 0.073028564453125, 0.07651519775390625, 0.0800018310546875, 0.08348846435546875, 0.08697509765625, 0.09046173095703125, 0.0939483642578125, 0.09743499755859375, 0.100921630859375, 0.10440826416015625, 0.1078948974609375, 0.11138153076171875, 0.1148681640625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 5.0, 13.0, 5.0, 7.0, 9.0, 16.0, 22.0, 19.0, 15.0, 23.0, 14.0, 19.0, 28.0, 30.0, 34.0, 37.0, 40.0, 39.0, 41.0, 116.0, 978.0, 35.0, 38.0, 51.0, 39.0, 41.0, 31.0, 31.0, 25.0, 32.0, 26.0, 22.0, 13.0, 25.0, 13.0, 14.0, 20.0, 11.0, 11.0, 8.0, 6.0, 7.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5390625, -2.457611083984375, -2.37615966796875, -2.294708251953125, -2.2132568359375, -2.131805419921875, -2.05035400390625, -1.968902587890625, -1.887451171875, -1.805999755859375, -1.72454833984375, -1.643096923828125, -1.5616455078125, -1.480194091796875, -1.39874267578125, -1.317291259765625, -1.23583984375, -1.154388427734375, -1.07293701171875, -0.991485595703125, -0.9100341796875, -0.828582763671875, -0.74713134765625, -0.665679931640625, -0.584228515625, -0.502777099609375, -0.42132568359375, -0.339874267578125, -0.2584228515625, -0.176971435546875, -0.09552001953125, -0.014068603515625, 0.0673828125, 0.148834228515625, 0.23028564453125, 0.311737060546875, 0.3931884765625, 0.474639892578125, 0.55609130859375, 0.637542724609375, 0.718994140625, 0.800445556640625, 0.88189697265625, 0.963348388671875, 1.0447998046875, 1.126251220703125, 1.20770263671875, 1.289154052734375, 1.37060546875, 1.452056884765625, 1.53350830078125, 1.614959716796875, 1.6964111328125, 1.777862548828125, 1.85931396484375, 1.940765380859375, 2.022216796875, 2.103668212890625, 2.18511962890625, 2.266571044921875, 2.3480224609375, 2.429473876953125, 2.51092529296875, 2.592376708984375, 2.673828125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 7.0, 4.0, 10.0, 13.0, 17.0, 27.0, 26.0, 35.0, 63.0, 108.0, 181.0, 285.0, 462.0, 688.0, 1047.0, 1620.0, 2481.0, 3679.0, 6094.0, 9399.0, 15063.0, 24167.0, 38842.0, 63456.0, 106020.0, 184306.0, 342401.0, 614547.0, 3839323.0, 452618.0, 241661.0, 134944.0, 79458.0, 47745.0, 29737.0, 18526.0, 11820.0, 7387.0, 4695.0, 3002.0, 1938.0, 1245.0, 855.0, 507.0, 354.0, 211.0, 124.0, 79.0, 58.0, 33.0, 37.0, 11.0, 8.0, 9.0, 7.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.0919189453125, -0.0889749526977539, -0.08603096008300781, -0.08308696746826172, -0.08014297485351562, -0.07719898223876953, -0.07425498962402344, -0.07131099700927734, -0.06836700439453125, -0.06542301177978516, -0.06247901916503906, -0.05953502655029297, -0.056591033935546875, -0.05364704132080078, -0.05070304870605469, -0.047759056091308594, -0.0448150634765625, -0.041871070861816406, -0.03892707824707031, -0.03598308563232422, -0.033039093017578125, -0.03009510040283203, -0.027151107788085938, -0.024207115173339844, -0.02126312255859375, -0.018319129943847656, -0.015375137329101562, -0.012431144714355469, -0.009487152099609375, -0.006543159484863281, -0.0035991668701171875, -0.0006551742553710938, 0.002288818359375, 0.005232810974121094, 0.008176803588867188, 0.011120796203613281, 0.014064788818359375, 0.01700878143310547, 0.019952774047851562, 0.022896766662597656, 0.02584075927734375, 0.028784751892089844, 0.03172874450683594, 0.03467273712158203, 0.037616729736328125, 0.04056072235107422, 0.04350471496582031, 0.046448707580566406, 0.0493927001953125, 0.052336692810058594, 0.05528068542480469, 0.05822467803955078, 0.061168670654296875, 0.06411266326904297, 0.06705665588378906, 0.07000064849853516, 0.07294464111328125, 0.07588863372802734, 0.07883262634277344, 0.08177661895751953, 0.08472061157226562, 0.08766460418701172, 0.09060859680175781, 0.0935525894165039, 0.09649658203125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 0.0, 5.0, 3.0, 7.0, 2.0, 5.0, 9.0, 10.0, 12.0, 11.0, 17.0, 25.0, 16.0, 18.0, 19.0, 21.0, 20.0, 21.0, 27.0, 35.0, 32.0, 38.0, 48.0, 38.0, 48.0, 1047.0, 46.0, 41.0, 41.0, 34.0, 41.0, 32.0, 30.0, 29.0, 25.0, 23.0, 31.0, 18.0, 21.0, 15.0, 18.0, 11.0, 6.0, 4.0, 10.0, 6.0, 0.0, 2.0, 7.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.8984375, -1.8397369384765625, -1.781036376953125, -1.7223358154296875, -1.66363525390625, -1.6049346923828125, -1.546234130859375, -1.4875335693359375, -1.4288330078125, -1.3701324462890625, -1.311431884765625, -1.2527313232421875, -1.19403076171875, -1.1353302001953125, -1.076629638671875, -1.0179290771484375, -0.959228515625, -0.9005279541015625, -0.841827392578125, -0.7831268310546875, -0.72442626953125, -0.6657257080078125, -0.607025146484375, -0.5483245849609375, -0.4896240234375, -0.4309234619140625, -0.372222900390625, -0.3135223388671875, -0.25482177734375, -0.1961212158203125, -0.137420654296875, -0.0787200927734375, -0.02001953125, 0.0386810302734375, 0.097381591796875, 0.1560821533203125, 0.21478271484375, 0.2734832763671875, 0.332183837890625, 0.3908843994140625, 0.4495849609375, 0.5082855224609375, 0.566986083984375, 0.6256866455078125, 0.68438720703125, 0.7430877685546875, 0.801788330078125, 0.8604888916015625, 0.919189453125, 0.9778900146484375, 1.036590576171875, 1.0952911376953125, 1.15399169921875, 1.2126922607421875, 1.271392822265625, 1.3300933837890625, 1.3887939453125, 1.4474945068359375, 1.506195068359375, 1.5648956298828125, 1.62359619140625, 1.6822967529296875, 1.740997314453125, 1.7996978759765625, 1.8583984375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 14.0, 17.0, 32.0, 51.0, 49.0, 85.0, 113.0, 194.0, 295.0, 467.0, 695.0, 1094.0, 1818.0, 2855.0, 5048.0, 8801.0, 15731.0, 29550.0, 56309.0, 115183.0, 259500.0, 655422.0, 4204904.0, 524360.0, 210615.0, 95247.0, 46618.0, 24346.0, 13145.0, 7561.0, 4305.0, 2588.0, 1650.0, 999.0, 607.0, 410.0, 238.0, 172.0, 121.0, 75.0, 54.0, 31.0, 23.0, 13.0, 8.0, 8.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.129638671875, -0.12575531005859375, -0.1218719482421875, -0.11798858642578125, -0.114105224609375, -0.11022186279296875, -0.1063385009765625, -0.10245513916015625, -0.09857177734375, -0.09468841552734375, -0.0908050537109375, -0.08692169189453125, -0.083038330078125, -0.07915496826171875, -0.0752716064453125, -0.07138824462890625, -0.0675048828125, -0.06362152099609375, -0.0597381591796875, -0.05585479736328125, -0.051971435546875, -0.04808807373046875, -0.0442047119140625, -0.04032135009765625, -0.03643798828125, -0.03255462646484375, -0.0286712646484375, -0.02478790283203125, -0.020904541015625, -0.01702117919921875, -0.0131378173828125, -0.00925445556640625, -0.00537109375, -0.00148773193359375, 0.0023956298828125, 0.00627899169921875, 0.010162353515625, 0.01404571533203125, 0.0179290771484375, 0.02181243896484375, 0.02569580078125, 0.02957916259765625, 0.0334625244140625, 0.03734588623046875, 0.041229248046875, 0.04511260986328125, 0.0489959716796875, 0.05287933349609375, 0.0567626953125, 0.06064605712890625, 0.0645294189453125, 0.06841278076171875, 0.072296142578125, 0.07617950439453125, 0.0800628662109375, 0.08394622802734375, 0.08782958984375, 0.09171295166015625, 0.0955963134765625, 0.09947967529296875, 0.103363037109375, 0.10724639892578125, 0.1111297607421875, 0.11501312255859375, 0.118896484375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 9.0, 4.0, 4.0, 11.0, 8.0, 20.0, 16.0, 20.0, 11.0, 22.0, 21.0, 26.0, 37.0, 39.0, 40.0, 44.0, 31.0, 45.0, 42.0, 62.0, 1046.0, 45.0, 43.0, 44.0, 56.0, 34.0, 40.0, 31.0, 34.0, 24.0, 21.0, 21.0, 23.0, 6.0, 9.0, 9.0, 6.0, 11.0, 2.0, 8.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.896484375, -1.8427734375, -1.7890625, -1.7353515625, -1.681640625, -1.6279296875, -1.57421875, -1.5205078125, -1.466796875, -1.4130859375, -1.359375, -1.3056640625, -1.251953125, -1.1982421875, -1.14453125, -1.0908203125, -1.037109375, -0.9833984375, -0.9296875, -0.8759765625, -0.822265625, -0.7685546875, -0.71484375, -0.6611328125, -0.607421875, -0.5537109375, -0.5, -0.4462890625, -0.392578125, -0.3388671875, -0.28515625, -0.2314453125, -0.177734375, -0.1240234375, -0.0703125, -0.0166015625, 0.037109375, 0.0908203125, 0.14453125, 0.1982421875, 0.251953125, 0.3056640625, 0.359375, 0.4130859375, 0.466796875, 0.5205078125, 0.57421875, 0.6279296875, 0.681640625, 0.7353515625, 0.7890625, 0.8427734375, 0.896484375, 0.9501953125, 1.00390625, 1.0576171875, 1.111328125, 1.1650390625, 1.21875, 1.2724609375, 1.326171875, 1.3798828125, 1.43359375, 1.4873046875, 1.541015625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.0, 861.0, 128.0, 6.0, 0.0, 1.0], "bins": [-21.138080596923828, -20.783517837524414, -20.428955078125, -20.074390411376953, -19.71982765197754, -19.365264892578125, -19.01070213317871, -18.656139373779297, -18.30157470703125, -17.947011947631836, -17.592449188232422, -17.237884521484375, -16.88332176208496, -16.528759002685547, -16.174196243286133, -15.819632530212402, -15.465070724487305, -15.11050796508789, -14.75594425201416, -14.401381492614746, -14.046817779541016, -13.692255020141602, -13.337692260742188, -12.983128547668457, -12.628564834594727, -12.274002075195312, -11.919438362121582, -11.564875602722168, -11.210311889648438, -10.855749130249023, -10.50118637084961, -10.146622657775879, -9.792058944702148, -9.437496185302734, -9.082932472229004, -8.72836971282959, -8.37380599975586, -8.019243240356445, -7.664680004119873, -7.310116767883301, -6.955554008483887, -6.6009907722473145, -6.246427536010742, -5.891864776611328, -5.537301540374756, -5.182738304138184, -4.828175067901611, -4.473611831665039, -4.119049072265625, -3.7644858360290527, -3.4099228382110596, -3.0553596019744873, -2.700796604156494, -2.346233367919922, -1.9916701316833496, -1.6371071338653564, -1.282543659210205, -0.9279805421829224, -0.5734173655509949, -0.21885418891906738, 0.13570892810821533, 0.49027204513549805, 0.8448352813720703, 1.1993982791900635, 1.5539615154266357]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 9.0, 8.0, 14.0, 19.0, 15.0, 17.0, 27.0, 18.0, 23.0, 34.0, 33.0, 35.0, 27.0, 45.0, 43.0, 38.0, 36.0, 43.0, 41.0, 44.0, 49.0, 29.0, 45.0, 30.0, 28.0, 23.0, 36.0, 39.0, 25.0, 24.0, 14.0, 21.0, 14.0, 10.0, 7.0, 7.0, 8.0, 2.0, 6.0, 6.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.268061637878418, -2.1805877685546875, -2.093113660812378, -2.0056397914886475, -1.918165922164917, -1.830691933631897, -1.743217945098877, -1.6557440757751465, -1.568270206451416, -1.480796217918396, -1.3933223485946655, -1.3058483600616455, -1.218374490737915, -1.130900502204895, -1.043426513671875, -0.9559526443481445, -0.8684786558151245, -0.7810047268867493, -0.693530797958374, -0.606056809425354, -0.5185829401016235, -0.4311089813709259, -0.34363502264022827, -0.256161093711853, -0.16868716478347778, -0.08121322840452194, 0.006260707974433899, 0.09373465180397034, 0.18120858073234558, 0.2686825096607208, 0.35615646839141846, 0.4436303973197937, 0.531104326248169, 0.6185782551765442, 0.7060521841049194, 0.7935261726379395, 0.8810000419616699, 0.9684740304946899, 1.05594801902771, 1.1434218883514404, 1.230895757675171, 1.318369746208191, 1.4058436155319214, 1.4933176040649414, 1.5807914733886719, 1.668265461921692, 1.755739450454712, 1.8432133197784424, 1.9306873083114624, 2.0181612968444824, 2.105635166168213, 2.1931090354919434, 2.280583143234253, 2.3680570125579834, 2.455530881881714, 2.5430049896240234, 2.630478858947754, 2.7179527282714844, 2.805426836013794, 2.8929007053375244, 2.980374574661255, 3.0678484439849854, 3.155322551727295, 3.2427964210510254, 3.330270290374756]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 8.0, 9.0, 22.0, 23.0, 51.0, 75.0, 108.0, 138.0, 215.0, 360.0, 743.0, 1819.0, 4471.0, 9631.0, 22503.0, 63146.0, 1254568.0, 2722289.0, 67651.0, 25185.0, 10620.0, 4887.0, 2499.0, 1316.0, 805.0, 451.0, 274.0, 165.0, 91.0, 45.0, 32.0, 18.0, 14.0, 8.0, 2.0, 14.0, 3.0, 4.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.050079345703125, -0.04851722717285156, -0.046955108642578125, -0.04539299011230469, -0.04383087158203125, -0.04226875305175781, -0.040706634521484375, -0.03914451599121094, -0.0375823974609375, -0.03602027893066406, -0.034458160400390625, -0.03289604187011719, -0.03133392333984375, -0.029771804809570312, -0.028209686279296875, -0.026647567749023438, -0.02508544921875, -0.023523330688476562, -0.021961212158203125, -0.020399093627929688, -0.01883697509765625, -0.017274856567382812, -0.015712738037109375, -0.014150619506835938, -0.0125885009765625, -0.011026382446289062, -0.009464263916015625, -0.007902145385742188, -0.00634002685546875, -0.0047779083251953125, -0.003215789794921875, -0.0016536712646484375, -9.1552734375e-05, 0.0014705657958984375, 0.003032684326171875, 0.0045948028564453125, 0.00615692138671875, 0.0077190399169921875, 0.009281158447265625, 0.010843276977539062, 0.0124053955078125, 0.013967514038085938, 0.015529632568359375, 0.017091751098632812, 0.01865386962890625, 0.020215988159179688, 0.021778106689453125, 0.023340225219726562, 0.02490234375, 0.026464462280273438, 0.028026580810546875, 0.029588699340820312, 0.03115081787109375, 0.03271293640136719, 0.034275054931640625, 0.03583717346191406, 0.0373992919921875, 0.03896141052246094, 0.040523529052734375, 0.04208564758300781, 0.04364776611328125, 0.04520988464355469, 0.046772003173828125, 0.04833412170410156, 0.049896240234375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 8.0, 15.0, 12.0, 17.0, 12.0, 21.0, 20.0, 42.0, 45.0, 41.0, 75.0, 54.0, 67.0, 67.0, 66.0, 59.0, 57.0, 47.0, 47.0, 45.0, 34.0, 28.0, 26.0, 13.0, 21.0, 9.0, 9.0, 8.0, 5.0, 5.0, 5.0, 2.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.008636474609375, -0.008367776870727539, -0.008099079132080078, -0.007830381393432617, -0.007561683654785156, -0.007292985916137695, -0.007024288177490234, -0.0067555904388427734, -0.0064868927001953125, -0.0062181949615478516, -0.005949497222900391, -0.00568079948425293, -0.005412101745605469, -0.005143404006958008, -0.004874706268310547, -0.004606008529663086, -0.004337310791015625, -0.004068613052368164, -0.003799915313720703, -0.003531217575073242, -0.0032625198364257812, -0.0029938220977783203, -0.0027251243591308594, -0.0024564266204833984, -0.0021877288818359375, -0.0019190311431884766, -0.0016503334045410156, -0.0013816356658935547, -0.0011129379272460938, -0.0008442401885986328, -0.0005755424499511719, -0.00030684471130371094, -3.814697265625e-05, 0.00023055076599121094, 0.0004992485046386719, 0.0007679462432861328, 0.0010366439819335938, 0.0013053417205810547, 0.0015740394592285156, 0.0018427371978759766, 0.0021114349365234375, 0.0023801326751708984, 0.0026488304138183594, 0.0029175281524658203, 0.0031862258911132812, 0.003454923629760742, 0.003723621368408203, 0.003992319107055664, 0.004261016845703125, 0.004529714584350586, 0.004798412322998047, 0.005067110061645508, 0.005335807800292969, 0.00560450553894043, 0.005873203277587891, 0.0061419010162353516, 0.0064105987548828125, 0.0066792964935302734, 0.006947994232177734, 0.007216691970825195, 0.007485389709472656, 0.007754087448120117, 0.008022785186767578, 0.008291482925415039, 0.0085601806640625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 6.0, 2.0, 6.0, 7.0, 6.0, 11.0, 19.0, 26.0, 30.0, 50.0, 104.0, 319.0, 26122.0, 4164653.0, 2306.0, 154.0, 104.0, 66.0, 51.0, 45.0, 34.0, 21.0, 17.0, 19.0, 13.0, 19.0, 11.0, 8.0, 7.0, 7.0, 5.0, 6.0, 4.0, 5.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0894775390625, -0.08661746978759766, -0.08375740051269531, -0.08089733123779297, -0.07803726196289062, -0.07517719268798828, -0.07231712341308594, -0.0694570541381836, -0.06659698486328125, -0.0637369155883789, -0.06087684631347656, -0.05801677703857422, -0.055156707763671875, -0.05229663848876953, -0.04943656921386719, -0.046576499938964844, -0.0437164306640625, -0.040856361389160156, -0.03799629211425781, -0.03513622283935547, -0.032276153564453125, -0.02941608428955078, -0.026556015014648438, -0.023695945739746094, -0.02083587646484375, -0.017975807189941406, -0.015115737915039062, -0.012255668640136719, -0.009395599365234375, -0.006535530090332031, -0.0036754608154296875, -0.0008153915405273438, 0.002044677734375, 0.004904747009277344, 0.0077648162841796875, 0.010624885559082031, 0.013484954833984375, 0.01634502410888672, 0.019205093383789062, 0.022065162658691406, 0.02492523193359375, 0.027785301208496094, 0.030645370483398438, 0.03350543975830078, 0.036365509033203125, 0.03922557830810547, 0.04208564758300781, 0.044945716857910156, 0.0478057861328125, 0.050665855407714844, 0.05352592468261719, 0.05638599395751953, 0.059246063232421875, 0.06210613250732422, 0.06496620178222656, 0.0678262710571289, 0.07068634033203125, 0.0735464096069336, 0.07640647888183594, 0.07926654815673828, 0.08212661743164062, 0.08498668670654297, 0.08784675598144531, 0.09070682525634766, 0.09356689453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 5.0, 3.0, 7.0, 4.0, 7.0, 7.0, 8.0, 13.0, 17.0, 16.0, 17.0, 19.0, 26.0, 34.0, 43.0, 52.0, 71.0, 107.0, 166.0, 580.0, 1805.0, 614.0, 189.0, 89.0, 46.0, 33.0, 22.0, 18.0, 11.0, 5.0, 8.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017730712890625, -0.01718616485595703, -0.016641616821289062, -0.016097068786621094, -0.015552520751953125, -0.015007972717285156, -0.014463424682617188, -0.013918876647949219, -0.01337432861328125, -0.012829780578613281, -0.012285232543945312, -0.011740684509277344, -0.011196136474609375, -0.010651588439941406, -0.010107040405273438, -0.009562492370605469, -0.0090179443359375, -0.008473396301269531, -0.007928848266601562, -0.007384300231933594, -0.006839752197265625, -0.006295204162597656, -0.0057506561279296875, -0.005206108093261719, -0.00466156005859375, -0.004117012023925781, -0.0035724639892578125, -0.0030279159545898438, -0.002483367919921875, -0.0019388198852539062, -0.0013942718505859375, -0.0008497238159179688, -0.00030517578125, 0.00023937225341796875, 0.0007839202880859375, 0.0013284683227539062, 0.001873016357421875, 0.0024175643920898438, 0.0029621124267578125, 0.0035066604614257812, 0.00405120849609375, 0.004595756530761719, 0.0051403045654296875, 0.005684852600097656, 0.006229400634765625, 0.006773948669433594, 0.0073184967041015625, 0.007863044738769531, 0.0084075927734375, 0.008952140808105469, 0.009496688842773438, 0.010041236877441406, 0.010585784912109375, 0.011130332946777344, 0.011674880981445312, 0.012219429016113281, 0.01276397705078125, 0.013308525085449219, 0.013853073120117188, 0.014397621154785156, 0.014942169189453125, 0.015486717224121094, 0.016031265258789062, 0.01657581329345703, 0.017120361328125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 303.0, 720.0], "bins": [-3.795872449874878, -3.735629081726074, -3.6753857135772705, -3.615142345428467, -3.554898738861084, -3.4946553707122803, -3.4344120025634766, -3.374168634414673, -3.313925266265869, -3.2536818981170654, -3.1934385299682617, -3.133194923400879, -3.072951555252075, -3.0127081871032715, -2.9524648189544678, -2.892221450805664, -2.8319778442382812, -2.7717344760894775, -2.711491107940674, -2.651247501373291, -2.5910041332244873, -2.5307607650756836, -2.47051739692688, -2.410274028778076, -2.3500306606292725, -2.2897872924804688, -2.229543924331665, -2.1693005561828613, -2.1090569496154785, -2.048813581466675, -1.988570213317871, -1.9283268451690674, -1.8680833578109741, -1.8078399896621704, -1.7475965023040771, -1.6873531341552734, -1.6271097660064697, -1.566866397857666, -1.5066229104995728, -1.446379542350769, -1.3861361742019653, -1.3258928060531616, -1.2656493186950684, -1.2054059505462646, -1.145162582397461, -1.0849192142486572, -1.024675726890564, -0.9644323587417603, -0.904188871383667, -0.8439454436302185, -0.7837020754814148, -0.7234586477279663, -0.6632152795791626, -0.6029718518257141, -0.5427284240722656, -0.4824850261211395, -0.4222416579723358, -0.3619982600212097, -0.30175483226776123, -0.24151143431663513, -0.18126803636550903, -0.12102463841438293, -0.06078121066093445, -0.0005378127098083496, 0.05970558896660805]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 9.0, 8.0, 11.0, 17.0, 21.0, 26.0, 39.0, 57.0, 76.0, 79.0, 67.0, 77.0, 86.0, 69.0, 71.0, 79.0, 60.0, 46.0, 32.0, 25.0, 22.0, 15.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1879231333732605, -0.18307442963123322, -0.17822571098804474, -0.17337700724601746, -0.16852828860282898, -0.1636795848608017, -0.15883088111877441, -0.15398216247558594, -0.14913345873355865, -0.14428475499153137, -0.1394360363483429, -0.1345873326063156, -0.12973862886428833, -0.12488991022109985, -0.12004120647907257, -0.11519249528646469, -0.11034378409385681, -0.10549507290124893, -0.10064636170864105, -0.09579765796661377, -0.09094894677400589, -0.08610023558139801, -0.08125153183937073, -0.07640282064676285, -0.07155410945415497, -0.06670539826154709, -0.06185669079422951, -0.057007983326911926, -0.05215927213430405, -0.04731056094169617, -0.042461853474378586, -0.037613146007061005, -0.032764434814453125, -0.027915725484490395, -0.023067016154527664, -0.018218306824564934, -0.013369597494602203, -0.008520888164639473, -0.0036721788346767426, 0.0011765286326408386, 0.006025239825248718, 0.010873949155211449, 0.01572265848517418, 0.02057136781513691, 0.02542007714509964, 0.03026878647506237, 0.0351174958050251, 0.03996620327234268, 0.04481491446495056, 0.04966362565755844, 0.05451233312487602, 0.059361040592193604, 0.06420975178480148, 0.06905846297740936, 0.07390716671943665, 0.07875587791204453, 0.0836045891046524, 0.08845330029726028, 0.09330201148986816, 0.09815071523189545, 0.10299942642450333, 0.1078481376171112, 0.11269684135913849, 0.11754555255174637, 0.12239426374435425]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 13.0, 9.0, 20.0, 30.0, 26.0, 27.0, 58.0, 56.0, 118.0, 146.0, 225.0, 353.0, 619.0, 1131.0, 1986.0, 4034.0, 9568.0, 29767.0, 633897.0, 322901.0, 26118.0, 8862.0, 3849.0, 1982.0, 1028.0, 611.0, 394.0, 251.0, 154.0, 94.0, 77.0, 35.0, 40.0, 19.0, 15.0, 5.0, 13.0, 4.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.190185546875, -0.18404197692871094, -0.17789840698242188, -0.1717548370361328, -0.16561126708984375, -0.1594676971435547, -0.15332412719726562, -0.14718055725097656, -0.1410369873046875, -0.13489341735839844, -0.12874984741210938, -0.12260627746582031, -0.11646270751953125, -0.11031913757324219, -0.10417556762695312, -0.09803199768066406, -0.091888427734375, -0.08574485778808594, -0.07960128784179688, -0.07345771789550781, -0.06731414794921875, -0.06117057800292969, -0.055027008056640625, -0.04888343811035156, -0.0427398681640625, -0.03659629821777344, -0.030452728271484375, -0.024309158325195312, -0.01816558837890625, -0.012022018432617188, -0.005878448486328125, 0.0002651214599609375, 0.00640869140625, 0.012552261352539062, 0.018695831298828125, 0.024839401245117188, 0.03098297119140625, 0.03712654113769531, 0.043270111083984375, 0.04941368103027344, 0.0555572509765625, 0.06170082092285156, 0.06784439086914062, 0.07398796081542969, 0.08013153076171875, 0.08627510070800781, 0.09241867065429688, 0.09856224060058594, 0.104705810546875, 0.11084938049316406, 0.11699295043945312, 0.12313652038574219, 0.12928009033203125, 0.1354236602783203, 0.14156723022460938, 0.14771080017089844, 0.1538543701171875, 0.15999794006347656, 0.16614151000976562, 0.1722850799560547, 0.17842864990234375, 0.1845722198486328, 0.19071578979492188, 0.19685935974121094, 0.2030029296875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 11.0, 7.0, 13.0, 9.0, 19.0, 18.0, 15.0, 24.0, 35.0, 42.0, 42.0, 59.0, 64.0, 60.0, 68.0, 72.0, 55.0, 55.0, 52.0, 59.0, 35.0, 27.0, 28.0, 30.0, 21.0, 21.0, 12.0, 14.0, 10.0, 2.0, 4.0, 4.0, 5.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0087127685546875, -0.00845193862915039, -0.008191108703613281, -0.007930278778076172, -0.0076694488525390625, -0.007408618927001953, -0.007147789001464844, -0.006886959075927734, -0.006626129150390625, -0.006365299224853516, -0.006104469299316406, -0.005843639373779297, -0.0055828094482421875, -0.005321979522705078, -0.005061149597167969, -0.004800319671630859, -0.00453948974609375, -0.004278659820556641, -0.004017829895019531, -0.003756999969482422, -0.0034961700439453125, -0.003235340118408203, -0.0029745101928710938, -0.0027136802673339844, -0.002452850341796875, -0.0021920204162597656, -0.0019311904907226562, -0.0016703605651855469, -0.0014095306396484375, -0.0011487007141113281, -0.0008878707885742188, -0.0006270408630371094, -0.0003662109375, -0.00010538101196289062, 0.00015544891357421875, 0.0004162788391113281, 0.0006771087646484375, 0.0009379386901855469, 0.0011987686157226562, 0.0014595985412597656, 0.001720428466796875, 0.0019812583923339844, 0.0022420883178710938, 0.002502918243408203, 0.0027637481689453125, 0.003024578094482422, 0.0032854080200195312, 0.0035462379455566406, 0.00380706787109375, 0.004067897796630859, 0.004328727722167969, 0.004589557647705078, 0.0048503875732421875, 0.005111217498779297, 0.005372047424316406, 0.005632877349853516, 0.005893707275390625, 0.006154537200927734, 0.006415367126464844, 0.006676197052001953, 0.0069370269775390625, 0.007197856903076172, 0.007458686828613281, 0.007719516754150391, 0.0079803466796875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 6.0, 9.0, 7.0, 9.0, 9.0, 16.0, 15.0, 15.0, 25.0, 43.0, 54.0, 77.0, 83.0, 136.0, 192.0, 268.0, 421.0, 619.0, 1027.0, 1695.0, 2983.0, 5656.0, 12225.0, 30611.0, 101379.0, 583272.0, 219081.0, 52157.0, 18333.0, 8140.0, 4050.0, 2155.0, 1311.0, 796.0, 509.0, 362.0, 228.0, 160.0, 95.0, 74.0, 54.0, 36.0, 27.0, 25.0, 23.0, 21.0, 17.0, 11.0, 13.0, 9.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0], "bins": [-0.02911376953125, -0.02819657325744629, -0.027279376983642578, -0.026362180709838867, -0.025444984436035156, -0.024527788162231445, -0.023610591888427734, -0.022693395614624023, -0.021776199340820312, -0.0208590030670166, -0.01994180679321289, -0.01902461051940918, -0.01810741424560547, -0.017190217971801758, -0.016273021697998047, -0.015355825424194336, -0.014438629150390625, -0.013521432876586914, -0.012604236602783203, -0.011687040328979492, -0.010769844055175781, -0.00985264778137207, -0.00893545150756836, -0.008018255233764648, -0.0071010589599609375, -0.0061838626861572266, -0.005266666412353516, -0.004349470138549805, -0.0034322738647460938, -0.002515077590942383, -0.0015978813171386719, -0.0006806850433349609, 0.00023651123046875, 0.001153707504272461, 0.002070903778076172, 0.002988100051879883, 0.0039052963256835938, 0.004822492599487305, 0.005739688873291016, 0.0066568851470947266, 0.0075740814208984375, 0.008491277694702148, 0.00940847396850586, 0.01032567024230957, 0.011242866516113281, 0.012160062789916992, 0.013077259063720703, 0.013994455337524414, 0.014911651611328125, 0.015828847885131836, 0.016746044158935547, 0.017663240432739258, 0.01858043670654297, 0.01949763298034668, 0.02041482925415039, 0.0213320255279541, 0.022249221801757812, 0.023166418075561523, 0.024083614349365234, 0.025000810623168945, 0.025918006896972656, 0.026835203170776367, 0.027752399444580078, 0.02866959571838379, 0.0295867919921875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 10.0, 11.0, 9.0, 8.0, 12.0, 13.0, 13.0, 19.0, 12.0, 28.0, 28.0, 26.0, 36.0, 31.0, 28.0, 32.0, 33.0, 28.0, 47.0, 40.0, 40.0, 38.0, 51.0, 39.0, 32.0, 30.0, 39.0, 29.0, 33.0, 20.0, 21.0, 28.0, 21.0, 9.0, 19.0, 15.0, 12.0, 9.0, 7.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0], "bins": [-0.0167083740234375, -0.016185998916625977, -0.015663623809814453, -0.01514124870300293, -0.014618873596191406, -0.014096498489379883, -0.01357412338256836, -0.013051748275756836, -0.012529373168945312, -0.012006998062133789, -0.011484622955322266, -0.010962247848510742, -0.010439872741699219, -0.009917497634887695, -0.009395122528076172, -0.008872747421264648, -0.008350372314453125, -0.007827997207641602, -0.007305622100830078, -0.006783246994018555, -0.006260871887207031, -0.005738496780395508, -0.005216121673583984, -0.004693746566772461, -0.0041713714599609375, -0.003648996353149414, -0.0031266212463378906, -0.002604246139526367, -0.0020818710327148438, -0.0015594959259033203, -0.0010371208190917969, -0.0005147457122802734, 7.62939453125e-06, 0.0005300045013427734, 0.0010523796081542969, 0.0015747547149658203, 0.0020971298217773438, 0.002619504928588867, 0.0031418800354003906, 0.003664255142211914, 0.0041866302490234375, 0.004709005355834961, 0.005231380462646484, 0.005753755569458008, 0.006276130676269531, 0.006798505783081055, 0.007320880889892578, 0.007843255996704102, 0.008365631103515625, 0.008888006210327148, 0.009410381317138672, 0.009932756423950195, 0.010455131530761719, 0.010977506637573242, 0.011499881744384766, 0.012022256851196289, 0.012544631958007812, 0.013067007064819336, 0.01358938217163086, 0.014111757278442383, 0.014634132385253906, 0.01515650749206543, 0.015678882598876953, 0.016201257705688477, 0.0167236328125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 7.0, 16.0, 17.0, 31.0, 51.0, 67.0, 111.0, 171.0, 291.0, 537.0, 1057.0, 2424.0, 6497.0, 25420.0, 528237.0, 447823.0, 24597.0, 6493.0, 2393.0, 1019.0, 529.0, 296.0, 174.0, 90.0, 57.0, 35.0, 31.0, 16.0, 21.0, 9.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00916290283203125, -0.008857369422912598, -0.008551836013793945, -0.008246302604675293, -0.00794076919555664, -0.007635235786437988, -0.007329702377319336, -0.007024168968200684, -0.006718635559082031, -0.006413102149963379, -0.0061075687408447266, -0.005802035331726074, -0.005496501922607422, -0.0051909685134887695, -0.004885435104370117, -0.004579901695251465, -0.0042743682861328125, -0.00396883487701416, -0.003663301467895508, -0.0033577680587768555, -0.003052234649658203, -0.0027467012405395508, -0.0024411678314208984, -0.002135634422302246, -0.0018301010131835938, -0.0015245676040649414, -0.001219034194946289, -0.0009135007858276367, -0.0006079673767089844, -0.00030243396759033203, 3.0994415283203125e-06, 0.00030863285064697266, 0.000614166259765625, 0.0009196996688842773, 0.0012252330780029297, 0.001530766487121582, 0.0018362998962402344, 0.0021418333053588867, 0.002447366714477539, 0.0027529001235961914, 0.0030584335327148438, 0.003363966941833496, 0.0036695003509521484, 0.003975033760070801, 0.004280567169189453, 0.0045861005783081055, 0.004891633987426758, 0.00519716739654541, 0.0055027008056640625, 0.005808234214782715, 0.006113767623901367, 0.0064193010330200195, 0.006724834442138672, 0.007030367851257324, 0.0073359012603759766, 0.007641434669494629, 0.007946968078613281, 0.008252501487731934, 0.008558034896850586, 0.008863568305969238, 0.00916910171508789, 0.009474635124206543, 0.009780168533325195, 0.010085701942443848, 0.0103912353515625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 7.0, 7.0, 3.0, 8.0, 21.0, 8.0, 15.0, 32.0, 20.0, 26.0, 106.0, 67.0, 72.0, 130.0, 66.0, 61.0, 99.0, 44.0, 33.0, 67.0, 16.0, 11.0, 26.0, 7.0, 5.0, 9.0, 3.0, 4.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.682209014892578e-06, -2.6030465960502625e-06, -2.5238841772079468e-06, -2.444721758365631e-06, -2.3655593395233154e-06, -2.2863969206809998e-06, -2.207234501838684e-06, -2.1280720829963684e-06, -2.0489096641540527e-06, -1.969747245311737e-06, -1.8905848264694214e-06, -1.8114224076271057e-06, -1.73225998878479e-06, -1.6530975699424744e-06, -1.5739351511001587e-06, -1.494772732257843e-06, -1.4156103134155273e-06, -1.3364478945732117e-06, -1.257285475730896e-06, -1.1781230568885803e-06, -1.0989606380462646e-06, -1.019798219203949e-06, -9.406358003616333e-07, -8.614733815193176e-07, -7.82310962677002e-07, -7.031485438346863e-07, -6.239861249923706e-07, -5.448237061500549e-07, -4.6566128730773926e-07, -3.864988684654236e-07, -3.073364496231079e-07, -2.2817403078079224e-07, -1.4901161193847656e-07, -6.984919309616089e-08, 9.313225746154785e-09, 8.847564458847046e-08, 1.6763806343078613e-07, 2.468004822731018e-07, 3.259629011154175e-07, 4.0512531995773315e-07, 4.842877388000488e-07, 5.634501576423645e-07, 6.426125764846802e-07, 7.217749953269958e-07, 8.009374141693115e-07, 8.800998330116272e-07, 9.592622518539429e-07, 1.0384246706962585e-06, 1.1175870895385742e-06, 1.1967495083808899e-06, 1.2759119272232056e-06, 1.3550743460655212e-06, 1.434236764907837e-06, 1.5133991837501526e-06, 1.5925616025924683e-06, 1.671724021434784e-06, 1.7508864402770996e-06, 1.8300488591194153e-06, 1.909211277961731e-06, 1.9883736968040466e-06, 2.0675361156463623e-06, 2.146698534488678e-06, 2.2258609533309937e-06, 2.3050233721733093e-06, 2.384185791015625e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 9.0, 12.0, 17.0, 22.0, 38.0, 175.0, 567.0, 2761.0, 31712.0, 999952.0, 11144.0, 1578.0, 369.0, 107.0, 29.0, 12.0, 13.0, 3.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.030303955078125, -0.029304981231689453, -0.028306007385253906, -0.02730703353881836, -0.026308059692382812, -0.025309085845947266, -0.02431011199951172, -0.023311138153076172, -0.022312164306640625, -0.021313190460205078, -0.02031421661376953, -0.019315242767333984, -0.018316268920898438, -0.01731729507446289, -0.016318321228027344, -0.015319347381591797, -0.01432037353515625, -0.013321399688720703, -0.012322425842285156, -0.01132345199584961, -0.010324478149414062, -0.009325504302978516, -0.008326530456542969, -0.007327556610107422, -0.006328582763671875, -0.005329608917236328, -0.004330635070800781, -0.0033316612243652344, -0.0023326873779296875, -0.0013337135314941406, -0.00033473968505859375, 0.0006642341613769531, 0.0016632080078125, 0.002662181854248047, 0.0036611557006835938, 0.004660129547119141, 0.0056591033935546875, 0.006658077239990234, 0.007657051086425781, 0.008656024932861328, 0.009654998779296875, 0.010653972625732422, 0.011652946472167969, 0.012651920318603516, 0.013650894165039062, 0.01464986801147461, 0.015648841857910156, 0.016647815704345703, 0.01764678955078125, 0.018645763397216797, 0.019644737243652344, 0.02064371109008789, 0.021642684936523438, 0.022641658782958984, 0.02364063262939453, 0.024639606475830078, 0.025638580322265625, 0.026637554168701172, 0.02763652801513672, 0.028635501861572266, 0.029634475708007812, 0.03063344955444336, 0.031632423400878906, 0.03263139724731445, 0.03363037109375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 4.0, 8.0, 4.0, 18.0, 20.0, 34.0, 93.0, 192.0, 254.0, 153.0, 77.0, 36.0, 21.0, 14.0, 11.0, 14.0, 7.0, 8.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0158843994140625, -0.015394449234008789, -0.014904499053955078, -0.014414548873901367, -0.013924598693847656, -0.013434648513793945, -0.012944698333740234, -0.012454748153686523, -0.011964797973632812, -0.011474847793579102, -0.01098489761352539, -0.01049494743347168, -0.010004997253417969, -0.009515047073364258, -0.009025096893310547, -0.008535146713256836, -0.008045196533203125, -0.007555246353149414, -0.007065296173095703, -0.006575345993041992, -0.006085395812988281, -0.00559544563293457, -0.005105495452880859, -0.0046155452728271484, -0.0041255950927734375, -0.0036356449127197266, -0.0031456947326660156, -0.0026557445526123047, -0.0021657943725585938, -0.0016758441925048828, -0.0011858940124511719, -0.0006959438323974609, -0.00020599365234375, 0.00028395652770996094, 0.0007739067077636719, 0.0012638568878173828, 0.0017538070678710938, 0.0022437572479248047, 0.0027337074279785156, 0.0032236576080322266, 0.0037136077880859375, 0.0042035579681396484, 0.004693508148193359, 0.00518345832824707, 0.005673408508300781, 0.006163358688354492, 0.006653308868408203, 0.007143259048461914, 0.007633209228515625, 0.008123159408569336, 0.008613109588623047, 0.009103059768676758, 0.009593009948730469, 0.01008296012878418, 0.01057291030883789, 0.011062860488891602, 0.011552810668945312, 0.012042760848999023, 0.012532711029052734, 0.013022661209106445, 0.013512611389160156, 0.014002561569213867, 0.014492511749267578, 0.014982461929321289, 0.015472412109375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [19.0, 693.0, 291.0, 17.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08638295531272888, -0.039517052471637726, 0.00734885036945343, 0.05421474575996399, 0.10108065605163574, 0.1479465663433075, 0.19481244683265686, 0.2416783571243286, 0.28854426741600037, 0.3354101777076721, 0.3822760581970215, 0.42914196848869324, 0.476007878780365, 0.5228737592697144, 0.5697396993637085, 0.6166055798530579, 0.6634714603424072, 0.7103373408317566, 0.7572032809257507, 0.8040691614151001, 0.8509351015090942, 0.8978009819984436, 0.944666862487793, 0.9915328025817871, 1.0383987426757812, 1.0852646827697754, 1.13213050365448, 1.1789964437484741, 1.2258623838424683, 1.2727282047271729, 1.319594144821167, 1.3664600849151611, 1.4133260250091553, 1.4601919651031494, 1.507057785987854, 1.5539237260818481, 1.6007896661758423, 1.6476554870605469, 1.694521427154541, 1.7413873672485352, 1.7882533073425293, 1.8351192474365234, 1.881985068321228, 1.9288510084152222, 1.9757169485092163, 2.022582769393921, 2.069448709487915, 2.116314649581909, 2.163180351257324, 2.2100462913513184, 2.2569122314453125, 2.3037781715393066, 2.3506438732147217, 2.397509813308716, 2.44437575340271, 2.491241693496704, 2.5381076335906982, 2.5849735736846924, 2.6318395137786865, 2.6787052154541016, 2.7255711555480957, 2.77243709564209, 2.819303035736084, 2.866168975830078, 2.9130349159240723]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 1.0, 6.0, 4.0, 8.0, 6.0, 7.0, 12.0, 11.0, 22.0, 25.0, 32.0, 20.0, 25.0, 33.0, 38.0, 48.0, 52.0, 43.0, 56.0, 62.0, 50.0, 57.0, 54.0, 34.0, 40.0, 46.0, 40.0, 33.0, 30.0, 22.0, 16.0, 14.0, 9.0, 15.0, 9.0, 6.0, 2.0, 9.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12080889940261841, -0.11715881526470184, -0.11350873112678528, -0.10985865443944931, -0.10620857030153275, -0.10255848616361618, -0.09890840947628021, -0.09525832533836365, -0.09160824120044708, -0.08795815706253052, -0.08430807292461395, -0.08065799623727798, -0.07700791209936142, -0.07335782796144485, -0.06970775127410889, -0.06605766713619232, -0.06240758299827576, -0.05875749886035919, -0.055107418447732925, -0.05145733803510666, -0.047807253897190094, -0.04415716975927353, -0.04050708934664726, -0.036857008934020996, -0.03320692479610443, -0.029556842520833015, -0.0259067602455616, -0.022256677970290184, -0.01860659569501877, -0.014956513419747353, -0.011306431144475937, -0.007656348869204521, -0.0040062665939331055, -0.00035618431866168976, 0.003293897956609726, 0.006943980231881142, 0.010594062507152557, 0.014244144782423973, 0.01789422705769539, 0.021544309332966805, 0.02519439160823822, 0.028844473883509636, 0.03249455615878105, 0.03614463657140732, 0.03979472070932388, 0.04344480484724045, 0.047094885259866714, 0.05074496567249298, 0.054395049810409546, 0.05804513394832611, 0.06169521436095238, 0.06534529477357864, 0.06899537891149521, 0.07264546304941177, 0.07629553973674774, 0.0799456238746643, 0.08359570801258087, 0.08724579215049744, 0.090895876288414, 0.09454595297574997, 0.09819603711366653, 0.1018461212515831, 0.10549619793891907, 0.10914628207683563, 0.1127963662147522]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 15.0, 21.0, 18.0, 24.0, 32.0, 38.0, 57.0, 90.0, 158.0, 312.0, 646.0, 1364.0, 3603.0, 14996.0, 3868315.0, 290601.0, 8795.0, 2770.0, 1107.0, 549.0, 272.0, 169.0, 108.0, 76.0, 43.0, 30.0, 19.0, 13.0, 5.0, 10.0, 7.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.087890625, -0.08521556854248047, -0.08254051208496094, -0.0798654556274414, -0.07719039916992188, -0.07451534271240234, -0.07184028625488281, -0.06916522979736328, -0.06649017333984375, -0.06381511688232422, -0.06114006042480469, -0.058465003967285156, -0.055789947509765625, -0.053114891052246094, -0.05043983459472656, -0.04776477813720703, -0.0450897216796875, -0.04241466522216797, -0.03973960876464844, -0.037064552307128906, -0.034389495849609375, -0.031714439392089844, -0.029039382934570312, -0.02636432647705078, -0.02368927001953125, -0.02101421356201172, -0.018339157104492188, -0.015664100646972656, -0.012989044189453125, -0.010313987731933594, -0.0076389312744140625, -0.004963874816894531, -0.002288818359375, 0.00038623809814453125, 0.0030612945556640625, 0.005736351013183594, 0.008411407470703125, 0.011086463928222656, 0.013761520385742188, 0.01643657684326172, 0.01911163330078125, 0.02178668975830078, 0.024461746215820312, 0.027136802673339844, 0.029811859130859375, 0.032486915588378906, 0.03516197204589844, 0.03783702850341797, 0.0405120849609375, 0.04318714141845703, 0.04586219787597656, 0.048537254333496094, 0.051212310791015625, 0.053887367248535156, 0.05656242370605469, 0.05923748016357422, 0.06191253662109375, 0.06458759307861328, 0.06726264953613281, 0.06993770599365234, 0.07261276245117188, 0.0752878189086914, 0.07796287536621094, 0.08063793182373047, 0.08331298828125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 10.0, 7.0, 16.0, 9.0, 18.0, 14.0, 17.0, 25.0, 37.0, 51.0, 50.0, 66.0, 72.0, 61.0, 79.0, 56.0, 60.0, 63.0, 45.0, 46.0, 38.0, 29.0, 33.0, 25.0, 25.0, 12.0, 14.0, 5.0, 5.0, 7.0, 1.0, 2.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00940704345703125, -0.009130001068115234, -0.008852958679199219, -0.008575916290283203, -0.008298873901367188, -0.008021831512451172, -0.007744789123535156, -0.007467746734619141, -0.007190704345703125, -0.006913661956787109, -0.006636619567871094, -0.006359577178955078, -0.0060825347900390625, -0.005805492401123047, -0.005528450012207031, -0.005251407623291016, -0.004974365234375, -0.004697322845458984, -0.004420280456542969, -0.004143238067626953, -0.0038661956787109375, -0.003589153289794922, -0.0033121109008789062, -0.0030350685119628906, -0.002758026123046875, -0.0024809837341308594, -0.0022039413452148438, -0.0019268989562988281, -0.0016498565673828125, -0.0013728141784667969, -0.0010957717895507812, -0.0008187294006347656, -0.00054168701171875, -0.0002646446228027344, 1.239776611328125e-05, 0.0002894401550292969, 0.0005664825439453125, 0.0008435249328613281, 0.0011205673217773438, 0.0013976097106933594, 0.001674652099609375, 0.0019516944885253906, 0.0022287368774414062, 0.002505779266357422, 0.0027828216552734375, 0.003059864044189453, 0.0033369064331054688, 0.0036139488220214844, 0.0038909912109375, 0.004168033599853516, 0.004445075988769531, 0.004722118377685547, 0.0049991607666015625, 0.005276203155517578, 0.005553245544433594, 0.005830287933349609, 0.006107330322265625, 0.006384372711181641, 0.006661415100097656, 0.006938457489013672, 0.0072154998779296875, 0.007492542266845703, 0.007769584655761719, 0.008046627044677734, 0.00832366943359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 8.0, 11.0, 20.0, 21.0, 24.0, 77.0, 181.0, 637.0, 3103.0, 42473.0, 4090434.0, 52643.0, 3423.0, 723.0, 237.0, 90.0, 47.0, 31.0, 18.0, 19.0, 9.0, 6.0, 10.0, 3.0, 10.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.049835205078125, -0.04752016067504883, -0.045205116271972656, -0.042890071868896484, -0.04057502746582031, -0.03825998306274414, -0.03594493865966797, -0.0336298942565918, -0.031314849853515625, -0.028999805450439453, -0.02668476104736328, -0.02436971664428711, -0.022054672241210938, -0.019739627838134766, -0.017424583435058594, -0.015109539031982422, -0.01279449462890625, -0.010479450225830078, -0.008164405822753906, -0.005849361419677734, -0.0035343170166015625, -0.0012192726135253906, 0.0010957717895507812, 0.003410816192626953, 0.005725860595703125, 0.008040904998779297, 0.010355949401855469, 0.01267099380493164, 0.014986038208007812, 0.017301082611083984, 0.019616127014160156, 0.021931171417236328, 0.0242462158203125, 0.026561260223388672, 0.028876304626464844, 0.031191349029541016, 0.03350639343261719, 0.03582143783569336, 0.03813648223876953, 0.0404515266418457, 0.042766571044921875, 0.04508161544799805, 0.04739665985107422, 0.04971170425415039, 0.05202674865722656, 0.054341793060302734, 0.056656837463378906, 0.05897188186645508, 0.06128692626953125, 0.06360197067260742, 0.0659170150756836, 0.06823205947875977, 0.07054710388183594, 0.07286214828491211, 0.07517719268798828, 0.07749223709106445, 0.07980728149414062, 0.0821223258972168, 0.08443737030029297, 0.08675241470336914, 0.08906745910644531, 0.09138250350952148, 0.09369754791259766, 0.09601259231567383, 0.09832763671875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 5.0, 7.0, 10.0, 9.0, 17.0, 21.0, 26.0, 37.0, 50.0, 57.0, 119.0, 245.0, 684.0, 1424.0, 740.0, 267.0, 121.0, 74.0, 39.0, 34.0, 19.0, 17.0, 8.0, 5.0, 16.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.019073486328125, -0.018614768981933594, -0.018156051635742188, -0.01769733428955078, -0.017238616943359375, -0.01677989959716797, -0.016321182250976562, -0.015862464904785156, -0.01540374755859375, -0.014945030212402344, -0.014486312866210938, -0.014027595520019531, -0.013568878173828125, -0.013110160827636719, -0.012651443481445312, -0.012192726135253906, -0.0117340087890625, -0.011275291442871094, -0.010816574096679688, -0.010357856750488281, -0.009899139404296875, -0.009440422058105469, -0.008981704711914062, -0.008522987365722656, -0.00806427001953125, -0.007605552673339844, -0.0071468353271484375, -0.006688117980957031, -0.006229400634765625, -0.005770683288574219, -0.0053119659423828125, -0.004853248596191406, -0.00439453125, -0.003935813903808594, -0.0034770965576171875, -0.0030183792114257812, -0.002559661865234375, -0.0021009445190429688, -0.0016422271728515625, -0.0011835098266601562, -0.00072479248046875, -0.00026607513427734375, 0.0001926422119140625, 0.0006513595581054688, 0.001110076904296875, 0.0015687942504882812, 0.0020275115966796875, 0.0024862289428710938, 0.0029449462890625, 0.0034036636352539062, 0.0038623809814453125, 0.004321098327636719, 0.004779815673828125, 0.005238533020019531, 0.0056972503662109375, 0.006155967712402344, 0.00661468505859375, 0.007073402404785156, 0.0075321197509765625, 0.007990837097167969, 0.008449554443359375, 0.008908271789550781, 0.009366989135742188, 0.009825706481933594, 0.010284423828125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 38.0, 939.0, 41.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7823076248168945, -0.7671431303024292, -0.7519786953926086, -0.7368142008781433, -0.721649706363678, -0.7064852714538574, -0.6913207769393921, -0.6761562824249268, -0.6609917879104614, -0.6458272933959961, -0.6306628584861755, -0.6154983639717102, -0.6003338694572449, -0.5851694345474243, -0.570004940032959, -0.5548404455184937, -0.5396760106086731, -0.5245115160942078, -0.5093470811843872, -0.4941825866699219, -0.47901809215545654, -0.4638536274433136, -0.44868916273117065, -0.4335246682167053, -0.41836017370224, -0.40319570899009705, -0.3880312144756317, -0.37286674976348877, -0.35770225524902344, -0.3425377905368805, -0.32737332582473755, -0.3122088313102722, -0.2970443367958069, -0.28187987208366394, -0.2667153775691986, -0.25155091285705566, -0.23638643324375153, -0.2212219536304474, -0.20605747401714325, -0.1908929944038391, -0.17572852969169617, -0.16056405007839203, -0.1453995704650879, -0.13023510575294495, -0.11507062613964081, -0.09990614652633667, -0.08474166691303253, -0.06957719475030899, -0.05441272258758545, -0.03924824669957161, -0.02408376894891262, -0.008919291198253632, 0.006245184689760208, 0.021409660577774048, 0.036574140191078186, 0.05173861235380173, 0.06690309196710587, 0.08206757158041, 0.09723204374313354, 0.11239652335643768, 0.12756100296974182, 0.14272546768188477, 0.1578899621963501, 0.17305442690849304, 0.18821890652179718]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 7.0, 5.0, 8.0, 13.0, 8.0, 12.0, 16.0, 26.0, 20.0, 25.0, 21.0, 38.0, 30.0, 29.0, 44.0, 27.0, 38.0, 35.0, 35.0, 44.0, 37.0, 45.0, 50.0, 36.0, 40.0, 38.0, 39.0, 21.0, 31.0, 30.0, 30.0, 24.0, 22.0, 11.0, 11.0, 10.0, 11.0, 4.0, 8.0, 10.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.03634387254714966, -0.03531333804130554, -0.034282803535461426, -0.03325226902961731, -0.03222173452377319, -0.031191200017929077, -0.03016066551208496, -0.029130131006240845, -0.02809959650039673, -0.027069061994552612, -0.026038527488708496, -0.02500799298286438, -0.023977458477020264, -0.022946923971176147, -0.02191638946533203, -0.020885854959487915, -0.0198553204536438, -0.018824785947799683, -0.017794251441955566, -0.01676371693611145, -0.015733182430267334, -0.014702647924423218, -0.013672113418579102, -0.012641578912734985, -0.01161104440689087, -0.010580509901046753, -0.009549975395202637, -0.00851944088935852, -0.007488906383514404, -0.006458371877670288, -0.005427837371826172, -0.004397302865982056, -0.0033667683601379395, -0.0023362338542938232, -0.001305699348449707, -0.0002751648426055908, 0.0007553696632385254, 0.0017859041690826416, 0.002816438674926758, 0.003846973180770874, 0.00487750768661499, 0.0059080421924591064, 0.006938576698303223, 0.007969111204147339, 0.008999645709991455, 0.010030180215835571, 0.011060714721679688, 0.012091249227523804, 0.01312178373336792, 0.014152318239212036, 0.015182852745056152, 0.01621338725090027, 0.017243921756744385, 0.0182744562625885, 0.019304990768432617, 0.020335525274276733, 0.02136605978012085, 0.022396594285964966, 0.023427128791809082, 0.024457663297653198, 0.025488197803497314, 0.02651873230934143, 0.027549266815185547, 0.028579801321029663, 0.02961033582687378]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 2.0, 6.0, 10.0, 14.0, 11.0, 14.0, 30.0, 39.0, 47.0, 68.0, 77.0, 120.0, 172.0, 240.0, 305.0, 465.0, 674.0, 1050.0, 1777.0, 2899.0, 4967.0, 8401.0, 14703.0, 28002.0, 55464.0, 125890.0, 404732.0, 224707.0, 84765.0, 39696.0, 20788.0, 11631.0, 6452.0, 3658.0, 2370.0, 1478.0, 929.0, 671.0, 400.0, 267.0, 180.0, 107.0, 81.0, 46.0, 38.0, 30.0, 21.0, 15.0, 12.0, 7.0, 6.0, 9.0, 5.0, 5.0, 6.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.026153564453125, -0.02530360221862793, -0.02445363998413086, -0.02360367774963379, -0.02275371551513672, -0.02190375328063965, -0.021053791046142578, -0.020203828811645508, -0.019353866577148438, -0.018503904342651367, -0.017653942108154297, -0.016803979873657227, -0.015954017639160156, -0.015104055404663086, -0.014254093170166016, -0.013404130935668945, -0.012554168701171875, -0.011704206466674805, -0.010854244232177734, -0.010004281997680664, -0.009154319763183594, -0.008304357528686523, -0.007454395294189453, -0.006604433059692383, -0.0057544708251953125, -0.004904508590698242, -0.004054546356201172, -0.0032045841217041016, -0.0023546218872070312, -0.001504659652709961, -0.0006546974182128906, 0.0001952648162841797, 0.00104522705078125, 0.0018951892852783203, 0.0027451515197753906, 0.003595113754272461, 0.004445075988769531, 0.0052950382232666016, 0.006145000457763672, 0.006994962692260742, 0.007844924926757812, 0.008694887161254883, 0.009544849395751953, 0.010394811630249023, 0.011244773864746094, 0.012094736099243164, 0.012944698333740234, 0.013794660568237305, 0.014644622802734375, 0.015494585037231445, 0.016344547271728516, 0.017194509506225586, 0.018044471740722656, 0.018894433975219727, 0.019744396209716797, 0.020594358444213867, 0.021444320678710938, 0.022294282913208008, 0.023144245147705078, 0.02399420738220215, 0.02484416961669922, 0.02569413185119629, 0.02654409408569336, 0.02739405632019043, 0.0282440185546875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 11.0, 15.0, 13.0, 14.0, 17.0, 17.0, 27.0, 35.0, 46.0, 46.0, 62.0, 50.0, 68.0, 77.0, 65.0, 65.0, 46.0, 52.0, 50.0, 38.0, 34.0, 30.0, 30.0, 21.0, 20.0, 11.0, 13.0, 8.0, 5.0, 2.0, 4.0, 5.0, 1.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0087127685546875, -0.008451700210571289, -0.008190631866455078, -0.007929563522338867, -0.007668495178222656, -0.007407426834106445, -0.007146358489990234, -0.0068852901458740234, -0.0066242218017578125, -0.0063631534576416016, -0.006102085113525391, -0.00584101676940918, -0.005579948425292969, -0.005318880081176758, -0.005057811737060547, -0.004796743392944336, -0.004535675048828125, -0.004274606704711914, -0.004013538360595703, -0.003752470016479492, -0.0034914016723632812, -0.0032303333282470703, -0.0029692649841308594, -0.0027081966400146484, -0.0024471282958984375, -0.0021860599517822266, -0.0019249916076660156, -0.0016639232635498047, -0.0014028549194335938, -0.0011417865753173828, -0.0008807182312011719, -0.0006196498870849609, -0.00035858154296875, -9.751319885253906e-05, 0.00016355514526367188, 0.0004246234893798828, 0.0006856918334960938, 0.0009467601776123047, 0.0012078285217285156, 0.0014688968658447266, 0.0017299652099609375, 0.0019910335540771484, 0.0022521018981933594, 0.0025131702423095703, 0.0027742385864257812, 0.003035306930541992, 0.003296375274658203, 0.003557443618774414, 0.003818511962890625, 0.004079580307006836, 0.004340648651123047, 0.004601716995239258, 0.004862785339355469, 0.00512385368347168, 0.005384922027587891, 0.0056459903717041016, 0.0059070587158203125, 0.0061681270599365234, 0.006429195404052734, 0.006690263748168945, 0.006951332092285156, 0.007212400436401367, 0.007473468780517578, 0.007734537124633789, 0.00799560546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 5.0, 6.0, 9.0, 7.0, 9.0, 14.0, 22.0, 23.0, 41.0, 34.0, 84.0, 114.0, 247.0, 471.0, 1302.0, 5846.0, 48298.0, 767887.0, 201976.0, 17725.0, 2807.0, 778.0, 328.0, 183.0, 93.0, 68.0, 54.0, 35.0, 16.0, 9.0, 8.0, 8.0, 3.0, 4.0, 9.0, 2.0, 6.0, 5.0, 1.0, 3.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.08612060546875, -0.08364391326904297, -0.08116722106933594, -0.0786905288696289, -0.07621383666992188, -0.07373714447021484, -0.07126045227050781, -0.06878376007080078, -0.06630706787109375, -0.06383037567138672, -0.06135368347167969, -0.058876991271972656, -0.056400299072265625, -0.053923606872558594, -0.05144691467285156, -0.04897022247314453, -0.0464935302734375, -0.04401683807373047, -0.04154014587402344, -0.039063453674316406, -0.036586761474609375, -0.034110069274902344, -0.03163337707519531, -0.02915668487548828, -0.02667999267578125, -0.02420330047607422, -0.021726608276367188, -0.019249916076660156, -0.016773223876953125, -0.014296531677246094, -0.011819839477539062, -0.009343147277832031, -0.006866455078125, -0.004389762878417969, -0.0019130706787109375, 0.0005636215209960938, 0.003040313720703125, 0.005517005920410156, 0.007993698120117188, 0.010470390319824219, 0.01294708251953125, 0.015423774719238281, 0.017900466918945312, 0.020377159118652344, 0.022853851318359375, 0.025330543518066406, 0.027807235717773438, 0.03028392791748047, 0.0327606201171875, 0.03523731231689453, 0.03771400451660156, 0.040190696716308594, 0.042667388916015625, 0.045144081115722656, 0.04762077331542969, 0.05009746551513672, 0.05257415771484375, 0.05505084991455078, 0.05752754211425781, 0.060004234313964844, 0.062480926513671875, 0.0649576187133789, 0.06743431091308594, 0.06991100311279297, 0.0723876953125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 5.0, 8.0, 11.0, 14.0, 16.0, 19.0, 18.0, 19.0, 15.0, 29.0, 33.0, 22.0, 31.0, 36.0, 28.0, 47.0, 50.0, 43.0, 49.0, 50.0, 44.0, 42.0, 42.0, 30.0, 32.0, 34.0, 37.0, 22.0, 29.0, 21.0, 23.0, 12.0, 18.0, 11.0, 16.0, 9.0, 5.0, 4.0, 6.0, 7.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013580322265625, -0.013089179992675781, -0.012598037719726562, -0.012106895446777344, -0.011615753173828125, -0.011124610900878906, -0.010633468627929688, -0.010142326354980469, -0.00965118408203125, -0.009160041809082031, -0.008668899536132812, -0.008177757263183594, -0.007686614990234375, -0.007195472717285156, -0.0067043304443359375, -0.006213188171386719, -0.0057220458984375, -0.005230903625488281, -0.0047397613525390625, -0.004248619079589844, -0.003757476806640625, -0.0032663345336914062, -0.0027751922607421875, -0.0022840499877929688, -0.00179290771484375, -0.0013017654418945312, -0.0008106231689453125, -0.00031948089599609375, 0.000171661376953125, 0.0006628036499023438, 0.0011539459228515625, 0.0016450881958007812, 0.00213623046875, 0.0026273727416992188, 0.0031185150146484375, 0.0036096572875976562, 0.004100799560546875, 0.004591941833496094, 0.0050830841064453125, 0.005574226379394531, 0.00606536865234375, 0.006556510925292969, 0.0070476531982421875, 0.007538795471191406, 0.008029937744140625, 0.008521080017089844, 0.009012222290039062, 0.009503364562988281, 0.0099945068359375, 0.010485649108886719, 0.010976791381835938, 0.011467933654785156, 0.011959075927734375, 0.012450218200683594, 0.012941360473632812, 0.013432502746582031, 0.01392364501953125, 0.014414787292480469, 0.014905929565429688, 0.015397071838378906, 0.015888214111328125, 0.016379356384277344, 0.016870498657226562, 0.01736164093017578, 0.017852783203125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 9.0, 8.0, 7.0, 9.0, 11.0, 23.0, 24.0, 33.0, 44.0, 80.0, 119.0, 242.0, 630.0, 1763.0, 6332.0, 36012.0, 917122.0, 72670.0, 9439.0, 2438.0, 753.0, 301.0, 181.0, 81.0, 59.0, 49.0, 19.0, 20.0, 21.0, 14.0, 9.0, 10.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01727294921875, -0.01674365997314453, -0.016214370727539062, -0.015685081481933594, -0.015155792236328125, -0.014626502990722656, -0.014097213745117188, -0.013567924499511719, -0.01303863525390625, -0.012509346008300781, -0.011980056762695312, -0.011450767517089844, -0.010921478271484375, -0.010392189025878906, -0.009862899780273438, -0.009333610534667969, -0.0088043212890625, -0.008275032043457031, -0.0077457427978515625, -0.007216453552246094, -0.006687164306640625, -0.006157875061035156, -0.0056285858154296875, -0.005099296569824219, -0.00457000732421875, -0.004040718078613281, -0.0035114288330078125, -0.0029821395874023438, -0.002452850341796875, -0.0019235610961914062, -0.0013942718505859375, -0.0008649826049804688, -0.000335693359375, 0.00019359588623046875, 0.0007228851318359375, 0.0012521743774414062, 0.001781463623046875, 0.0023107528686523438, 0.0028400421142578125, 0.0033693313598632812, 0.00389862060546875, 0.004427909851074219, 0.0049571990966796875, 0.005486488342285156, 0.006015777587890625, 0.006545066833496094, 0.0070743560791015625, 0.007603645324707031, 0.0081329345703125, 0.008662223815917969, 0.009191513061523438, 0.009720802307128906, 0.010250091552734375, 0.010779380798339844, 0.011308670043945312, 0.011837959289550781, 0.01236724853515625, 0.012896537780761719, 0.013425827026367188, 0.013955116271972656, 0.014484405517578125, 0.015013694763183594, 0.015542984008789062, 0.01607227325439453, 0.0166015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 4.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 8.0, 11.0, 10.0, 18.0, 10.0, 15.0, 31.0, 22.0, 68.0, 61.0, 71.0, 124.0, 81.0, 120.0, 66.0, 82.0, 28.0, 21.0, 35.0, 18.0, 13.0, 7.0, 9.0, 18.0, 7.0, 7.0, 2.0, 2.0, 5.0, 1.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.76837158203125e-06, -4.624947905540466e-06, -4.481524229049683e-06, -4.338100552558899e-06, -4.194676876068115e-06, -4.0512531995773315e-06, -3.907829523086548e-06, -3.764405846595764e-06, -3.6209821701049805e-06, -3.4775584936141968e-06, -3.334134817123413e-06, -3.1907111406326294e-06, -3.0472874641418457e-06, -2.903863787651062e-06, -2.7604401111602783e-06, -2.6170164346694946e-06, -2.473592758178711e-06, -2.3301690816879272e-06, -2.1867454051971436e-06, -2.04332172870636e-06, -1.8998980522155762e-06, -1.7564743757247925e-06, -1.6130506992340088e-06, -1.469627022743225e-06, -1.3262033462524414e-06, -1.1827796697616577e-06, -1.039355993270874e-06, -8.959323167800903e-07, -7.525086402893066e-07, -6.09084963798523e-07, -4.6566128730773926e-07, -3.2223761081695557e-07, -1.7881393432617188e-07, -3.5390257835388184e-08, 1.0803341865539551e-07, 2.514570951461792e-07, 3.948807716369629e-07, 5.383044481277466e-07, 6.817281246185303e-07, 8.25151801109314e-07, 9.685754776000977e-07, 1.1119991540908813e-06, 1.255422830581665e-06, 1.3988465070724487e-06, 1.5422701835632324e-06, 1.6856938600540161e-06, 1.8291175365447998e-06, 1.9725412130355835e-06, 2.115964889526367e-06, 2.259388566017151e-06, 2.4028122425079346e-06, 2.5462359189987183e-06, 2.689659595489502e-06, 2.8330832719802856e-06, 2.9765069484710693e-06, 3.119930624961853e-06, 3.2633543014526367e-06, 3.4067779779434204e-06, 3.550201654434204e-06, 3.693625330924988e-06, 3.8370490074157715e-06, 3.980472683906555e-06, 4.123896360397339e-06, 4.2673200368881226e-06, 4.410743713378906e-06]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 8.0, 4.0, 14.0, 26.0, 34.0, 62.0, 123.0, 265.0, 638.0, 1978.0, 8605.0, 117951.0, 899186.0, 15030.0, 3003.0, 928.0, 353.0, 137.0, 98.0, 42.0, 26.0, 21.0, 9.0, 7.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01271820068359375, -0.012366414070129395, -0.012014627456665039, -0.011662840843200684, -0.011311054229736328, -0.010959267616271973, -0.010607481002807617, -0.010255694389343262, -0.009903907775878906, -0.00955212116241455, -0.009200334548950195, -0.00884854793548584, -0.008496761322021484, -0.008144974708557129, -0.0077931880950927734, -0.007441401481628418, -0.0070896148681640625, -0.006737828254699707, -0.0063860416412353516, -0.006034255027770996, -0.005682468414306641, -0.005330681800842285, -0.00497889518737793, -0.004627108573913574, -0.004275321960449219, -0.003923535346984863, -0.003571748733520508, -0.0032199621200561523, -0.002868175506591797, -0.0025163888931274414, -0.002164602279663086, -0.0018128156661987305, -0.001461029052734375, -0.0011092424392700195, -0.0007574558258056641, -0.0004056692123413086, -5.3882598876953125e-05, 0.00029790401458740234, 0.0006496906280517578, 0.0010014772415161133, 0.0013532638549804688, 0.0017050504684448242, 0.0020568370819091797, 0.002408623695373535, 0.0027604103088378906, 0.003112196922302246, 0.0034639835357666016, 0.003815770149230957, 0.0041675567626953125, 0.004519343376159668, 0.0048711299896240234, 0.005222916603088379, 0.005574703216552734, 0.00592648983001709, 0.006278276443481445, 0.006630063056945801, 0.006981849670410156, 0.007333636283874512, 0.007685422897338867, 0.008037209510803223, 0.008388996124267578, 0.008740782737731934, 0.009092569351196289, 0.009444355964660645, 0.009796142578125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 2.0, 8.0, 9.0, 12.0, 32.0, 33.0, 58.0, 248.0, 373.0, 94.0, 42.0, 22.0, 14.0, 12.0, 9.0, 9.0, 4.0, 8.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003814697265625, -0.003668665885925293, -0.003522634506225586, -0.003376603126525879, -0.003230571746826172, -0.003084540367126465, -0.002938508987426758, -0.0027924776077270508, -0.0026464462280273438, -0.0025004148483276367, -0.0023543834686279297, -0.0022083520889282227, -0.0020623207092285156, -0.0019162893295288086, -0.0017702579498291016, -0.0016242265701293945, -0.0014781951904296875, -0.0013321638107299805, -0.0011861324310302734, -0.0010401010513305664, -0.0008940696716308594, -0.0007480382919311523, -0.0006020069122314453, -0.0004559755325317383, -0.00030994415283203125, -0.00016391277313232422, -1.7881393432617188e-05, 0.00012814998626708984, 0.0002741813659667969, 0.0004202127456665039, 0.0005662441253662109, 0.000712275505065918, 0.000858306884765625, 0.001004338264465332, 0.001150369644165039, 0.001296401023864746, 0.0014424324035644531, 0.0015884637832641602, 0.0017344951629638672, 0.0018805265426635742, 0.0020265579223632812, 0.0021725893020629883, 0.0023186206817626953, 0.0024646520614624023, 0.0026106834411621094, 0.0027567148208618164, 0.0029027462005615234, 0.0030487775802612305, 0.0031948089599609375, 0.0033408403396606445, 0.0034868717193603516, 0.0036329030990600586, 0.0037789344787597656, 0.003924965858459473, 0.00407099723815918, 0.004217028617858887, 0.004363059997558594, 0.004509091377258301, 0.004655122756958008, 0.004801154136657715, 0.004947185516357422, 0.005093216896057129, 0.005239248275756836, 0.005385279655456543, 0.00553131103515625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 29.0, 419.0, 538.0, 24.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10656151920557022, -0.0890379324555397, -0.07151434570550919, -0.05399075895547867, -0.03646717220544815, -0.018943585455417633, -0.0014199987053871155, 0.016103588044643402, 0.03362717479467392, 0.05115076154470444, 0.06867434829473495, 0.08619793504476547, 0.10372152179479599, 0.12124510854482651, 0.13876870274543762, 0.15629228949546814, 0.17381587624549866, 0.19133946299552917, 0.2088630497455597, 0.2263866364955902, 0.24391022324562073, 0.26143380999565125, 0.27895739674568176, 0.2964809834957123, 0.3140045702457428, 0.3315281569957733, 0.34905174374580383, 0.36657533049583435, 0.38409891724586487, 0.4016225039958954, 0.4191460907459259, 0.4366696774959564, 0.45419323444366455, 0.47171682119369507, 0.4892404079437256, 0.5067639946937561, 0.5242875814437866, 0.5418111681938171, 0.5593347549438477, 0.5768583416938782, 0.5943819284439087, 0.6119055151939392, 0.6294291019439697, 0.6469526886940002, 0.6644762754440308, 0.6819998621940613, 0.6995234489440918, 0.7170470356941223, 0.7345706224441528, 0.7520942091941833, 0.7696177959442139, 0.7871413826942444, 0.8046649694442749, 0.8221885561943054, 0.8397121429443359, 0.8572357296943665, 0.874759316444397, 0.8922829031944275, 0.909806489944458, 0.9273300766944885, 0.944853663444519, 0.9623772501945496, 0.9799008369445801, 0.9974244236946106, 1.0149480104446411]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 9.0, 13.0, 7.0, 5.0, 16.0, 7.0, 15.0, 18.0, 21.0, 22.0, 22.0, 17.0, 33.0, 34.0, 33.0, 43.0, 32.0, 49.0, 35.0, 38.0, 53.0, 36.0, 41.0, 34.0, 43.0, 38.0, 40.0, 27.0, 22.0, 31.0, 21.0, 21.0, 23.0, 14.0, 13.0, 13.0, 19.0, 6.0, 8.0, 7.0, 4.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.062411487102508545, -0.0605529248714447, -0.05869436264038086, -0.056835804134607315, -0.05497724190354347, -0.05311867967247963, -0.051260121166706085, -0.04940155893564224, -0.0475429967045784, -0.04568443447351456, -0.043825872242450714, -0.04196731373667717, -0.04010875150561333, -0.038250189274549484, -0.03639163076877594, -0.0345330685377121, -0.032674506306648254, -0.03081594407558441, -0.028957383707165718, -0.027098823338747025, -0.025240261107683182, -0.02338169887661934, -0.021523138508200645, -0.019664578139781952, -0.01780601590871811, -0.015947453677654266, -0.014088893309235573, -0.012230332009494305, -0.010371770709753036, -0.008513209410011768, -0.0066546481102705, -0.004796086810529232, -0.002937525510787964, -0.0010789642110466957, 0.0007795970886945724, 0.0026381583884358406, 0.004496719688177109, 0.006355280987918377, 0.008213842287659645, 0.010072403587400913, 0.011930964887142181, 0.01378952618688345, 0.015648087486624718, 0.01750664785504341, 0.019365210086107254, 0.021223772317171097, 0.02308233268558979, 0.024940893054008484, 0.026799455285072327, 0.02865801751613617, 0.030516577884554863, 0.032375138252973557, 0.0342337004840374, 0.03609226271510124, 0.037950821220874786, 0.03980938345193863, 0.04166794568300247, 0.043526507914066315, 0.04538507014513016, 0.0472436286509037, 0.049102190881967545, 0.05096075311303139, 0.05281931161880493, 0.054677873849868774, 0.05653643608093262]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 8.0, 10.0, 11.0, 39.0, 28.0, 48.0, 75.0, 81.0, 117.0, 186.0, 280.0, 456.0, 881.0, 1716.0, 6755.0, 116908.0, 4036140.0, 23799.0, 3624.0, 1321.0, 617.0, 402.0, 254.0, 157.0, 83.0, 70.0, 61.0, 41.0, 29.0, 29.0, 12.0, 11.0, 13.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08673095703125, -0.08404350280761719, -0.08135604858398438, -0.07866859436035156, -0.07598114013671875, -0.07329368591308594, -0.07060623168945312, -0.06791877746582031, -0.0652313232421875, -0.06254386901855469, -0.059856414794921875, -0.05716896057128906, -0.05448150634765625, -0.05179405212402344, -0.049106597900390625, -0.04641914367675781, -0.043731689453125, -0.04104423522949219, -0.038356781005859375, -0.03566932678222656, -0.03298187255859375, -0.030294418334960938, -0.027606964111328125, -0.024919509887695312, -0.0222320556640625, -0.019544601440429688, -0.016857147216796875, -0.014169692993164062, -0.01148223876953125, -0.008794784545898438, -0.006107330322265625, -0.0034198760986328125, -0.000732421875, 0.0019550323486328125, 0.004642486572265625, 0.0073299407958984375, 0.01001739501953125, 0.012704849243164062, 0.015392303466796875, 0.018079757690429688, 0.0207672119140625, 0.023454666137695312, 0.026142120361328125, 0.028829574584960938, 0.03151702880859375, 0.03420448303222656, 0.036891937255859375, 0.03957939147949219, 0.042266845703125, 0.04495429992675781, 0.047641754150390625, 0.05032920837402344, 0.05301666259765625, 0.05570411682128906, 0.058391571044921875, 0.06107902526855469, 0.0637664794921875, 0.06645393371582031, 0.06914138793945312, 0.07182884216308594, 0.07451629638671875, 0.07720375061035156, 0.07989120483398438, 0.08257865905761719, 0.08526611328125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 8.0, 2.0, 7.0, 15.0, 15.0, 12.0, 26.0, 29.0, 24.0, 26.0, 45.0, 50.0, 46.0, 55.0, 71.0, 81.0, 65.0, 54.0, 45.0, 52.0, 40.0, 43.0, 37.0, 37.0, 24.0, 20.0, 11.0, 16.0, 12.0, 5.0, 7.0, 7.0, 8.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00814056396484375, -0.007895231246948242, -0.007649898529052734, -0.0074045658111572266, -0.007159233093261719, -0.006913900375366211, -0.006668567657470703, -0.006423234939575195, -0.0061779022216796875, -0.00593256950378418, -0.005687236785888672, -0.005441904067993164, -0.005196571350097656, -0.0049512386322021484, -0.004705905914306641, -0.004460573196411133, -0.004215240478515625, -0.003969907760620117, -0.0037245750427246094, -0.0034792423248291016, -0.0032339096069335938, -0.002988576889038086, -0.002743244171142578, -0.0024979114532470703, -0.0022525787353515625, -0.0020072460174560547, -0.0017619132995605469, -0.001516580581665039, -0.0012712478637695312, -0.0010259151458740234, -0.0007805824279785156, -0.0005352497100830078, -0.0002899169921875, -4.458427429199219e-05, 0.00020074844360351562, 0.00044608116149902344, 0.0006914138793945312, 0.0009367465972900391, 0.0011820793151855469, 0.0014274120330810547, 0.0016727447509765625, 0.0019180774688720703, 0.002163410186767578, 0.002408742904663086, 0.0026540756225585938, 0.0028994083404541016, 0.0031447410583496094, 0.003390073776245117, 0.003635406494140625, 0.003880739212036133, 0.004126071929931641, 0.0043714046478271484, 0.004616737365722656, 0.004862070083618164, 0.005107402801513672, 0.00535273551940918, 0.0055980682373046875, 0.005843400955200195, 0.006088733673095703, 0.006334066390991211, 0.006579399108886719, 0.0068247318267822266, 0.007070064544677734, 0.007315397262573242, 0.00756072998046875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 8.0, 8.0, 10.0, 17.0, 22.0, 35.0, 41.0, 70.0, 202.0, 566.0, 2813.0, 37367.0, 4045097.0, 101850.0, 4834.0, 818.0, 235.0, 95.0, 75.0, 35.0, 24.0, 11.0, 8.0, 10.0, 9.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07464599609375, -0.07173347473144531, -0.06882095336914062, -0.06590843200683594, -0.06299591064453125, -0.06008338928222656, -0.057170867919921875, -0.05425834655761719, -0.0513458251953125, -0.04843330383300781, -0.045520782470703125, -0.04260826110839844, -0.03969573974609375, -0.03678321838378906, -0.033870697021484375, -0.030958175659179688, -0.028045654296875, -0.025133132934570312, -0.022220611572265625, -0.019308090209960938, -0.01639556884765625, -0.013483047485351562, -0.010570526123046875, -0.0076580047607421875, -0.0047454833984375, -0.0018329620361328125, 0.001079559326171875, 0.0039920806884765625, 0.00690460205078125, 0.009817123413085938, 0.012729644775390625, 0.015642166137695312, 0.0185546875, 0.021467208862304688, 0.024379730224609375, 0.027292251586914062, 0.03020477294921875, 0.03311729431152344, 0.036029815673828125, 0.03894233703613281, 0.0418548583984375, 0.04476737976074219, 0.047679901123046875, 0.05059242248535156, 0.05350494384765625, 0.05641746520996094, 0.059329986572265625, 0.06224250793457031, 0.065155029296875, 0.06806755065917969, 0.07098007202148438, 0.07389259338378906, 0.07680511474609375, 0.07971763610839844, 0.08263015747070312, 0.08554267883300781, 0.0884552001953125, 0.09136772155761719, 0.09428024291992188, 0.09719276428222656, 0.10010528564453125, 0.10301780700683594, 0.10593032836914062, 0.10884284973144531, 0.11175537109375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 6.0, 8.0, 6.0, 7.0, 13.0, 13.0, 16.0, 35.0, 42.0, 52.0, 101.0, 128.0, 232.0, 638.0, 1518.0, 599.0, 251.0, 126.0, 88.0, 59.0, 27.0, 28.0, 25.0, 11.0, 14.0, 13.0, 9.0, 2.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0228271484375, -0.02221822738647461, -0.02160930633544922, -0.021000385284423828, -0.020391464233398438, -0.019782543182373047, -0.019173622131347656, -0.018564701080322266, -0.017955780029296875, -0.017346858978271484, -0.016737937927246094, -0.016129016876220703, -0.015520095825195312, -0.014911174774169922, -0.014302253723144531, -0.01369333267211914, -0.01308441162109375, -0.01247549057006836, -0.011866569519042969, -0.011257648468017578, -0.010648727416992188, -0.010039806365966797, -0.009430885314941406, -0.008821964263916016, -0.008213043212890625, -0.007604122161865234, -0.006995201110839844, -0.006386280059814453, -0.0057773590087890625, -0.005168437957763672, -0.004559516906738281, -0.003950595855712891, -0.0033416748046875, -0.0027327537536621094, -0.0021238327026367188, -0.0015149116516113281, -0.0009059906005859375, -0.0002970695495605469, 0.00031185150146484375, 0.0009207725524902344, 0.001529693603515625, 0.0021386146545410156, 0.0027475357055664062, 0.003356456756591797, 0.0039653778076171875, 0.004574298858642578, 0.005183219909667969, 0.005792140960693359, 0.00640106201171875, 0.007009983062744141, 0.007618904113769531, 0.008227825164794922, 0.008836746215820312, 0.009445667266845703, 0.010054588317871094, 0.010663509368896484, 0.011272430419921875, 0.011881351470947266, 0.012490272521972656, 0.013099193572998047, 0.013708114624023438, 0.014317035675048828, 0.014925956726074219, 0.01553487777709961, 0.016143798828125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 7.0, 21.0, 89.0, 377.0, 408.0, 83.0, 12.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09778594225645065, -0.09125438332557678, -0.08472282439470291, -0.07819126546382904, -0.07165970653295517, -0.0651281476020813, -0.05859658494591713, -0.05206502601504326, -0.04553346708416939, -0.03900190815329552, -0.032470349222421646, -0.025938788428902626, -0.019407229498028755, -0.012875668704509735, -0.006344109773635864, 0.0001874491572380066, 0.0067190080881118774, 0.013250567018985748, 0.01978212594985962, 0.02631368674337864, 0.03284524381160736, 0.03937680646777153, 0.0459083653986454, 0.05243992432951927, 0.05897148326039314, 0.06550304591655731, 0.07203460484743118, 0.07856616377830505, 0.08509772270917892, 0.0916292816400528, 0.09816084057092667, 0.10469239950180054, 0.11122395098209381, 0.11775550991296768, 0.12428706884384155, 0.13081863522529602, 0.1373501867055893, 0.14388175308704376, 0.15041330456733704, 0.1569448709487915, 0.16347642242908478, 0.17000798881053925, 0.17653954029083252, 0.183071106672287, 0.18960265815258026, 0.19613422453403473, 0.202665776014328, 0.20919734239578247, 0.21572890877723694, 0.2222604751586914, 0.22879202663898468, 0.23532359302043915, 0.24185514450073242, 0.2483867108821869, 0.25491827726364136, 0.26144981384277344, 0.2679813802242279, 0.2745129466056824, 0.28104451298713684, 0.2875760495662689, 0.2941076159477234, 0.30063918232917786, 0.3071707487106323, 0.3137022852897644, 0.32023385167121887]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 7.0, 4.0, 6.0, 17.0, 15.0, 12.0, 23.0, 39.0, 43.0, 36.0, 46.0, 43.0, 56.0, 66.0, 59.0, 45.0, 51.0, 56.0, 51.0, 48.0, 42.0, 32.0, 25.0, 36.0, 35.0, 23.0, 16.0, 21.0, 12.0, 8.0, 7.0, 3.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043725013732910156, -0.042000360786914825, -0.040275707840919495, -0.03855105862021446, -0.03682640567421913, -0.0351017527282238, -0.03337710350751877, -0.03165245056152344, -0.029927797615528107, -0.028203144669532776, -0.026478493586182594, -0.024753842502832413, -0.023029189556837082, -0.02130453661084175, -0.01957988552749157, -0.017855234444141388, -0.016130581498146057, -0.014405929483473301, -0.012681277468800545, -0.010956625454127789, -0.009231973439455032, -0.007507321424782276, -0.00578266941010952, -0.004058017395436764, -0.0023333653807640076, -0.0006087133660912514, 0.0011159386485815048, 0.002840590663254261, 0.004565242677927017, 0.006289894692599773, 0.00801454670727253, 0.009739198721945286, 0.011463850736618042, 0.013188502751290798, 0.014913154765963554, 0.016637805849313736, 0.018362458795309067, 0.020087111741304398, 0.02181176282465458, 0.02353641390800476, 0.02526106685400009, 0.026985719799995422, 0.028710370883345604, 0.030435021966695786, 0.032159674912691116, 0.03388432785868645, 0.03560897707939148, 0.03733363002538681, 0.03905828297138214, 0.04078293591737747, 0.0425075888633728, 0.044232238084077835, 0.045956891030073166, 0.0476815439760685, 0.04940619319677353, 0.05113084614276886, 0.05285549908876419, 0.05458015203475952, 0.05630480498075485, 0.058029454201459885, 0.059754107147455215, 0.061478760093450546, 0.06320340931415558, 0.06492806226015091, 0.06665271520614624]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 9.0, 5.0, 9.0, 19.0, 25.0, 49.0, 51.0, 69.0, 108.0, 183.0, 304.0, 427.0, 686.0, 1233.0, 2214.0, 4299.0, 8953.0, 21393.0, 62460.0, 306886.0, 501145.0, 87851.0, 27601.0, 11023.0, 5204.0, 2677.0, 1414.0, 852.0, 514.0, 318.0, 192.0, 123.0, 84.0, 49.0, 37.0, 14.0, 20.0, 16.0, 9.0, 4.0, 12.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040802001953125, -0.03953218460083008, -0.038262367248535156, -0.036992549896240234, -0.03572273254394531, -0.03445291519165039, -0.03318309783935547, -0.03191328048706055, -0.030643463134765625, -0.029373645782470703, -0.02810382843017578, -0.02683401107788086, -0.025564193725585938, -0.024294376373291016, -0.023024559020996094, -0.021754741668701172, -0.02048492431640625, -0.019215106964111328, -0.017945289611816406, -0.016675472259521484, -0.015405654907226562, -0.01413583755493164, -0.012866020202636719, -0.011596202850341797, -0.010326385498046875, -0.009056568145751953, -0.007786750793457031, -0.006516933441162109, -0.0052471160888671875, -0.003977298736572266, -0.0027074813842773438, -0.0014376640319824219, -0.0001678466796875, 0.0011019706726074219, 0.0023717880249023438, 0.0036416053771972656, 0.0049114227294921875, 0.006181240081787109, 0.007451057434082031, 0.008720874786376953, 0.009990692138671875, 0.011260509490966797, 0.012530326843261719, 0.01380014419555664, 0.015069961547851562, 0.016339778900146484, 0.017609596252441406, 0.018879413604736328, 0.02014923095703125, 0.021419048309326172, 0.022688865661621094, 0.023958683013916016, 0.025228500366210938, 0.02649831771850586, 0.02776813507080078, 0.029037952423095703, 0.030307769775390625, 0.03157758712768555, 0.03284740447998047, 0.03411722183227539, 0.03538703918457031, 0.036656856536865234, 0.037926673889160156, 0.03919649124145508, 0.04046630859375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 15.0, 6.0, 14.0, 12.0, 17.0, 27.0, 38.0, 40.0, 39.0, 54.0, 61.0, 49.0, 60.0, 69.0, 62.0, 53.0, 58.0, 61.0, 42.0, 36.0, 22.0, 49.0, 26.0, 14.0, 23.0, 14.0, 11.0, 7.0, 6.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007640838623046875, -0.007410526275634766, -0.007180213928222656, -0.006949901580810547, -0.0067195892333984375, -0.006489276885986328, -0.006258964538574219, -0.006028652191162109, -0.00579833984375, -0.005568027496337891, -0.005337715148925781, -0.005107402801513672, -0.0048770904541015625, -0.004646778106689453, -0.004416465759277344, -0.004186153411865234, -0.003955841064453125, -0.0037255287170410156, -0.0034952163696289062, -0.003264904022216797, -0.0030345916748046875, -0.002804279327392578, -0.0025739669799804688, -0.0023436546325683594, -0.00211334228515625, -0.0018830299377441406, -0.0016527175903320312, -0.0014224052429199219, -0.0011920928955078125, -0.0009617805480957031, -0.0007314682006835938, -0.0005011558532714844, -0.000270843505859375, -4.0531158447265625e-05, 0.00018978118896484375, 0.0004200935363769531, 0.0006504058837890625, 0.0008807182312011719, 0.0011110305786132812, 0.0013413429260253906, 0.0015716552734375, 0.0018019676208496094, 0.0020322799682617188, 0.002262592315673828, 0.0024929046630859375, 0.002723217010498047, 0.0029535293579101562, 0.0031838417053222656, 0.003414154052734375, 0.0036444664001464844, 0.0038747787475585938, 0.004105091094970703, 0.0043354034423828125, 0.004565715789794922, 0.004796028137207031, 0.005026340484619141, 0.00525665283203125, 0.005486965179443359, 0.005717277526855469, 0.005947589874267578, 0.0061779022216796875, 0.006408214569091797, 0.006638526916503906, 0.006868839263916016, 0.007099151611328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 8.0, 3.0, 4.0, 3.0, 4.0, 6.0, 14.0, 12.0, 19.0, 29.0, 31.0, 29.0, 52.0, 89.0, 110.0, 186.0, 360.0, 722.0, 1530.0, 3437.0, 7419.0, 17805.0, 44755.0, 136448.0, 478156.0, 242132.0, 69437.0, 25833.0, 10753.0, 4719.0, 2187.0, 1023.0, 494.0, 251.0, 147.0, 102.0, 61.0, 48.0, 26.0, 23.0, 27.0, 14.0, 13.0, 6.0, 9.0, 5.0, 9.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0258026123046875, -0.024962425231933594, -0.024122238159179688, -0.02328205108642578, -0.022441864013671875, -0.02160167694091797, -0.020761489868164062, -0.019921302795410156, -0.01908111572265625, -0.018240928649902344, -0.017400741577148438, -0.01656055450439453, -0.015720367431640625, -0.014880180358886719, -0.014039993286132812, -0.013199806213378906, -0.012359619140625, -0.011519432067871094, -0.010679244995117188, -0.009839057922363281, -0.008998870849609375, -0.008158683776855469, -0.0073184967041015625, -0.006478309631347656, -0.00563812255859375, -0.004797935485839844, -0.0039577484130859375, -0.0031175613403320312, -0.002277374267578125, -0.0014371871948242188, -0.0005970001220703125, 0.00024318695068359375, 0.0010833740234375, 0.0019235610961914062, 0.0027637481689453125, 0.0036039352416992188, 0.004444122314453125, 0.005284309387207031, 0.0061244964599609375, 0.006964683532714844, 0.00780487060546875, 0.008645057678222656, 0.009485244750976562, 0.010325431823730469, 0.011165618896484375, 0.012005805969238281, 0.012845993041992188, 0.013686180114746094, 0.0145263671875, 0.015366554260253906, 0.016206741333007812, 0.01704692840576172, 0.017887115478515625, 0.01872730255126953, 0.019567489624023438, 0.020407676696777344, 0.02124786376953125, 0.022088050842285156, 0.022928237915039062, 0.02376842498779297, 0.024608612060546875, 0.02544879913330078, 0.026288986206054688, 0.027129173278808594, 0.0279693603515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 2.0, 6.0, 4.0, 6.0, 10.0, 11.0, 12.0, 14.0, 11.0, 21.0, 26.0, 32.0, 20.0, 26.0, 37.0, 40.0, 42.0, 41.0, 54.0, 45.0, 31.0, 43.0, 38.0, 33.0, 51.0, 34.0, 47.0, 33.0, 31.0, 26.0, 17.0, 23.0, 20.0, 17.0, 20.0, 11.0, 13.0, 11.0, 10.0, 5.0, 5.0, 5.0, 2.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0130615234375, -0.012659192085266113, -0.012256860733032227, -0.01185452938079834, -0.011452198028564453, -0.011049866676330566, -0.01064753532409668, -0.010245203971862793, -0.009842872619628906, -0.00944054126739502, -0.009038209915161133, -0.008635878562927246, -0.00823354721069336, -0.007831215858459473, -0.007428884506225586, -0.007026553153991699, -0.0066242218017578125, -0.006221890449523926, -0.005819559097290039, -0.005417227745056152, -0.005014896392822266, -0.004612565040588379, -0.004210233688354492, -0.0038079023361206055, -0.0034055709838867188, -0.003003239631652832, -0.0026009082794189453, -0.0021985769271850586, -0.0017962455749511719, -0.0013939142227172852, -0.0009915828704833984, -0.0005892515182495117, -0.000186920166015625, 0.00021541118621826172, 0.0006177425384521484, 0.0010200738906860352, 0.0014224052429199219, 0.0018247365951538086, 0.0022270679473876953, 0.002629399299621582, 0.0030317306518554688, 0.0034340620040893555, 0.003836393356323242, 0.004238724708557129, 0.004641056060791016, 0.005043387413024902, 0.005445718765258789, 0.005848050117492676, 0.0062503814697265625, 0.006652712821960449, 0.007055044174194336, 0.007457375526428223, 0.00785970687866211, 0.008262038230895996, 0.008664369583129883, 0.00906670093536377, 0.009469032287597656, 0.009871363639831543, 0.01027369499206543, 0.010676026344299316, 0.011078357696533203, 0.01148068904876709, 0.011883020401000977, 0.012285351753234863, 0.01268768310546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 7.0, 17.0, 20.0, 28.0, 41.0, 86.0, 115.0, 182.0, 400.0, 717.0, 1593.0, 4234.0, 18008.0, 205928.0, 775805.0, 31183.0, 6254.0, 1995.0, 853.0, 432.0, 253.0, 143.0, 81.0, 57.0, 29.0, 27.0, 25.0, 12.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0267333984375, -0.025972843170166016, -0.02521228790283203, -0.024451732635498047, -0.023691177368164062, -0.022930622100830078, -0.022170066833496094, -0.02140951156616211, -0.020648956298828125, -0.01988840103149414, -0.019127845764160156, -0.018367290496826172, -0.017606735229492188, -0.016846179962158203, -0.01608562469482422, -0.015325069427490234, -0.01456451416015625, -0.013803958892822266, -0.013043403625488281, -0.012282848358154297, -0.011522293090820312, -0.010761737823486328, -0.010001182556152344, -0.00924062728881836, -0.008480072021484375, -0.007719516754150391, -0.006958961486816406, -0.006198406219482422, -0.0054378509521484375, -0.004677295684814453, -0.003916740417480469, -0.0031561851501464844, -0.0023956298828125, -0.0016350746154785156, -0.0008745193481445312, -0.00011396408081054688, 0.0006465911865234375, 0.0014071464538574219, 0.0021677017211914062, 0.0029282569885253906, 0.003688812255859375, 0.004449367523193359, 0.005209922790527344, 0.005970478057861328, 0.0067310333251953125, 0.007491588592529297, 0.008252143859863281, 0.009012699127197266, 0.00977325439453125, 0.010533809661865234, 0.011294364929199219, 0.012054920196533203, 0.012815475463867188, 0.013576030731201172, 0.014336585998535156, 0.01509714126586914, 0.015857696533203125, 0.01661825180053711, 0.017378807067871094, 0.018139362335205078, 0.018899917602539062, 0.019660472869873047, 0.02042102813720703, 0.021181583404541016, 0.021942138671875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 7.0, 2.0, 2.0, 2.0, 2.0, 10.0, 3.0, 3.0, 10.0, 12.0, 19.0, 15.0, 30.0, 42.0, 84.0, 73.0, 86.0, 103.0, 106.0, 149.0, 72.0, 56.0, 32.0, 32.0, 11.0, 9.0, 11.0, 4.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-5.245208740234375e-06, -5.112960934638977e-06, -4.980713129043579e-06, -4.848465323448181e-06, -4.716217517852783e-06, -4.583969712257385e-06, -4.451721906661987e-06, -4.319474101066589e-06, -4.187226295471191e-06, -4.0549784898757935e-06, -3.9227306842803955e-06, -3.7904828786849976e-06, -3.6582350730895996e-06, -3.5259872674942017e-06, -3.3937394618988037e-06, -3.2614916563034058e-06, -3.129243850708008e-06, -2.99699604511261e-06, -2.864748239517212e-06, -2.732500433921814e-06, -2.600252628326416e-06, -2.468004822731018e-06, -2.33575701713562e-06, -2.203509211540222e-06, -2.0712614059448242e-06, -1.9390136003494263e-06, -1.8067657947540283e-06, -1.6745179891586304e-06, -1.5422701835632324e-06, -1.4100223779678345e-06, -1.2777745723724365e-06, -1.1455267667770386e-06, -1.0132789611816406e-06, -8.810311555862427e-07, -7.487833499908447e-07, -6.165355443954468e-07, -4.842877388000488e-07, -3.520399332046509e-07, -2.1979212760925293e-07, -8.754432201385498e-08, 4.470348358154297e-08, 1.7695128917694092e-07, 3.0919909477233887e-07, 4.414469003677368e-07, 5.736947059631348e-07, 7.059425115585327e-07, 8.381903171539307e-07, 9.704381227493286e-07, 1.1026859283447266e-06, 1.2349337339401245e-06, 1.3671815395355225e-06, 1.4994293451309204e-06, 1.6316771507263184e-06, 1.7639249563217163e-06, 1.8961727619171143e-06, 2.028420567512512e-06, 2.16066837310791e-06, 2.292916178703308e-06, 2.425163984298706e-06, 2.557411789894104e-06, 2.689659595489502e-06, 2.8219074010849e-06, 2.954155206680298e-06, 3.086403012275696e-06, 3.2186508178710938e-06]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 6.0, 11.0, 18.0, 38.0, 39.0, 95.0, 134.0, 307.0, 540.0, 1126.0, 2572.0, 6401.0, 32995.0, 864256.0, 122232.0, 11079.0, 3560.0, 1590.0, 747.0, 362.0, 188.0, 93.0, 64.0, 27.0, 17.0, 13.0, 12.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018280029296875, -0.017721176147460938, -0.017162322998046875, -0.016603469848632812, -0.01604461669921875, -0.015485763549804688, -0.014926910400390625, -0.014368057250976562, -0.0138092041015625, -0.013250350952148438, -0.012691497802734375, -0.012132644653320312, -0.01157379150390625, -0.011014938354492188, -0.010456085205078125, -0.009897232055664062, -0.00933837890625, -0.008779525756835938, -0.008220672607421875, -0.0076618194580078125, -0.00710296630859375, -0.0065441131591796875, -0.005985260009765625, -0.0054264068603515625, -0.0048675537109375, -0.0043087005615234375, -0.003749847412109375, -0.0031909942626953125, -0.00263214111328125, -0.0020732879638671875, -0.001514434814453125, -0.0009555816650390625, -0.000396728515625, 0.0001621246337890625, 0.000720977783203125, 0.0012798309326171875, 0.00183868408203125, 0.0023975372314453125, 0.002956390380859375, 0.0035152435302734375, 0.0040740966796875, 0.0046329498291015625, 0.005191802978515625, 0.0057506561279296875, 0.00630950927734375, 0.0068683624267578125, 0.007427215576171875, 0.007986068725585938, 0.008544921875, 0.009103775024414062, 0.009662628173828125, 0.010221481323242188, 0.01078033447265625, 0.011339187622070312, 0.011898040771484375, 0.012456893920898438, 0.0130157470703125, 0.013574600219726562, 0.014133453369140625, 0.014692306518554688, 0.01525115966796875, 0.015810012817382812, 0.016368865966796875, 0.016927719116210938, 0.017486572265625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 8.0, 13.0, 37.0, 78.0, 105.0, 200.0, 232.0, 140.0, 71.0, 35.0, 20.0, 15.0, 8.0, 6.0, 2.0, 4.0, 8.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007427215576171875, -0.0071814656257629395, -0.006935715675354004, -0.006689965724945068, -0.006444215774536133, -0.006198465824127197, -0.005952715873718262, -0.005706965923309326, -0.005461215972900391, -0.005215466022491455, -0.0049697160720825195, -0.004723966121673584, -0.0044782161712646484, -0.004232466220855713, -0.003986716270446777, -0.003740966320037842, -0.0034952163696289062, -0.0032494664192199707, -0.003003716468811035, -0.0027579665184020996, -0.002512216567993164, -0.0022664666175842285, -0.002020716667175293, -0.0017749667167663574, -0.0015292167663574219, -0.0012834668159484863, -0.0010377168655395508, -0.0007919669151306152, -0.0005462169647216797, -0.00030046701431274414, -5.4717063903808594e-05, 0.00019103288650512695, 0.0004367828369140625, 0.000682532787322998, 0.0009282827377319336, 0.0011740326881408691, 0.0014197826385498047, 0.0016655325889587402, 0.0019112825393676758, 0.0021570324897766113, 0.002402782440185547, 0.0026485323905944824, 0.002894282341003418, 0.0031400322914123535, 0.003385782241821289, 0.0036315321922302246, 0.00387728214263916, 0.004123032093048096, 0.004368782043457031, 0.004614531993865967, 0.004860281944274902, 0.005106031894683838, 0.0053517818450927734, 0.005597531795501709, 0.0058432817459106445, 0.00608903169631958, 0.006334781646728516, 0.006580531597137451, 0.006826281547546387, 0.007072031497955322, 0.007317781448364258, 0.007563531398773193, 0.007809281349182129, 0.008055031299591064, 0.00830078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 19.0, 170.0, 684.0, 126.0, 13.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23933587968349457, -0.2286563217639923, -0.21797674894332886, -0.2072971910238266, -0.19661763310432434, -0.1859380602836609, -0.17525850236415863, -0.16457894444465637, -0.15389937162399292, -0.14321981370449066, -0.1325402408838272, -0.12186068296432495, -0.11118112504482269, -0.10050155967473984, -0.08982199430465698, -0.07914243638515472, -0.06846287846565247, -0.05778331682085991, -0.04710375517606735, -0.0364241898059845, -0.02574462816119194, -0.015065066516399384, -0.004385501146316528, 0.00629405677318573, 0.016973622143268585, 0.027653183788061142, 0.0383327454328537, 0.049012310802936554, 0.05969187244772911, 0.07037143409252167, 0.08105099946260452, 0.09173055738210678, 0.10241010785102844, 0.1130896732211113, 0.12376923114061356, 0.1344487965106964, 0.14512835443019867, 0.15580791234970093, 0.16648748517036438, 0.17716704308986664, 0.1878466010093689, 0.19852615892887115, 0.2092057317495346, 0.21988528966903687, 0.23056484758853912, 0.24124440550804138, 0.25192397832870483, 0.2626035213470459, 0.27328312397003174, 0.2839626967906952, 0.29464223980903625, 0.3053218126296997, 0.31600138545036316, 0.3266809284687042, 0.3373605012893677, 0.34804004430770874, 0.3587196171283722, 0.36939918994903564, 0.3800787329673767, 0.39075830578804016, 0.4014378786087036, 0.4121174216270447, 0.42279699444770813, 0.4334765672683716, 0.44415611028671265]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 2.0, 1.0, 6.0, 11.0, 8.0, 13.0, 12.0, 11.0, 17.0, 13.0, 22.0, 23.0, 28.0, 29.0, 33.0, 35.0, 32.0, 32.0, 31.0, 36.0, 31.0, 41.0, 54.0, 41.0, 43.0, 50.0, 37.0, 36.0, 36.0, 22.0, 28.0, 24.0, 29.0, 15.0, 29.0, 19.0, 10.0, 6.0, 16.0, 8.0, 5.0, 7.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.03566277027130127, -0.03454548120498657, -0.033428192138671875, -0.03231090307235718, -0.03119361400604248, -0.030076324939727783, -0.028959035873413086, -0.02784174680709839, -0.02672445774078369, -0.025607168674468994, -0.024489879608154297, -0.0233725905418396, -0.022255301475524902, -0.021138012409210205, -0.020020723342895508, -0.01890343427658081, -0.017786145210266113, -0.016668856143951416, -0.015551567077636719, -0.014434278011322021, -0.013316988945007324, -0.012199699878692627, -0.01108241081237793, -0.009965121746063232, -0.008847832679748535, -0.007730543613433838, -0.006613254547119141, -0.005495965480804443, -0.004378676414489746, -0.003261387348175049, -0.0021440982818603516, -0.0010268092155456543, 9.047985076904297e-05, 0.0012077689170837402, 0.0023250579833984375, 0.0034423470497131348, 0.004559636116027832, 0.005676925182342529, 0.0067942142486572266, 0.007911503314971924, 0.009028792381286621, 0.010146081447601318, 0.011263370513916016, 0.012380659580230713, 0.01349794864654541, 0.014615237712860107, 0.015732526779174805, 0.016849815845489502, 0.0179671049118042, 0.019084393978118896, 0.020201683044433594, 0.02131897211074829, 0.02243626117706299, 0.023553550243377686, 0.024670839309692383, 0.02578812837600708, 0.026905417442321777, 0.028022706508636475, 0.029139995574951172, 0.03025728464126587, 0.031374573707580566, 0.032491862773895264, 0.03360915184020996, 0.03472644090652466, 0.035843729972839355]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 11.0, 8.0, 7.0, 14.0, 16.0, 22.0, 42.0, 59.0, 98.0, 161.0, 237.0, 414.0, 729.0, 1267.0, 2410.0, 4810.0, 10917.0, 27505.0, 96584.0, 1004121.0, 2729785.0, 234677.0, 47772.0, 17071.0, 7488.0, 3569.0, 1909.0, 1016.0, 578.0, 355.0, 205.0, 136.0, 102.0, 59.0, 49.0, 20.0, 18.0, 15.0, 8.0, 6.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01474761962890625, -0.014243245124816895, -0.013738870620727539, -0.013234496116638184, -0.012730121612548828, -0.012225747108459473, -0.011721372604370117, -0.011216998100280762, -0.010712623596191406, -0.01020824909210205, -0.009703874588012695, -0.00919950008392334, -0.008695125579833984, -0.008190751075744629, -0.0076863765716552734, -0.007182002067565918, -0.0066776275634765625, -0.006173253059387207, -0.0056688785552978516, -0.005164504051208496, -0.004660129547119141, -0.004155755043029785, -0.0036513805389404297, -0.0031470060348510742, -0.0026426315307617188, -0.0021382570266723633, -0.0016338825225830078, -0.0011295080184936523, -0.0006251335144042969, -0.0001207590103149414, 0.00038361549377441406, 0.0008879899978637695, 0.001392364501953125, 0.0018967390060424805, 0.002401113510131836, 0.0029054880142211914, 0.003409862518310547, 0.003914237022399902, 0.004418611526489258, 0.004922986030578613, 0.005427360534667969, 0.005931735038757324, 0.00643610954284668, 0.006940484046936035, 0.007444858551025391, 0.007949233055114746, 0.008453607559204102, 0.008957982063293457, 0.009462356567382812, 0.009966731071472168, 0.010471105575561523, 0.010975480079650879, 0.011479854583740234, 0.01198422908782959, 0.012488603591918945, 0.0129929780960083, 0.013497352600097656, 0.014001727104187012, 0.014506101608276367, 0.015010476112365723, 0.015514850616455078, 0.016019225120544434, 0.01652359962463379, 0.017027974128723145, 0.0175323486328125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 11.0, 6.0, 18.0, 16.0, 14.0, 20.0, 24.0, 33.0, 33.0, 40.0, 45.0, 55.0, 69.0, 57.0, 71.0, 61.0, 57.0, 56.0, 51.0, 36.0, 45.0, 39.0, 21.0, 34.0, 19.0, 18.0, 18.0, 11.0, 9.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0079498291015625, -0.007722735404968262, -0.0074956417083740234, -0.007268548011779785, -0.007041454315185547, -0.006814360618591309, -0.00658726692199707, -0.006360173225402832, -0.006133079528808594, -0.0059059858322143555, -0.005678892135620117, -0.005451798439025879, -0.005224704742431641, -0.004997611045837402, -0.004770517349243164, -0.004543423652648926, -0.0043163299560546875, -0.004089236259460449, -0.003862142562866211, -0.0036350488662719727, -0.0034079551696777344, -0.003180861473083496, -0.002953767776489258, -0.0027266740798950195, -0.0024995803833007812, -0.002272486686706543, -0.0020453929901123047, -0.0018182992935180664, -0.0015912055969238281, -0.0013641119003295898, -0.0011370182037353516, -0.0009099245071411133, -0.000682830810546875, -0.0004557371139526367, -0.00022864341735839844, -1.5497207641601562e-06, 0.00022554397583007812, 0.0004526376724243164, 0.0006797313690185547, 0.000906825065612793, 0.0011339187622070312, 0.0013610124588012695, 0.0015881061553955078, 0.001815199851989746, 0.0020422935485839844, 0.0022693872451782227, 0.002496480941772461, 0.0027235746383666992, 0.0029506683349609375, 0.0031777620315551758, 0.003404855728149414, 0.0036319494247436523, 0.0038590431213378906, 0.004086136817932129, 0.004313230514526367, 0.0045403242111206055, 0.004767417907714844, 0.004994511604309082, 0.00522160530090332, 0.005448698997497559, 0.005675792694091797, 0.005902886390686035, 0.0061299800872802734, 0.006357073783874512, 0.00658416748046875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 7.0, 7.0, 14.0, 16.0, 28.0, 53.0, 84.0, 124.0, 184.0, 488.0, 1827.0, 19324.0, 1340905.0, 2803606.0, 24492.0, 2075.0, 495.0, 216.0, 142.0, 66.0, 46.0, 31.0, 22.0, 18.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03656005859375, -0.03453350067138672, -0.03250694274902344, -0.030480384826660156, -0.028453826904296875, -0.026427268981933594, -0.024400711059570312, -0.02237415313720703, -0.02034759521484375, -0.01832103729248047, -0.016294479370117188, -0.014267921447753906, -0.012241363525390625, -0.010214805603027344, -0.008188247680664062, -0.006161689758300781, -0.0041351318359375, -0.0021085739135742188, -8.20159912109375e-05, 0.0019445419311523438, 0.003971099853515625, 0.005997657775878906, 0.008024215698242188, 0.010050773620605469, 0.01207733154296875, 0.014103889465332031, 0.016130447387695312, 0.018157005310058594, 0.020183563232421875, 0.022210121154785156, 0.024236679077148438, 0.02626323699951172, 0.028289794921875, 0.03031635284423828, 0.03234291076660156, 0.034369468688964844, 0.036396026611328125, 0.038422584533691406, 0.04044914245605469, 0.04247570037841797, 0.04450225830078125, 0.04652881622314453, 0.04855537414550781, 0.050581932067871094, 0.052608489990234375, 0.054635047912597656, 0.05666160583496094, 0.05868816375732422, 0.0607147216796875, 0.06274127960205078, 0.06476783752441406, 0.06679439544677734, 0.06882095336914062, 0.0708475112915039, 0.07287406921386719, 0.07490062713623047, 0.07692718505859375, 0.07895374298095703, 0.08098030090332031, 0.0830068588256836, 0.08503341674804688, 0.08705997467041016, 0.08908653259277344, 0.09111309051513672, 0.0931396484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 10.0, 7.0, 13.0, 19.0, 34.0, 48.0, 47.0, 91.0, 128.0, 179.0, 326.0, 733.0, 1081.0, 582.0, 252.0, 174.0, 105.0, 75.0, 62.0, 38.0, 32.0, 15.0, 13.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025909423828125, -0.025234222412109375, -0.02455902099609375, -0.023883819580078125, -0.0232086181640625, -0.022533416748046875, -0.02185821533203125, -0.021183013916015625, -0.0205078125, -0.019832611083984375, -0.01915740966796875, -0.018482208251953125, -0.0178070068359375, -0.017131805419921875, -0.01645660400390625, -0.015781402587890625, -0.015106201171875, -0.014430999755859375, -0.01375579833984375, -0.013080596923828125, -0.0124053955078125, -0.011730194091796875, -0.01105499267578125, -0.010379791259765625, -0.00970458984375, -0.009029388427734375, -0.00835418701171875, -0.007678985595703125, -0.0070037841796875, -0.006328582763671875, -0.00565338134765625, -0.004978179931640625, -0.004302978515625, -0.003627777099609375, -0.00295257568359375, -0.002277374267578125, -0.0016021728515625, -0.000926971435546875, -0.00025177001953125, 0.000423431396484375, 0.0010986328125, 0.001773834228515625, 0.00244903564453125, 0.003124237060546875, 0.0037994384765625, 0.004474639892578125, 0.00514984130859375, 0.005825042724609375, 0.006500244140625, 0.007175445556640625, 0.00785064697265625, 0.008525848388671875, 0.0092010498046875, 0.009876251220703125, 0.01055145263671875, 0.011226654052734375, 0.01190185546875, 0.012577056884765625, 0.01325225830078125, 0.013927459716796875, 0.0146026611328125, 0.015277862548828125, 0.01595306396484375, 0.016628265380859375, 0.017303466796875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 10.0, 22.0, 52.0, 121.0, 324.0, 292.0, 120.0, 35.0, 13.0, 12.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13081800937652588, -0.12510137259960175, -0.11938472837209702, -0.11366809159517288, -0.10795144736766815, -0.10223481059074402, -0.09651817381381989, -0.09080152958631516, -0.08508488535881042, -0.07936824858188629, -0.07365160435438156, -0.06793496757745743, -0.0622183233499527, -0.056501686573028564, -0.05078504607081413, -0.0450684055685997, -0.03935176879167557, -0.033635128289461136, -0.027918487787246704, -0.02220184914767742, -0.01648520864546299, -0.010768568143248558, -0.0050519295036792755, 0.0006647109985351562, 0.006381351500749588, 0.01209799200296402, 0.01781463250517845, 0.023531271144747734, 0.029247911646962166, 0.03496455401182175, 0.04068119078874588, 0.04639783129096031, 0.052114471793174744, 0.057831112295389175, 0.06354775279760361, 0.06926438957452774, 0.07498103380203247, 0.0806976705789566, 0.08641430735588074, 0.09213095158338547, 0.0978475958108902, 0.10356423258781433, 0.10928087681531906, 0.1149975135922432, 0.12071415781974792, 0.12643079459667206, 0.1321474313735962, 0.13786408305168152, 0.14358070492744446, 0.1492973417043686, 0.15501397848129272, 0.16073063015937805, 0.16644726693630219, 0.17216390371322632, 0.17788054049015045, 0.18359717726707458, 0.1893138289451599, 0.19503046572208405, 0.20074710249900818, 0.2064637541770935, 0.21218039095401764, 0.21789702773094177, 0.2236136645078659, 0.22933030128479004, 0.23504695296287537]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 9.0, 7.0, 10.0, 12.0, 15.0, 12.0, 21.0, 25.0, 16.0, 28.0, 39.0, 41.0, 40.0, 42.0, 49.0, 54.0, 56.0, 42.0, 49.0, 43.0, 39.0, 40.0, 36.0, 39.0, 36.0, 30.0, 40.0, 31.0, 15.0, 19.0, 14.0, 7.0, 9.0, 6.0, 4.0, 6.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.05793541669845581, -0.056287892162799835, -0.05464036762714386, -0.052992839366197586, -0.05134531483054161, -0.049697790294885635, -0.04805026203393936, -0.046402737498283386, -0.04475521296262741, -0.043107688426971436, -0.04146016389131546, -0.039812635630369186, -0.03816511109471321, -0.036517586559057236, -0.03487005829811096, -0.03322253376245499, -0.03157500922679901, -0.029927484691143036, -0.02827995829284191, -0.026632431894540787, -0.02498490735888481, -0.023337382823228836, -0.02168985642492771, -0.020042330026626587, -0.01839480549097061, -0.016747280955314636, -0.015099754557013512, -0.013452229090034962, -0.011804703623056412, -0.010157178156077862, -0.008509652689099312, -0.006862127222120762, -0.005214601755142212, -0.003567076288163662, -0.001919550821185112, -0.00027202535420656204, 0.001375500112771988, 0.003023025579750538, 0.004670551046729088, 0.006318076513707638, 0.007965601980686188, 0.009613127447664738, 0.011260652914643288, 0.012908178381621838, 0.014555703848600388, 0.016203228384256363, 0.017850754782557487, 0.019498281180858612, 0.021145805716514587, 0.022793330252170563, 0.024440856650471687, 0.026088383048772812, 0.027735907584428787, 0.029383432120084763, 0.031030958518385887, 0.03267848491668701, 0.03432600945234299, 0.03597353398799896, 0.03762105852365494, 0.03926858678460121, 0.04091611132025719, 0.04256363585591316, 0.044211164116859436, 0.04585868865251541, 0.04750621318817139]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 16.0, 13.0, 16.0, 39.0, 58.0, 91.0, 155.0, 248.0, 383.0, 779.0, 1592.0, 3159.0, 6775.0, 15650.0, 38561.0, 106941.0, 383941.0, 334582.0, 94483.0, 34501.0, 14283.0, 6349.0, 2819.0, 1381.0, 748.0, 386.0, 233.0, 143.0, 77.0, 53.0, 36.0, 16.0, 17.0, 12.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0270233154296875, -0.026149988174438477, -0.025276660919189453, -0.02440333366394043, -0.023530006408691406, -0.022656679153442383, -0.02178335189819336, -0.020910024642944336, -0.020036697387695312, -0.01916337013244629, -0.018290042877197266, -0.017416715621948242, -0.01654338836669922, -0.015670061111450195, -0.014796733856201172, -0.013923406600952148, -0.013050079345703125, -0.012176752090454102, -0.011303424835205078, -0.010430097579956055, -0.009556770324707031, -0.008683443069458008, -0.007810115814208984, -0.006936788558959961, -0.0060634613037109375, -0.005190134048461914, -0.004316806793212891, -0.003443479537963867, -0.0025701522827148438, -0.0016968250274658203, -0.0008234977722167969, 4.982948303222656e-05, 0.00092315673828125, 0.0017964839935302734, 0.002669811248779297, 0.0035431385040283203, 0.004416465759277344, 0.005289793014526367, 0.006163120269775391, 0.007036447525024414, 0.007909774780273438, 0.008783102035522461, 0.009656429290771484, 0.010529756546020508, 0.011403083801269531, 0.012276411056518555, 0.013149738311767578, 0.014023065567016602, 0.014896392822265625, 0.01576972007751465, 0.016643047332763672, 0.017516374588012695, 0.01838970184326172, 0.019263029098510742, 0.020136356353759766, 0.02100968360900879, 0.021883010864257812, 0.022756338119506836, 0.02362966537475586, 0.024502992630004883, 0.025376319885253906, 0.02624964714050293, 0.027122974395751953, 0.027996301651000977, 0.02886962890625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 4.0, 7.0, 11.0, 11.0, 19.0, 13.0, 18.0, 36.0, 36.0, 44.0, 57.0, 60.0, 61.0, 64.0, 71.0, 47.0, 73.0, 63.0, 60.0, 41.0, 48.0, 31.0, 33.0, 21.0, 24.0, 19.0, 13.0, 6.0, 5.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007427215576171875, -0.007202744483947754, -0.006978273391723633, -0.006753802299499512, -0.006529331207275391, -0.0063048601150512695, -0.0060803890228271484, -0.005855917930603027, -0.005631446838378906, -0.005406975746154785, -0.005182504653930664, -0.004958033561706543, -0.004733562469482422, -0.004509091377258301, -0.00428462028503418, -0.004060149192810059, -0.0038356781005859375, -0.0036112070083618164, -0.0033867359161376953, -0.0031622648239135742, -0.002937793731689453, -0.002713322639465332, -0.002488851547241211, -0.00226438045501709, -0.0020399093627929688, -0.0018154382705688477, -0.0015909671783447266, -0.0013664960861206055, -0.0011420249938964844, -0.0009175539016723633, -0.0006930828094482422, -0.0004686117172241211, -0.000244140625, -1.9669532775878906e-05, 0.0002048015594482422, 0.0004292726516723633, 0.0006537437438964844, 0.0008782148361206055, 0.0011026859283447266, 0.0013271570205688477, 0.0015516281127929688, 0.0017760992050170898, 0.002000570297241211, 0.002225041389465332, 0.002449512481689453, 0.0026739835739135742, 0.0028984546661376953, 0.0031229257583618164, 0.0033473968505859375, 0.0035718679428100586, 0.0037963390350341797, 0.004020810127258301, 0.004245281219482422, 0.004469752311706543, 0.004694223403930664, 0.004918694496154785, 0.005143165588378906, 0.005367636680603027, 0.0055921077728271484, 0.0058165788650512695, 0.006041049957275391, 0.006265521049499512, 0.006489992141723633, 0.006714463233947754, 0.006938934326171875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 9.0, 10.0, 16.0, 15.0, 14.0, 21.0, 33.0, 57.0, 89.0, 141.0, 198.0, 301.0, 490.0, 907.0, 1548.0, 3044.0, 6024.0, 13419.0, 30848.0, 80763.0, 265501.0, 430952.0, 131158.0, 46417.0, 18908.0, 8543.0, 4175.0, 2091.0, 1140.0, 640.0, 363.0, 248.0, 144.0, 105.0, 68.0, 40.0, 36.0, 27.0, 11.0, 12.0, 11.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022613525390625, -0.021889209747314453, -0.021164894104003906, -0.02044057846069336, -0.019716262817382812, -0.018991947174072266, -0.01826763153076172, -0.017543315887451172, -0.016819000244140625, -0.016094684600830078, -0.015370368957519531, -0.014646053314208984, -0.013921737670898438, -0.01319742202758789, -0.012473106384277344, -0.011748790740966797, -0.01102447509765625, -0.010300159454345703, -0.009575843811035156, -0.00885152816772461, -0.008127212524414062, -0.007402896881103516, -0.006678581237792969, -0.005954265594482422, -0.005229949951171875, -0.004505634307861328, -0.0037813186645507812, -0.0030570030212402344, -0.0023326873779296875, -0.0016083717346191406, -0.0008840560913085938, -0.00015974044799804688, 0.0005645751953125, 0.0012888908386230469, 0.0020132064819335938, 0.0027375221252441406, 0.0034618377685546875, 0.004186153411865234, 0.004910469055175781, 0.005634784698486328, 0.006359100341796875, 0.007083415985107422, 0.007807731628417969, 0.008532047271728516, 0.009256362915039062, 0.00998067855834961, 0.010704994201660156, 0.011429309844970703, 0.01215362548828125, 0.012877941131591797, 0.013602256774902344, 0.01432657241821289, 0.015050888061523438, 0.015775203704833984, 0.01649951934814453, 0.017223834991455078, 0.017948150634765625, 0.018672466278076172, 0.01939678192138672, 0.020121097564697266, 0.020845413208007812, 0.02156972885131836, 0.022294044494628906, 0.023018360137939453, 0.02374267578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 2.0, 3.0, 6.0, 8.0, 12.0, 9.0, 14.0, 16.0, 10.0, 21.0, 13.0, 27.0, 20.0, 30.0, 31.0, 24.0, 38.0, 40.0, 41.0, 44.0, 40.0, 35.0, 33.0, 33.0, 36.0, 48.0, 35.0, 34.0, 35.0, 24.0, 28.0, 28.0, 15.0, 25.0, 29.0, 15.0, 20.0, 15.0, 15.0, 6.0, 6.0, 5.0, 3.0, 8.0, 4.0, 3.0, 4.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.010528564453125, -0.010172128677368164, -0.009815692901611328, -0.009459257125854492, -0.009102821350097656, -0.00874638557434082, -0.008389949798583984, -0.008033514022827148, -0.0076770782470703125, -0.0073206424713134766, -0.006964206695556641, -0.006607770919799805, -0.006251335144042969, -0.005894899368286133, -0.005538463592529297, -0.005182027816772461, -0.004825592041015625, -0.004469156265258789, -0.004112720489501953, -0.003756284713745117, -0.0033998489379882812, -0.0030434131622314453, -0.0026869773864746094, -0.0023305416107177734, -0.0019741058349609375, -0.0016176700592041016, -0.0012612342834472656, -0.0009047985076904297, -0.0005483627319335938, -0.0001919269561767578, 0.00016450881958007812, 0.0005209445953369141, 0.00087738037109375, 0.001233816146850586, 0.0015902519226074219, 0.0019466876983642578, 0.0023031234741210938, 0.0026595592498779297, 0.0030159950256347656, 0.0033724308013916016, 0.0037288665771484375, 0.0040853023529052734, 0.004441738128662109, 0.004798173904418945, 0.005154609680175781, 0.005511045455932617, 0.005867481231689453, 0.006223917007446289, 0.006580352783203125, 0.006936788558959961, 0.007293224334716797, 0.007649660110473633, 0.008006095886230469, 0.008362531661987305, 0.00871896743774414, 0.009075403213500977, 0.009431838989257812, 0.009788274765014648, 0.010144710540771484, 0.01050114631652832, 0.010857582092285156, 0.011214017868041992, 0.011570453643798828, 0.011926889419555664, 0.0122833251953125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 4.0, 11.0, 13.0, 17.0, 27.0, 29.0, 34.0, 52.0, 97.0, 111.0, 173.0, 316.0, 475.0, 843.0, 1624.0, 3351.0, 9110.0, 62663.0, 846230.0, 103208.0, 12215.0, 3785.0, 1694.0, 894.0, 570.0, 325.0, 230.0, 142.0, 90.0, 55.0, 47.0, 34.0, 25.0, 16.0, 15.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.019317626953125, -0.018706083297729492, -0.018094539642333984, -0.017482995986938477, -0.01687145233154297, -0.01625990867614746, -0.015648365020751953, -0.015036821365356445, -0.014425277709960938, -0.01381373405456543, -0.013202190399169922, -0.012590646743774414, -0.011979103088378906, -0.011367559432983398, -0.01075601577758789, -0.010144472122192383, -0.009532928466796875, -0.008921384811401367, -0.00830984115600586, -0.0076982975006103516, -0.007086753845214844, -0.006475210189819336, -0.005863666534423828, -0.00525212287902832, -0.0046405792236328125, -0.004029035568237305, -0.003417491912841797, -0.002805948257446289, -0.0021944046020507812, -0.0015828609466552734, -0.0009713172912597656, -0.0003597736358642578, 0.00025177001953125, 0.0008633136749267578, 0.0014748573303222656, 0.0020864009857177734, 0.0026979446411132812, 0.003309488296508789, 0.003921031951904297, 0.004532575607299805, 0.0051441192626953125, 0.00575566291809082, 0.006367206573486328, 0.006978750228881836, 0.007590293884277344, 0.008201837539672852, 0.00881338119506836, 0.009424924850463867, 0.010036468505859375, 0.010648012161254883, 0.01125955581665039, 0.011871099472045898, 0.012482643127441406, 0.013094186782836914, 0.013705730438232422, 0.01431727409362793, 0.014928817749023438, 0.015540361404418945, 0.016151905059814453, 0.01676344871520996, 0.01737499237060547, 0.017986536026000977, 0.018598079681396484, 0.019209623336791992, 0.0198211669921875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 12.0, 38.0, 105.0, 235.0, 288.0, 184.0, 77.0, 29.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.000301361083984e-06, -8.692964911460876e-06, -8.385628461837769e-06, -8.07829201221466e-06, -7.770955562591553e-06, -7.463619112968445e-06, -7.156282663345337e-06, -6.848946213722229e-06, -6.541609764099121e-06, -6.234273314476013e-06, -5.926936864852905e-06, -5.619600415229797e-06, -5.3122639656066895e-06, -5.0049275159835815e-06, -4.697591066360474e-06, -4.390254616737366e-06, -4.082918167114258e-06, -3.77558171749115e-06, -3.468245267868042e-06, -3.160908818244934e-06, -2.853572368621826e-06, -2.5462359189987183e-06, -2.2388994693756104e-06, -1.9315630197525024e-06, -1.6242265701293945e-06, -1.3168901205062866e-06, -1.0095536708831787e-06, -7.022172212600708e-07, -3.948807716369629e-07, -8.754432201385498e-08, 2.1979212760925293e-07, 5.271285772323608e-07, 8.344650268554688e-07, 1.1418014764785767e-06, 1.4491379261016846e-06, 1.7564743757247925e-06, 2.0638108253479004e-06, 2.3711472749710083e-06, 2.678483724594116e-06, 2.985820174217224e-06, 3.293156623840332e-06, 3.60049307346344e-06, 3.907829523086548e-06, 4.215165972709656e-06, 4.522502422332764e-06, 4.829838871955872e-06, 5.1371753215789795e-06, 5.444511771202087e-06, 5.751848220825195e-06, 6.059184670448303e-06, 6.366521120071411e-06, 6.673857569694519e-06, 6.981194019317627e-06, 7.288530468940735e-06, 7.595866918563843e-06, 7.90320336818695e-06, 8.210539817810059e-06, 8.517876267433167e-06, 8.825212717056274e-06, 9.132549166679382e-06, 9.43988561630249e-06, 9.747222065925598e-06, 1.0054558515548706e-05, 1.0361894965171814e-05, 1.0669231414794922e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 3.0, 11.0, 12.0, 23.0, 24.0, 32.0, 75.0, 86.0, 190.0, 271.0, 430.0, 828.0, 1561.0, 3370.0, 7832.0, 19885.0, 61862.0, 331205.0, 489452.0, 86979.0, 25956.0, 9883.0, 4227.0, 1933.0, 1008.0, 559.0, 312.0, 190.0, 102.0, 77.0, 61.0, 40.0, 21.0, 16.0, 17.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0080108642578125, -0.007744908332824707, -0.007478952407836914, -0.007212996482849121, -0.006947040557861328, -0.006681084632873535, -0.006415128707885742, -0.006149172782897949, -0.005883216857910156, -0.005617260932922363, -0.00535130500793457, -0.005085349082946777, -0.004819393157958984, -0.004553437232971191, -0.0042874813079833984, -0.0040215253829956055, -0.0037555694580078125, -0.0034896135330200195, -0.0032236576080322266, -0.0029577016830444336, -0.0026917457580566406, -0.0024257898330688477, -0.0021598339080810547, -0.0018938779830932617, -0.0016279220581054688, -0.0013619661331176758, -0.0010960102081298828, -0.0008300542831420898, -0.0005640983581542969, -0.0002981424331665039, -3.218650817871094e-05, 0.00023376941680908203, 0.000499725341796875, 0.000765681266784668, 0.001031637191772461, 0.001297593116760254, 0.0015635490417480469, 0.0018295049667358398, 0.002095460891723633, 0.0023614168167114258, 0.0026273727416992188, 0.0028933286666870117, 0.0031592845916748047, 0.0034252405166625977, 0.0036911964416503906, 0.003957152366638184, 0.0042231082916259766, 0.0044890642166137695, 0.0047550201416015625, 0.0050209760665893555, 0.0052869319915771484, 0.005552887916564941, 0.005818843841552734, 0.006084799766540527, 0.00635075569152832, 0.006616711616516113, 0.006882667541503906, 0.007148623466491699, 0.007414579391479492, 0.007680535316467285, 0.007946491241455078, 0.008212447166442871, 0.008478403091430664, 0.008744359016418457, 0.00901031494140625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 5.0, 9.0, 12.0, 11.0, 15.0, 24.0, 22.0, 27.0, 31.0, 44.0, 52.0, 77.0, 92.0, 122.0, 83.0, 89.0, 60.0, 53.0, 29.0, 38.0, 19.0, 18.0, 15.0, 8.0, 12.0, 9.0, 2.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0055389404296875, -0.005392670631408691, -0.005246400833129883, -0.005100131034851074, -0.004953861236572266, -0.004807591438293457, -0.0046613216400146484, -0.00451505184173584, -0.004368782043457031, -0.004222512245178223, -0.004076242446899414, -0.0039299726486206055, -0.003783702850341797, -0.0036374330520629883, -0.0034911632537841797, -0.003344893455505371, -0.0031986236572265625, -0.003052353858947754, -0.0029060840606689453, -0.0027598142623901367, -0.002613544464111328, -0.0024672746658325195, -0.002321004867553711, -0.0021747350692749023, -0.0020284652709960938, -0.0018821954727172852, -0.0017359256744384766, -0.001589655876159668, -0.0014433860778808594, -0.0012971162796020508, -0.0011508464813232422, -0.0010045766830444336, -0.000858306884765625, -0.0007120370864868164, -0.0005657672882080078, -0.0004194974899291992, -0.0002732276916503906, -0.00012695789337158203, 1.9311904907226562e-05, 0.00016558170318603516, 0.00031185150146484375, 0.00045812129974365234, 0.0006043910980224609, 0.0007506608963012695, 0.0008969306945800781, 0.0010432004928588867, 0.0011894702911376953, 0.001335740089416504, 0.0014820098876953125, 0.001628279685974121, 0.0017745494842529297, 0.0019208192825317383, 0.002067089080810547, 0.0022133588790893555, 0.002359628677368164, 0.0025058984756469727, 0.0026521682739257812, 0.00279843807220459, 0.0029447078704833984, 0.003090977668762207, 0.0032372474670410156, 0.0033835172653198242, 0.003529787063598633, 0.0036760568618774414, 0.00382232666015625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 11.0, 71.0, 526.0, 351.0, 43.0, 11.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16276349127292633, -0.15250332653522491, -0.1422431617975235, -0.13198299705982208, -0.12172283232212067, -0.11146266758441925, -0.10120249539613724, -0.09094233065843582, -0.0806821659207344, -0.07042200118303299, -0.060161836445331573, -0.04990166798233986, -0.03964150324463844, -0.029381338506937027, -0.019121170043945312, -0.008861005306243896, 0.0013991594314575195, 0.01165932510048151, 0.0219194907695055, 0.032179657369852066, 0.04243982210755348, 0.0526999868452549, 0.06296015530824661, 0.07322032004594803, 0.08348048478364944, 0.09374064952135086, 0.10400081425905228, 0.11426098644733429, 0.1245211511850357, 0.13478131592273712, 0.14504148066043854, 0.15530164539813995, 0.16556182503700256, 0.17582198977470398, 0.1860821545124054, 0.1963423192501068, 0.20660248398780823, 0.21686264872550964, 0.22712281346321106, 0.23738297820091248, 0.2476431429386139, 0.2579033076763153, 0.2681634724140167, 0.27842363715171814, 0.28868380188941956, 0.29894396662712097, 0.3092041313648224, 0.3194642961025238, 0.3297244906425476, 0.339984655380249, 0.35024482011795044, 0.36050498485565186, 0.37076514959335327, 0.3810253143310547, 0.3912854790687561, 0.4015456438064575, 0.41180580854415894, 0.42206597328186035, 0.43232613801956177, 0.4425863027572632, 0.4528464674949646, 0.463106632232666, 0.47336679697036743, 0.48362696170806885, 0.49388712644577026]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 10.0, 8.0, 7.0, 7.0, 12.0, 15.0, 18.0, 20.0, 35.0, 35.0, 38.0, 55.0, 42.0, 49.0, 60.0, 64.0, 64.0, 58.0, 61.0, 61.0, 56.0, 51.0, 39.0, 33.0, 27.0, 16.0, 21.0, 17.0, 9.0, 8.0, 3.0, 5.0, 2.0, 5.0, 2.0], "bins": [-0.07976877689361572, -0.0779941976070404, -0.07621961086988449, -0.07444503158330917, -0.07267044484615326, -0.07089586555957794, -0.06912128627300262, -0.06734669953584671, -0.06557212024927139, -0.06379754096269608, -0.06202295422554016, -0.060248374938964844, -0.05847379192709923, -0.05669920891523361, -0.054924629628658295, -0.05315004661679268, -0.05137546360492706, -0.04960088059306145, -0.04782629758119583, -0.046051718294620514, -0.0442771352827549, -0.04250255227088928, -0.040727972984313965, -0.03895338997244835, -0.03717880696058273, -0.03540422394871712, -0.0336296409368515, -0.031855061650276184, -0.030080478638410568, -0.028305895626544952, -0.026531314477324486, -0.02475673332810402, -0.022982150316238403, -0.021207567304372787, -0.01943298615515232, -0.017658405005931854, -0.01588382199406624, -0.014109239913523197, -0.012334657832980156, -0.010560075752437115, -0.008785493671894073, -0.007010911591351032, -0.005236329510807991, -0.00346174743026495, -0.0016871653497219086, 8.741673082113266e-05, 0.0018619988113641739, 0.003636580891907215, 0.005411162972450256, 0.007185745052993298, 0.008960327133536339, 0.01073490921407938, 0.012509491294622421, 0.014284073375165462, 0.016058655455708504, 0.01783323660492897, 0.019607819616794586, 0.021382402628660202, 0.02315698377788067, 0.024931564927101135, 0.02670614793896675, 0.028480730950832367, 0.030255312100052834, 0.0320298932492733, 0.033804476261138916]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 10.0, 7.0, 6.0, 12.0, 21.0, 20.0, 29.0, 29.0, 45.0, 75.0, 124.0, 269.0, 879.0, 4698.0, 61066.0, 4055837.0, 64850.0, 4744.0, 929.0, 268.0, 116.0, 64.0, 44.0, 28.0, 20.0, 22.0, 19.0, 17.0, 13.0, 9.0, 5.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055023193359375, -0.05315828323364258, -0.051293373107910156, -0.049428462982177734, -0.04756355285644531, -0.04569864273071289, -0.04383373260498047, -0.04196882247924805, -0.040103912353515625, -0.0382390022277832, -0.03637409210205078, -0.03450918197631836, -0.03264427185058594, -0.030779361724853516, -0.028914451599121094, -0.027049541473388672, -0.02518463134765625, -0.023319721221923828, -0.021454811096191406, -0.019589900970458984, -0.017724990844726562, -0.01586008071899414, -0.013995170593261719, -0.012130260467529297, -0.010265350341796875, -0.008400440216064453, -0.006535530090332031, -0.004670619964599609, -0.0028057098388671875, -0.0009407997131347656, 0.0009241104125976562, 0.002789020538330078, 0.0046539306640625, 0.006518840789794922, 0.008383750915527344, 0.010248661041259766, 0.012113571166992188, 0.01397848129272461, 0.01584339141845703, 0.017708301544189453, 0.019573211669921875, 0.021438121795654297, 0.02330303192138672, 0.02516794204711914, 0.027032852172851562, 0.028897762298583984, 0.030762672424316406, 0.03262758255004883, 0.03449249267578125, 0.03635740280151367, 0.038222312927246094, 0.040087223052978516, 0.04195213317871094, 0.04381704330444336, 0.04568195343017578, 0.0475468635559082, 0.049411773681640625, 0.05127668380737305, 0.05314159393310547, 0.05500650405883789, 0.05687141418457031, 0.058736324310302734, 0.060601234436035156, 0.06246614456176758, 0.0643310546875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 3.0, 8.0, 10.0, 17.0, 19.0, 19.0, 23.0, 35.0, 45.0, 37.0, 47.0, 50.0, 67.0, 80.0, 66.0, 64.0, 51.0, 61.0, 60.0, 36.0, 44.0, 32.0, 29.0, 22.0, 20.0, 19.0, 13.0, 11.0, 3.0, 5.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0074310302734375, -0.0072040557861328125, -0.006977081298828125, -0.0067501068115234375, -0.00652313232421875, -0.0062961578369140625, -0.006069183349609375, -0.0058422088623046875, -0.005615234375, -0.0053882598876953125, -0.005161285400390625, -0.0049343109130859375, -0.00470733642578125, -0.0044803619384765625, -0.004253387451171875, -0.0040264129638671875, -0.0037994384765625, -0.0035724639892578125, -0.003345489501953125, -0.0031185150146484375, -0.00289154052734375, -0.0026645660400390625, -0.002437591552734375, -0.0022106170654296875, -0.001983642578125, -0.0017566680908203125, -0.001529693603515625, -0.0013027191162109375, -0.00107574462890625, -0.0008487701416015625, -0.000621795654296875, -0.0003948211669921875, -0.0001678466796875, 5.91278076171875e-05, 0.000286102294921875, 0.0005130767822265625, 0.00074005126953125, 0.0009670257568359375, 0.001194000244140625, 0.0014209747314453125, 0.00164794921875, 0.0018749237060546875, 0.002101898193359375, 0.0023288726806640625, 0.00255584716796875, 0.0027828216552734375, 0.003009796142578125, 0.0032367706298828125, 0.0034637451171875, 0.0036907196044921875, 0.003917694091796875, 0.0041446685791015625, 0.00437164306640625, 0.0045986175537109375, 0.004825592041015625, 0.0050525665283203125, 0.005279541015625, 0.0055065155029296875, 0.005733489990234375, 0.0059604644775390625, 0.00618743896484375, 0.0064144134521484375, 0.006641387939453125, 0.0068683624267578125, 0.0070953369140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 11.0, 3.0, 11.0, 18.0, 18.0, 26.0, 27.0, 38.0, 87.0, 127.0, 194.0, 477.0, 1186.0, 3441.0, 11264.0, 47371.0, 381196.0, 3462581.0, 237084.0, 35343.0, 8952.0, 2842.0, 987.0, 418.0, 210.0, 110.0, 68.0, 52.0, 37.0, 21.0, 18.0, 15.0, 14.0, 11.0, 5.0, 9.0, 2.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022857666015625, -0.021992206573486328, -0.021126747131347656, -0.020261287689208984, -0.019395828247070312, -0.01853036880493164, -0.01766490936279297, -0.016799449920654297, -0.015933990478515625, -0.015068531036376953, -0.014203071594238281, -0.01333761215209961, -0.012472152709960938, -0.011606693267822266, -0.010741233825683594, -0.009875774383544922, -0.00901031494140625, -0.008144855499267578, -0.007279396057128906, -0.006413936614990234, -0.0055484771728515625, -0.004683017730712891, -0.0038175582885742188, -0.002952098846435547, -0.002086639404296875, -0.0012211799621582031, -0.00035572052001953125, 0.0005097389221191406, 0.0013751983642578125, 0.0022406578063964844, 0.0031061172485351562, 0.003971576690673828, 0.0048370361328125, 0.005702495574951172, 0.006567955017089844, 0.007433414459228516, 0.008298873901367188, 0.00916433334350586, 0.010029792785644531, 0.010895252227783203, 0.011760711669921875, 0.012626171112060547, 0.013491630554199219, 0.01435708999633789, 0.015222549438476562, 0.016088008880615234, 0.016953468322753906, 0.017818927764892578, 0.01868438720703125, 0.019549846649169922, 0.020415306091308594, 0.021280765533447266, 0.022146224975585938, 0.02301168441772461, 0.02387714385986328, 0.024742603302001953, 0.025608062744140625, 0.026473522186279297, 0.02733898162841797, 0.02820444107055664, 0.029069900512695312, 0.029935359954833984, 0.030800819396972656, 0.03166627883911133, 0.03253173828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 5.0, 4.0, 9.0, 8.0, 6.0, 15.0, 20.0, 18.0, 24.0, 38.0, 29.0, 49.0, 54.0, 72.0, 97.0, 125.0, 215.0, 274.0, 481.0, 725.0, 608.0, 338.0, 227.0, 157.0, 121.0, 91.0, 53.0, 43.0, 46.0, 26.0, 17.0, 13.0, 11.0, 9.0, 15.0, 5.0, 8.0, 9.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0135345458984375, -0.013165712356567383, -0.012796878814697266, -0.012428045272827148, -0.012059211730957031, -0.011690378189086914, -0.011321544647216797, -0.01095271110534668, -0.010583877563476562, -0.010215044021606445, -0.009846210479736328, -0.009477376937866211, -0.009108543395996094, -0.008739709854125977, -0.00837087631225586, -0.008002042770385742, -0.007633209228515625, -0.007264375686645508, -0.006895542144775391, -0.0065267086029052734, -0.006157875061035156, -0.005789041519165039, -0.005420207977294922, -0.005051374435424805, -0.0046825408935546875, -0.00431370735168457, -0.003944873809814453, -0.003576040267944336, -0.0032072067260742188, -0.0028383731842041016, -0.0024695396423339844, -0.002100706100463867, -0.00173187255859375, -0.0013630390167236328, -0.0009942054748535156, -0.0006253719329833984, -0.00025653839111328125, 0.00011229515075683594, 0.0004811286926269531, 0.0008499622344970703, 0.0012187957763671875, 0.0015876293182373047, 0.001956462860107422, 0.002325296401977539, 0.0026941299438476562, 0.0030629634857177734, 0.0034317970275878906, 0.003800630569458008, 0.004169464111328125, 0.004538297653198242, 0.004907131195068359, 0.0052759647369384766, 0.005644798278808594, 0.006013631820678711, 0.006382465362548828, 0.006751298904418945, 0.0071201324462890625, 0.00748896598815918, 0.007857799530029297, 0.008226633071899414, 0.008595466613769531, 0.008964300155639648, 0.009333133697509766, 0.009701967239379883, 0.01007080078125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 12.0, 39.0, 190.0, 494.0, 205.0, 50.0, 15.0, 7.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.4218927025794983, -0.4143020510673523, -0.4067113995552063, -0.3991207480430603, -0.3915300667285919, -0.3839394152164459, -0.3763487637042999, -0.36875811219215393, -0.36116746068000793, -0.35357680916786194, -0.34598615765571594, -0.33839550614356995, -0.33080482482910156, -0.32321417331695557, -0.31562352180480957, -0.3080328702926636, -0.3004422187805176, -0.2928515672683716, -0.2852609157562256, -0.2776702642440796, -0.2700795829296112, -0.2624889314174652, -0.2548982799053192, -0.24730762839317322, -0.23971696197986603, -0.23212631046772003, -0.22453564405441284, -0.21694499254226685, -0.20935434103012085, -0.20176368951797485, -0.19417302310466766, -0.18658237159252167, -0.17899172008037567, -0.17140106856822968, -0.16381040215492249, -0.1562197506427765, -0.1486290991306305, -0.1410384476184845, -0.1334477812051773, -0.1258571296930313, -0.11826647818088531, -0.11067581921815872, -0.10308516770601273, -0.09549450874328613, -0.08790385723114014, -0.08031319826841354, -0.07272253930568695, -0.06513188779354095, -0.05754122883081436, -0.04995057359337807, -0.04235991835594177, -0.03476925939321518, -0.027178606018424034, -0.01958794891834259, -0.011997293680906296, -0.004406638443470001, 0.0031840167939662933, 0.010774672031402588, 0.018365327268838882, 0.025955984368920326, 0.03354664146900177, 0.041137296706438065, 0.04872795194387436, 0.056318607181310654, 0.06390926241874695]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 4.0, 6.0, 8.0, 15.0, 17.0, 15.0, 19.0, 18.0, 20.0, 41.0, 26.0, 37.0, 22.0, 38.0, 48.0, 46.0, 40.0, 40.0, 39.0, 44.0, 42.0, 41.0, 47.0, 37.0, 34.0, 27.0, 36.0, 23.0, 30.0, 25.0, 21.0, 18.0, 6.0, 14.0, 15.0, 10.0, 3.0, 9.0, 3.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.04379284381866455, -0.04251968115568161, -0.04124651849269867, -0.03997335210442543, -0.03870018944144249, -0.03742702677845955, -0.03615386039018631, -0.03488069772720337, -0.03360753506422043, -0.03233437240123749, -0.031061207875609398, -0.029788043349981308, -0.028514880686998367, -0.027241718024015427, -0.025968553498387337, -0.024695388972759247, -0.023422226309776306, -0.022149063646793365, -0.020875899121165276, -0.019602734595537186, -0.018329571932554245, -0.017056409269571304, -0.015783244743943214, -0.014510081149637699, -0.013236917555332184, -0.011963753961026669, -0.010690590366721153, -0.009417426772415638, -0.008144263178110123, -0.006871099583804607, -0.005597935989499092, -0.004324772395193577, -0.0030516088008880615, -0.0017784452065825462, -0.0005052816122770309, 0.0007678819820284843, 0.0020410455763339996, 0.003314209170639515, 0.00458737276494503, 0.0058605363592505455, 0.007133699953556061, 0.008406863547861576, 0.009680027142167091, 0.010953190736472607, 0.012226354330778122, 0.013499517925083637, 0.014772681519389153, 0.016045846045017242, 0.017319008708000183, 0.018592171370983124, 0.019865335896611214, 0.021138500422239304, 0.022411663085222244, 0.023684825748205185, 0.024957990273833275, 0.026231154799461365, 0.027504317462444305, 0.028777480125427246, 0.030050644651055336, 0.031323809176683426, 0.03259697183966637, 0.03387013450264931, 0.035143300890922546, 0.03641646355390549, 0.03768962621688843]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 5.0, 5.0, 6.0, 11.0, 13.0, 23.0, 40.0, 48.0, 61.0, 124.0, 224.0, 424.0, 759.0, 1577.0, 3392.0, 7676.0, 18960.0, 52325.0, 178315.0, 484708.0, 204363.0, 59119.0, 20794.0, 8415.0, 3676.0, 1676.0, 804.0, 434.0, 201.0, 146.0, 76.0, 61.0, 29.0, 20.0, 11.0, 8.0, 8.0, 11.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028228759765625, -0.027387380599975586, -0.026546001434326172, -0.025704622268676758, -0.024863243103027344, -0.02402186393737793, -0.023180484771728516, -0.0223391056060791, -0.021497726440429688, -0.020656347274780273, -0.01981496810913086, -0.018973588943481445, -0.01813220977783203, -0.017290830612182617, -0.016449451446533203, -0.015608072280883789, -0.014766693115234375, -0.013925313949584961, -0.013083934783935547, -0.012242555618286133, -0.011401176452636719, -0.010559797286987305, -0.00971841812133789, -0.008877038955688477, -0.008035659790039062, -0.0071942806243896484, -0.006352901458740234, -0.00551152229309082, -0.004670143127441406, -0.003828763961791992, -0.002987384796142578, -0.002146005630493164, -0.00130462646484375, -0.00046324729919433594, 0.0003781318664550781, 0.0012195110321044922, 0.0020608901977539062, 0.0029022693634033203, 0.0037436485290527344, 0.0045850276947021484, 0.0054264068603515625, 0.0062677860260009766, 0.007109165191650391, 0.007950544357299805, 0.008791923522949219, 0.009633302688598633, 0.010474681854248047, 0.011316061019897461, 0.012157440185546875, 0.012998819351196289, 0.013840198516845703, 0.014681577682495117, 0.015522956848144531, 0.016364336013793945, 0.01720571517944336, 0.018047094345092773, 0.018888473510742188, 0.0197298526763916, 0.020571231842041016, 0.02141261100769043, 0.022253990173339844, 0.023095369338989258, 0.023936748504638672, 0.024778127670288086, 0.0256195068359375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 7.0, 11.0, 15.0, 24.0, 29.0, 43.0, 43.0, 51.0, 60.0, 69.0, 87.0, 89.0, 75.0, 73.0, 68.0, 61.0, 46.0, 35.0, 29.0, 19.0, 28.0, 19.0, 7.0, 4.0, 7.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0066986083984375, -0.00644838809967041, -0.00619816780090332, -0.0059479475021362305, -0.005697727203369141, -0.005447506904602051, -0.005197286605834961, -0.004947066307067871, -0.004696846008300781, -0.004446625709533691, -0.0041964054107666016, -0.003946185111999512, -0.003695964813232422, -0.003445744514465332, -0.003195524215698242, -0.0029453039169311523, -0.0026950836181640625, -0.0024448633193969727, -0.002194643020629883, -0.001944422721862793, -0.0016942024230957031, -0.0014439821243286133, -0.0011937618255615234, -0.0009435415267944336, -0.0006933212280273438, -0.0004431009292602539, -0.00019288063049316406, 5.733966827392578e-05, 0.0003075599670410156, 0.0005577802658081055, 0.0008080005645751953, 0.0010582208633422852, 0.001308441162109375, 0.0015586614608764648, 0.0018088817596435547, 0.0020591020584106445, 0.0023093223571777344, 0.0025595426559448242, 0.002809762954711914, 0.003059983253479004, 0.0033102035522460938, 0.0035604238510131836, 0.0038106441497802734, 0.004060864448547363, 0.004311084747314453, 0.004561305046081543, 0.004811525344848633, 0.005061745643615723, 0.0053119659423828125, 0.005562186241149902, 0.005812406539916992, 0.006062626838684082, 0.006312847137451172, 0.006563067436218262, 0.0068132877349853516, 0.007063508033752441, 0.007313728332519531, 0.007563948631286621, 0.007814168930053711, 0.0080643892288208, 0.00831460952758789, 0.00856482982635498, 0.00881505012512207, 0.00906527042388916, 0.00931549072265625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 3.0, 7.0, 6.0, 3.0, 10.0, 22.0, 18.0, 18.0, 24.0, 48.0, 58.0, 69.0, 95.0, 156.0, 216.0, 333.0, 501.0, 953.0, 1736.0, 3867.0, 9535.0, 26732.0, 92526.0, 393541.0, 384068.0, 90183.0, 26314.0, 9390.0, 3865.0, 1735.0, 890.0, 547.0, 335.0, 231.0, 130.0, 116.0, 76.0, 55.0, 41.0, 28.0, 18.0, 13.0, 11.0, 12.0, 10.0, 6.0, 0.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0238037109375, -0.0230100154876709, -0.022216320037841797, -0.021422624588012695, -0.020628929138183594, -0.019835233688354492, -0.01904153823852539, -0.01824784278869629, -0.017454147338867188, -0.016660451889038086, -0.015866756439208984, -0.015073060989379883, -0.014279365539550781, -0.01348567008972168, -0.012691974639892578, -0.011898279190063477, -0.011104583740234375, -0.010310888290405273, -0.009517192840576172, -0.00872349739074707, -0.007929801940917969, -0.007136106491088867, -0.006342411041259766, -0.005548715591430664, -0.0047550201416015625, -0.003961324691772461, -0.0031676292419433594, -0.002373933792114258, -0.0015802383422851562, -0.0007865428924560547, 7.152557373046875e-06, 0.0008008480072021484, 0.00159454345703125, 0.0023882389068603516, 0.003181934356689453, 0.003975629806518555, 0.004769325256347656, 0.005563020706176758, 0.006356716156005859, 0.007150411605834961, 0.007944107055664062, 0.008737802505493164, 0.009531497955322266, 0.010325193405151367, 0.011118888854980469, 0.01191258430480957, 0.012706279754638672, 0.013499975204467773, 0.014293670654296875, 0.015087366104125977, 0.015881061553955078, 0.01667475700378418, 0.01746845245361328, 0.018262147903442383, 0.019055843353271484, 0.019849538803100586, 0.020643234252929688, 0.02143692970275879, 0.02223062515258789, 0.023024320602416992, 0.023818016052246094, 0.024611711502075195, 0.025405406951904297, 0.0261991024017334, 0.0269927978515625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 7.0, 6.0, 13.0, 7.0, 8.0, 11.0, 21.0, 13.0, 23.0, 29.0, 35.0, 33.0, 39.0, 43.0, 37.0, 38.0, 43.0, 56.0, 38.0, 45.0, 42.0, 29.0, 34.0, 39.0, 31.0, 39.0, 26.0, 33.0, 23.0, 31.0, 20.0, 14.0, 17.0, 14.0, 8.0, 11.0, 10.0, 9.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.01351165771484375, -0.013113975524902344, -0.012716293334960938, -0.012318611145019531, -0.011920928955078125, -0.011523246765136719, -0.011125564575195312, -0.010727882385253906, -0.0103302001953125, -0.009932518005371094, -0.009534835815429688, -0.009137153625488281, -0.008739471435546875, -0.008341789245605469, -0.007944107055664062, -0.007546424865722656, -0.00714874267578125, -0.006751060485839844, -0.0063533782958984375, -0.005955696105957031, -0.005558013916015625, -0.005160331726074219, -0.0047626495361328125, -0.004364967346191406, -0.00396728515625, -0.0035696029663085938, -0.0031719207763671875, -0.0027742385864257812, -0.002376556396484375, -0.0019788742065429688, -0.0015811920166015625, -0.0011835098266601562, -0.00078582763671875, -0.00038814544677734375, 9.5367431640625e-06, 0.00040721893310546875, 0.000804901123046875, 0.0012025833129882812, 0.0016002655029296875, 0.0019979476928710938, 0.0023956298828125, 0.0027933120727539062, 0.0031909942626953125, 0.0035886764526367188, 0.003986358642578125, 0.004384040832519531, 0.0047817230224609375, 0.005179405212402344, 0.00557708740234375, 0.005974769592285156, 0.0063724517822265625, 0.006770133972167969, 0.007167816162109375, 0.007565498352050781, 0.007963180541992188, 0.008360862731933594, 0.008758544921875, 0.009156227111816406, 0.009553909301757812, 0.009951591491699219, 0.010349273681640625, 0.010746955871582031, 0.011144638061523438, 0.011542320251464844, 0.01194000244140625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 8.0, 10.0, 8.0, 12.0, 16.0, 21.0, 44.0, 52.0, 82.0, 177.0, 348.0, 1061.0, 3620.0, 33794.0, 942203.0, 60302.0, 4707.0, 1212.0, 426.0, 183.0, 99.0, 49.0, 30.0, 25.0, 18.0, 10.0, 6.0, 5.0, 5.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.019561767578125, -0.018996000289916992, -0.018430233001708984, -0.017864465713500977, -0.01729869842529297, -0.01673293113708496, -0.016167163848876953, -0.015601396560668945, -0.015035629272460938, -0.01446986198425293, -0.013904094696044922, -0.013338327407836914, -0.012772560119628906, -0.012206792831420898, -0.01164102554321289, -0.011075258255004883, -0.010509490966796875, -0.009943723678588867, -0.00937795639038086, -0.008812189102172852, -0.008246421813964844, -0.007680654525756836, -0.007114887237548828, -0.00654911994934082, -0.0059833526611328125, -0.005417585372924805, -0.004851818084716797, -0.004286050796508789, -0.0037202835083007812, -0.0031545162200927734, -0.0025887489318847656, -0.002022981643676758, -0.00145721435546875, -0.0008914470672607422, -0.0003256797790527344, 0.00024008750915527344, 0.0008058547973632812, 0.001371622085571289, 0.0019373893737792969, 0.0025031566619873047, 0.0030689239501953125, 0.0036346912384033203, 0.004200458526611328, 0.004766225814819336, 0.005331993103027344, 0.0058977603912353516, 0.006463527679443359, 0.007029294967651367, 0.007595062255859375, 0.008160829544067383, 0.00872659683227539, 0.009292364120483398, 0.009858131408691406, 0.010423898696899414, 0.010989665985107422, 0.01155543327331543, 0.012121200561523438, 0.012686967849731445, 0.013252735137939453, 0.013818502426147461, 0.014384269714355469, 0.014950037002563477, 0.015515804290771484, 0.016081571578979492, 0.0166473388671875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 0.0, 3.0, 7.0, 2.0, 8.0, 16.0, 16.0, 26.0, 0.0, 35.0, 35.0, 33.0, 42.0, 46.0, 50.0, 50.0, 0.0, 57.0, 46.0, 57.0, 73.0, 51.0, 44.0, 53.0, 0.0, 42.0, 50.0, 31.0, 18.0, 23.0, 15.0, 17.0, 0.0, 12.0, 16.0, 7.0, 11.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.7881393432617188e-06, -1.735985279083252e-06, -1.6838312149047852e-06, -1.6316771507263184e-06, -1.5795230865478516e-06, -1.5273690223693848e-06, -1.475214958190918e-06, -1.4230608940124512e-06, -1.3709068298339844e-06, -1.3187527656555176e-06, -1.2665987014770508e-06, -1.214444637298584e-06, -1.1622905731201172e-06, -1.1101365089416504e-06, -1.0579824447631836e-06, -1.0058283805847168e-06, -9.5367431640625e-07, -9.015202522277832e-07, -8.493661880493164e-07, -7.972121238708496e-07, -7.450580596923828e-07, -6.92903995513916e-07, -6.407499313354492e-07, -5.885958671569824e-07, -5.364418029785156e-07, -4.842877388000488e-07, -4.3213367462158203e-07, -3.7997961044311523e-07, -3.2782554626464844e-07, -2.7567148208618164e-07, -2.2351741790771484e-07, -1.7136335372924805e-07, -1.1920928955078125e-07, -6.705522537231445e-08, -1.4901161193847656e-08, 3.725290298461914e-08, 8.940696716308594e-08, 1.4156103134155273e-07, 1.9371509552001953e-07, 2.4586915969848633e-07, 2.980232238769531e-07, 3.501772880554199e-07, 4.023313522338867e-07, 4.544854164123535e-07, 5.066394805908203e-07, 5.587935447692871e-07, 6.109476089477539e-07, 6.631016731262207e-07, 7.152557373046875e-07, 7.674098014831543e-07, 8.195638656616211e-07, 8.717179298400879e-07, 9.238719940185547e-07, 9.760260581970215e-07, 1.0281801223754883e-06, 1.080334186553955e-06, 1.1324882507324219e-06, 1.1846423149108887e-06, 1.2367963790893555e-06, 1.2889504432678223e-06, 1.341104507446289e-06, 1.3932585716247559e-06, 1.4454126358032227e-06, 1.4975666999816895e-06, 1.5497207641601562e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 6.0, 1.0, 3.0, 4.0, 12.0, 16.0, 34.0, 43.0, 95.0, 182.0, 407.0, 1148.0, 5116.0, 70817.0, 940901.0, 25157.0, 3140.0, 855.0, 291.0, 129.0, 94.0, 47.0, 28.0, 12.0, 11.0, 3.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024261474609375, -0.023534059524536133, -0.022806644439697266, -0.0220792293548584, -0.02135181427001953, -0.020624399185180664, -0.019896984100341797, -0.01916956901550293, -0.018442153930664062, -0.017714738845825195, -0.016987323760986328, -0.01625990867614746, -0.015532493591308594, -0.014805078506469727, -0.01407766342163086, -0.013350248336791992, -0.012622833251953125, -0.011895418167114258, -0.01116800308227539, -0.010440587997436523, -0.009713172912597656, -0.008985757827758789, -0.008258342742919922, -0.007530927658081055, -0.0068035125732421875, -0.00607609748840332, -0.005348682403564453, -0.004621267318725586, -0.0038938522338867188, -0.0031664371490478516, -0.0024390220642089844, -0.0017116069793701172, -0.00098419189453125, -0.0002567768096923828, 0.0004706382751464844, 0.0011980533599853516, 0.0019254684448242188, 0.002652883529663086, 0.003380298614501953, 0.00410771369934082, 0.0048351287841796875, 0.005562543869018555, 0.006289958953857422, 0.007017374038696289, 0.007744789123535156, 0.008472204208374023, 0.00919961929321289, 0.009927034378051758, 0.010654449462890625, 0.011381864547729492, 0.01210927963256836, 0.012836694717407227, 0.013564109802246094, 0.014291524887084961, 0.015018939971923828, 0.015746355056762695, 0.016473770141601562, 0.01720118522644043, 0.017928600311279297, 0.018656015396118164, 0.01938343048095703, 0.0201108455657959, 0.020838260650634766, 0.021565675735473633, 0.0222930908203125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 8.0, 4.0, 12.0, 18.0, 22.0, 41.0, 86.0, 155.0, 198.0, 176.0, 110.0, 70.0, 36.0, 24.0, 10.0, 9.0, 9.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005588531494140625, -0.005332052707672119, -0.005075573921203613, -0.004819095134735107, -0.0045626163482666016, -0.004306137561798096, -0.00404965877532959, -0.003793179988861084, -0.003536701202392578, -0.0032802224159240723, -0.0030237436294555664, -0.0027672648429870605, -0.0025107860565185547, -0.002254307270050049, -0.001997828483581543, -0.0017413496971130371, -0.0014848709106445312, -0.0012283921241760254, -0.0009719133377075195, -0.0007154345512390137, -0.0004589557647705078, -0.00020247697830200195, 5.4001808166503906e-05, 0.00031048059463500977, 0.0005669593811035156, 0.0008234381675720215, 0.0010799169540405273, 0.0013363957405090332, 0.001592874526977539, 0.001849353313446045, 0.0021058320999145508, 0.0023623108863830566, 0.0026187896728515625, 0.0028752684593200684, 0.0031317472457885742, 0.00338822603225708, 0.003644704818725586, 0.003901183605194092, 0.004157662391662598, 0.0044141411781311035, 0.004670619964599609, 0.004927098751068115, 0.005183577537536621, 0.005440056324005127, 0.005696535110473633, 0.005953013896942139, 0.0062094926834106445, 0.00646597146987915, 0.006722450256347656, 0.006978929042816162, 0.007235407829284668, 0.007491886615753174, 0.00774836540222168, 0.008004844188690186, 0.008261322975158691, 0.008517801761627197, 0.008774280548095703, 0.009030759334564209, 0.009287238121032715, 0.00954371690750122, 0.009800195693969727, 0.010056674480438232, 0.010313153266906738, 0.010569632053375244, 0.01082611083984375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 9.0, 21.0, 115.0, 412.0, 343.0, 77.0, 26.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.122086301445961, -0.11443466693162918, -0.10678303241729736, -0.09913139045238495, -0.09147975593805313, -0.08382812142372131, -0.0761764794588089, -0.06852484494447708, -0.060873210430145264, -0.053221575915813446, -0.04556993767619133, -0.037918299436569214, -0.030266664922237396, -0.02261503040790558, -0.014963392168283463, -0.0073117539286613464, 0.0003398805856704712, 0.007991516962647438, 0.015643153339624405, 0.023294789716601372, 0.03094642609357834, 0.038598060607910156, 0.04624969884753227, 0.05390133708715439, 0.061552971601486206, 0.06920460611581802, 0.07685624063014984, 0.08450788259506226, 0.09215951710939407, 0.09981115162372589, 0.1074627935886383, 0.11511442810297012, 0.12276607751846313, 0.13041771948337555, 0.13806934654712677, 0.14572098851203918, 0.1533726155757904, 0.16102425754070282, 0.16867589950561523, 0.17632752656936646, 0.18397916853427887, 0.19163081049919128, 0.1992824375629425, 0.20693407952785492, 0.21458572149276733, 0.22223734855651855, 0.22988899052143097, 0.23754063248634338, 0.2451922595500946, 0.2528438866138458, 0.26049554347991943, 0.26814717054367065, 0.2757987976074219, 0.2834504246711731, 0.2911020815372467, 0.2987537086009979, 0.30640536546707153, 0.31405699253082275, 0.32170864939689636, 0.3293602764606476, 0.3370119035243988, 0.3446635603904724, 0.35231518745422363, 0.35996681451797485, 0.3676184415817261]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 3.0, 7.0, 6.0, 10.0, 5.0, 7.0, 10.0, 7.0, 15.0, 14.0, 15.0, 21.0, 24.0, 28.0, 20.0, 21.0, 23.0, 41.0, 31.0, 40.0, 45.0, 39.0, 34.0, 36.0, 42.0, 43.0, 49.0, 34.0, 34.0, 26.0, 25.0, 24.0, 26.0, 30.0, 29.0, 22.0, 20.0, 24.0, 15.0, 10.0, 8.0, 8.0, 8.0, 8.0, 5.0, 5.0, 3.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.044526875019073486, -0.04321208596229553, -0.04189729690551758, -0.04058251157402992, -0.03926772251725197, -0.037952933460474014, -0.03663814812898636, -0.035323359072208405, -0.03400857001543045, -0.032693780958652496, -0.03137899190187454, -0.030064206570386887, -0.028749417513608932, -0.02743462845683098, -0.026119841262698174, -0.02480505406856537, -0.023490265011787415, -0.02217547595500946, -0.020860688760876656, -0.01954590156674385, -0.018231112509965897, -0.016916323453187943, -0.015601536259055138, -0.014286748133599758, -0.012971960008144379, -0.011657171882689, -0.01034238375723362, -0.00902759563177824, -0.007712807506322861, -0.006398019380867481, -0.005083231255412102, -0.0037684431299567223, -0.0024536550045013428, -0.0011388668790459633, 0.0001759212464094162, 0.0014907093718647957, 0.002805497497320175, 0.004120285622775555, 0.005435073748230934, 0.006749861873686314, 0.008064649999141693, 0.009379438124597073, 0.010694226250052452, 0.012009014375507832, 0.013323802500963211, 0.01463859062641859, 0.01595337875187397, 0.017268165946006775, 0.01858295500278473, 0.019897744059562683, 0.021212531253695488, 0.022527318447828293, 0.023842107504606247, 0.0251568965613842, 0.026471683755517006, 0.02778647094964981, 0.029101260006427765, 0.03041604906320572, 0.03173083811998367, 0.03304562345147133, 0.03436041250824928, 0.03567520156502724, 0.03698998689651489, 0.03830477595329285, 0.0396195650100708]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 10.0, 9.0, 17.0, 16.0, 30.0, 42.0, 68.0, 117.0, 207.0, 483.0, 1299.0, 4554.0, 23056.0, 391561.0, 3684457.0, 74214.0, 10439.0, 2338.0, 737.0, 265.0, 134.0, 71.0, 54.0, 46.0, 14.0, 15.0, 14.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031768798828125, -0.03075265884399414, -0.02973651885986328, -0.028720378875732422, -0.027704238891601562, -0.026688098907470703, -0.025671958923339844, -0.024655818939208984, -0.023639678955078125, -0.022623538970947266, -0.021607398986816406, -0.020591259002685547, -0.019575119018554688, -0.018558979034423828, -0.01754283905029297, -0.01652669906616211, -0.01551055908203125, -0.01449441909790039, -0.013478279113769531, -0.012462139129638672, -0.011445999145507812, -0.010429859161376953, -0.009413719177246094, -0.008397579193115234, -0.007381439208984375, -0.006365299224853516, -0.005349159240722656, -0.004333019256591797, -0.0033168792724609375, -0.002300739288330078, -0.0012845993041992188, -0.0002684593200683594, 0.0007476806640625, 0.0017638206481933594, 0.0027799606323242188, 0.003796100616455078, 0.0048122406005859375, 0.005828380584716797, 0.006844520568847656, 0.007860660552978516, 0.008876800537109375, 0.009892940521240234, 0.010909080505371094, 0.011925220489501953, 0.012941360473632812, 0.013957500457763672, 0.014973640441894531, 0.01598978042602539, 0.01700592041015625, 0.01802206039428711, 0.01903820037841797, 0.020054340362548828, 0.021070480346679688, 0.022086620330810547, 0.023102760314941406, 0.024118900299072266, 0.025135040283203125, 0.026151180267333984, 0.027167320251464844, 0.028183460235595703, 0.029199600219726562, 0.030215740203857422, 0.03123188018798828, 0.03224802017211914, 0.03326416015625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 12.0, 11.0, 14.0, 16.0, 30.0, 33.0, 40.0, 41.0, 67.0, 56.0, 62.0, 79.0, 80.0, 84.0, 64.0, 56.0, 60.0, 36.0, 37.0, 38.0, 26.0, 23.0, 17.0, 8.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0080413818359375, -0.007800698280334473, -0.007560014724731445, -0.007319331169128418, -0.007078647613525391, -0.006837964057922363, -0.006597280502319336, -0.006356596946716309, -0.006115913391113281, -0.005875229835510254, -0.0056345462799072266, -0.005393862724304199, -0.005153179168701172, -0.0049124956130981445, -0.004671812057495117, -0.00443112850189209, -0.0041904449462890625, -0.003949761390686035, -0.003709077835083008, -0.0034683942794799805, -0.003227710723876953, -0.0029870271682739258, -0.0027463436126708984, -0.002505660057067871, -0.0022649765014648438, -0.0020242929458618164, -0.001783609390258789, -0.0015429258346557617, -0.0013022422790527344, -0.001061558723449707, -0.0008208751678466797, -0.0005801916122436523, -0.000339508056640625, -9.882450103759766e-05, 0.0001418590545654297, 0.00038254261016845703, 0.0006232261657714844, 0.0008639097213745117, 0.001104593276977539, 0.0013452768325805664, 0.0015859603881835938, 0.001826643943786621, 0.0020673274993896484, 0.0023080110549926758, 0.002548694610595703, 0.0027893781661987305, 0.003030061721801758, 0.003270745277404785, 0.0035114288330078125, 0.00375211238861084, 0.003992795944213867, 0.0042334794998168945, 0.004474163055419922, 0.004714846611022949, 0.0049555301666259766, 0.005196213722229004, 0.005436897277832031, 0.005677580833435059, 0.005918264389038086, 0.006158947944641113, 0.006399631500244141, 0.006640315055847168, 0.006880998611450195, 0.007121682167053223, 0.00736236572265625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 9.0, 17.0, 41.0, 66.0, 147.0, 308.0, 891.0, 4739.0, 83471.0, 4000088.0, 97760.0, 5192.0, 945.0, 318.0, 141.0, 68.0, 40.0, 19.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06463623046875, -0.0629582405090332, -0.061280250549316406, -0.05960226058959961, -0.05792427062988281, -0.056246280670166016, -0.05456829071044922, -0.05289030075073242, -0.051212310791015625, -0.04953432083129883, -0.04785633087158203, -0.046178340911865234, -0.04450035095214844, -0.04282236099243164, -0.041144371032714844, -0.03946638107299805, -0.03778839111328125, -0.03611040115356445, -0.034432411193847656, -0.03275442123413086, -0.031076431274414062, -0.029398441314697266, -0.02772045135498047, -0.026042461395263672, -0.024364471435546875, -0.022686481475830078, -0.02100849151611328, -0.019330501556396484, -0.017652511596679688, -0.01597452163696289, -0.014296531677246094, -0.012618541717529297, -0.0109405517578125, -0.009262561798095703, -0.007584571838378906, -0.005906581878662109, -0.0042285919189453125, -0.0025506019592285156, -0.0008726119995117188, 0.0008053779602050781, 0.002483367919921875, 0.004161357879638672, 0.005839347839355469, 0.007517337799072266, 0.009195327758789062, 0.01087331771850586, 0.012551307678222656, 0.014229297637939453, 0.01590728759765625, 0.017585277557373047, 0.019263267517089844, 0.02094125747680664, 0.022619247436523438, 0.024297237396240234, 0.02597522735595703, 0.027653217315673828, 0.029331207275390625, 0.031009197235107422, 0.03268718719482422, 0.034365177154541016, 0.03604316711425781, 0.03772115707397461, 0.039399147033691406, 0.0410771369934082, 0.042755126953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 5.0, 10.0, 16.0, 14.0, 33.0, 34.0, 69.0, 68.0, 132.0, 190.0, 364.0, 870.0, 1088.0, 522.0, 222.0, 135.0, 92.0, 63.0, 44.0, 28.0, 28.0, 12.0, 15.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01403045654296875, -0.01349484920501709, -0.01295924186706543, -0.01242363452911377, -0.01188802719116211, -0.01135241985321045, -0.010816812515258789, -0.010281205177307129, -0.009745597839355469, -0.009209990501403809, -0.008674383163452148, -0.008138775825500488, -0.007603168487548828, -0.007067561149597168, -0.006531953811645508, -0.005996346473693848, -0.0054607391357421875, -0.004925131797790527, -0.004389524459838867, -0.003853917121887207, -0.003318309783935547, -0.0027827024459838867, -0.0022470951080322266, -0.0017114877700805664, -0.0011758804321289062, -0.0006402730941772461, -0.00010466575622558594, 0.0004309415817260742, 0.0009665489196777344, 0.0015021562576293945, 0.0020377635955810547, 0.002573370933532715, 0.003108978271484375, 0.003644585609436035, 0.004180192947387695, 0.0047158002853393555, 0.005251407623291016, 0.005787014961242676, 0.006322622299194336, 0.006858229637145996, 0.007393836975097656, 0.007929444313049316, 0.008465051651000977, 0.009000658988952637, 0.009536266326904297, 0.010071873664855957, 0.010607481002807617, 0.011143088340759277, 0.011678695678710938, 0.012214303016662598, 0.012749910354614258, 0.013285517692565918, 0.013821125030517578, 0.014356732368469238, 0.014892339706420898, 0.015427947044372559, 0.01596355438232422, 0.01649916172027588, 0.01703476905822754, 0.0175703763961792, 0.01810598373413086, 0.01864159107208252, 0.01917719841003418, 0.01971280574798584, 0.0202484130859375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 16.0, 20.0, 50.0, 115.0, 269.0, 284.0, 133.0, 56.0, 34.0, 9.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1501832902431488, -0.14634837210178375, -0.1425134688615799, -0.13867855072021484, -0.134843647480011, -0.13100872933864594, -0.12717381119728088, -0.12333890795707703, -0.11950398981571198, -0.11566907912492752, -0.11183416843414307, -0.10799925029277802, -0.10416433960199356, -0.1003294289112091, -0.09649451822042465, -0.0926596075296402, -0.08882469683885574, -0.08498978614807129, -0.08115487545728683, -0.07731996476650238, -0.07348504662513733, -0.06965013593435287, -0.06581522524356842, -0.061980314552783966, -0.05814540013670921, -0.05431048944592476, -0.050475575029850006, -0.04664066433906555, -0.0428057536482811, -0.038970839232206345, -0.03513592854142189, -0.03130101412534714, -0.027466103434562683, -0.02363119088113308, -0.019796278327703476, -0.01596136763691902, -0.012126455083489418, -0.008291542530059814, -0.00445663183927536, -0.0006217192858457565, 0.003213193267583847, 0.007048105355352163, 0.01088301744312048, 0.014717929065227509, 0.018552841618657112, 0.022387754172086716, 0.02622266486287117, 0.030057577416300774, 0.03389248996973038, 0.03772740066051483, 0.041562315076589584, 0.04539722576737404, 0.04923214018344879, 0.053067050874233246, 0.0569019615650177, 0.060736872255802155, 0.06457178294658661, 0.06840669363737106, 0.07224160432815552, 0.07607652246952057, 0.07991143316030502, 0.08374634385108948, 0.08758125454187393, 0.09141616523265839, 0.09525108337402344]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 7.0, 13.0, 13.0, 12.0, 14.0, 23.0, 35.0, 30.0, 33.0, 40.0, 51.0, 59.0, 59.0, 49.0, 56.0, 72.0, 48.0, 50.0, 57.0, 39.0, 47.0, 35.0, 29.0, 37.0, 24.0, 18.0, 12.0, 9.0, 6.0, 7.0, 6.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03745317459106445, -0.03603023663163185, -0.03460729867219925, -0.03318435698747635, -0.03176141902804375, -0.030338481068611145, -0.028915541246533394, -0.027492601424455643, -0.02606966346502304, -0.02464672550559044, -0.023223785683512688, -0.021800845861434937, -0.020377907902002335, -0.018954969942569733, -0.01753203012049198, -0.01610909029841423, -0.014686152338981628, -0.013263213448226452, -0.011840274557471275, -0.010417335666716099, -0.008994396775960922, -0.007571457885205746, -0.006148518994450569, -0.004725580103695393, -0.003302641212940216, -0.0018797023221850395, -0.000456763431429863, 0.0009661754593253136, 0.00238911435008049, 0.0038120532408356667, 0.005234992131590843, 0.00665793102234602, 0.008080869913101196, 0.009503808803856373, 0.01092674769461155, 0.012349686585366726, 0.013772625476121902, 0.015195564366877079, 0.016618503257632256, 0.018041443079710007, 0.01946438103914261, 0.02088731899857521, 0.02231025882065296, 0.023733198642730713, 0.025156136602163315, 0.026579074561595917, 0.028002014383673668, 0.02942495420575142, 0.03084789216518402, 0.03227083012461662, 0.033693768084049225, 0.035116709768772125, 0.03653964772820473, 0.03796258568763733, 0.03938552737236023, 0.04080846533179283, 0.04223140329122543, 0.043654341250658035, 0.04507727921009064, 0.04650022089481354, 0.04792315885424614, 0.04934609681367874, 0.05076903849840164, 0.052191976457834244, 0.053614914417266846]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [6.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 10.0, 10.0, 6.0, 15.0, 14.0, 26.0, 36.0, 37.0, 49.0, 74.0, 84.0, 106.0, 166.0, 216.0, 379.0, 676.0, 1216.0, 2255.0, 4576.0, 9447.0, 20223.0, 45822.0, 114453.0, 311733.0, 326546.0, 121059.0, 47886.0, 21195.0, 9897.0, 4803.0, 2306.0, 1229.0, 732.0, 394.0, 216.0, 173.0, 125.0, 78.0, 54.0, 44.0, 33.0, 32.0, 22.0, 24.0, 17.0, 17.0, 7.0, 12.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.01499176025390625, -0.014508605003356934, -0.014025449752807617, -0.0135422945022583, -0.013059139251708984, -0.012575984001159668, -0.012092828750610352, -0.011609673500061035, -0.011126518249511719, -0.010643362998962402, -0.010160207748413086, -0.00967705249786377, -0.009193897247314453, -0.008710741996765137, -0.00822758674621582, -0.007744431495666504, -0.0072612762451171875, -0.006778120994567871, -0.006294965744018555, -0.005811810493469238, -0.005328655242919922, -0.0048454999923706055, -0.004362344741821289, -0.0038791894912719727, -0.0033960342407226562, -0.00291287899017334, -0.0024297237396240234, -0.001946568489074707, -0.0014634132385253906, -0.0009802579879760742, -0.0004971027374267578, -1.3947486877441406e-05, 0.000469207763671875, 0.0009523630142211914, 0.0014355182647705078, 0.0019186735153198242, 0.0024018287658691406, 0.002884984016418457, 0.0033681392669677734, 0.00385129451751709, 0.004334449768066406, 0.004817605018615723, 0.005300760269165039, 0.0057839155197143555, 0.006267070770263672, 0.006750226020812988, 0.007233381271362305, 0.007716536521911621, 0.008199691772460938, 0.008682847023010254, 0.00916600227355957, 0.009649157524108887, 0.010132312774658203, 0.01061546802520752, 0.011098623275756836, 0.011581778526306152, 0.012064933776855469, 0.012548089027404785, 0.013031244277954102, 0.013514399528503418, 0.013997554779052734, 0.01448071002960205, 0.014963865280151367, 0.015447020530700684, 0.01593017578125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 15.0, 16.0, 17.0, 24.0, 46.0, 47.0, 55.0, 72.0, 79.0, 86.0, 83.0, 87.0, 78.0, 69.0, 70.0, 47.0, 37.0, 33.0, 16.0, 15.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007602691650390625, -0.007344424724578857, -0.00708615779876709, -0.006827890872955322, -0.006569623947143555, -0.006311357021331787, -0.0060530900955200195, -0.005794823169708252, -0.005536556243896484, -0.005278289318084717, -0.005020022392272949, -0.004761755466461182, -0.004503488540649414, -0.0042452216148376465, -0.003986954689025879, -0.0037286877632141113, -0.0034704208374023438, -0.003212153911590576, -0.0029538869857788086, -0.002695620059967041, -0.0024373531341552734, -0.002179086208343506, -0.0019208192825317383, -0.0016625523567199707, -0.0014042854309082031, -0.0011460185050964355, -0.000887751579284668, -0.0006294846534729004, -0.0003712177276611328, -0.00011295080184936523, 0.00014531612396240234, 0.0004035830497741699, 0.0006618499755859375, 0.0009201169013977051, 0.0011783838272094727, 0.0014366507530212402, 0.0016949176788330078, 0.0019531846046447754, 0.002211451530456543, 0.0024697184562683105, 0.002727985382080078, 0.0029862523078918457, 0.0032445192337036133, 0.003502786159515381, 0.0037610530853271484, 0.004019320011138916, 0.004277586936950684, 0.004535853862762451, 0.004794120788574219, 0.005052387714385986, 0.005310654640197754, 0.0055689215660095215, 0.005827188491821289, 0.006085455417633057, 0.006343722343444824, 0.006601989269256592, 0.006860256195068359, 0.007118523120880127, 0.0073767900466918945, 0.007635056972503662, 0.00789332389831543, 0.008151590824127197, 0.008409857749938965, 0.008668124675750732, 0.0089263916015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 8.0, 4.0, 9.0, 9.0, 4.0, 12.0, 13.0, 26.0, 21.0, 23.0, 44.0, 54.0, 76.0, 113.0, 157.0, 298.0, 417.0, 712.0, 1329.0, 2779.0, 5615.0, 12102.0, 27981.0, 67813.0, 187124.0, 408781.0, 204929.0, 72954.0, 29790.0, 13148.0, 5820.0, 2903.0, 1416.0, 785.0, 414.0, 277.0, 164.0, 98.0, 81.0, 54.0, 50.0, 35.0, 34.0, 22.0, 14.0, 15.0, 7.0, 7.0, 9.0, 6.0, 2.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.0161895751953125, -0.015720844268798828, -0.015252113342285156, -0.014783382415771484, -0.014314651489257812, -0.01384592056274414, -0.013377189636230469, -0.012908458709716797, -0.012439727783203125, -0.011970996856689453, -0.011502265930175781, -0.01103353500366211, -0.010564804077148438, -0.010096073150634766, -0.009627342224121094, -0.009158611297607422, -0.00868988037109375, -0.008221149444580078, -0.007752418518066406, -0.007283687591552734, -0.0068149566650390625, -0.006346225738525391, -0.005877494812011719, -0.005408763885498047, -0.004940032958984375, -0.004471302032470703, -0.004002571105957031, -0.0035338401794433594, -0.0030651092529296875, -0.0025963783264160156, -0.0021276473999023438, -0.0016589164733886719, -0.001190185546875, -0.0007214546203613281, -0.00025272369384765625, 0.00021600723266601562, 0.0006847381591796875, 0.0011534690856933594, 0.0016222000122070312, 0.002090930938720703, 0.002559661865234375, 0.003028392791748047, 0.0034971237182617188, 0.003965854644775391, 0.0044345855712890625, 0.004903316497802734, 0.005372047424316406, 0.005840778350830078, 0.00630950927734375, 0.006778240203857422, 0.007246971130371094, 0.007715702056884766, 0.008184432983398438, 0.00865316390991211, 0.009121894836425781, 0.009590625762939453, 0.010059356689453125, 0.010528087615966797, 0.010996818542480469, 0.01146554946899414, 0.011934280395507812, 0.012403011322021484, 0.012871742248535156, 0.013340473175048828, 0.0138092041015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 3.0, 0.0, 4.0, 3.0, 5.0, 5.0, 6.0, 12.0, 16.0, 14.0, 12.0, 21.0, 19.0, 19.0, 18.0, 27.0, 24.0, 26.0, 27.0, 37.0, 29.0, 31.0, 39.0, 38.0, 41.0, 39.0, 33.0, 43.0, 35.0, 39.0, 37.0, 30.0, 30.0, 27.0, 36.0, 24.0, 31.0, 26.0, 16.0, 20.0, 7.0, 8.0, 9.0, 11.0, 7.0, 4.0, 6.0, 4.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00942230224609375, -0.00909125804901123, -0.008760213851928711, -0.008429169654846191, -0.008098125457763672, -0.007767081260681152, -0.007436037063598633, -0.007104992866516113, -0.006773948669433594, -0.006442904472351074, -0.006111860275268555, -0.005780816078186035, -0.005449771881103516, -0.005118727684020996, -0.0047876834869384766, -0.004456639289855957, -0.0041255950927734375, -0.003794550895690918, -0.0034635066986083984, -0.003132462501525879, -0.0028014183044433594, -0.00247037410736084, -0.0021393299102783203, -0.0018082857131958008, -0.0014772415161132812, -0.0011461973190307617, -0.0008151531219482422, -0.00048410892486572266, -0.00015306472778320312, 0.0001779794692993164, 0.0005090236663818359, 0.0008400678634643555, 0.001171112060546875, 0.0015021562576293945, 0.001833200454711914, 0.0021642446517944336, 0.002495288848876953, 0.0028263330459594727, 0.003157377243041992, 0.0034884214401245117, 0.0038194656372070312, 0.004150509834289551, 0.00448155403137207, 0.00481259822845459, 0.005143642425537109, 0.005474686622619629, 0.0058057308197021484, 0.006136775016784668, 0.0064678192138671875, 0.006798863410949707, 0.0071299076080322266, 0.007460951805114746, 0.007791996002197266, 0.008123040199279785, 0.008454084396362305, 0.008785128593444824, 0.009116172790527344, 0.009447216987609863, 0.009778261184692383, 0.010109305381774902, 0.010440349578857422, 0.010771393775939941, 0.011102437973022461, 0.01143348217010498, 0.0117645263671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 0.0, 4.0, 6.0, 12.0, 17.0, 22.0, 28.0, 59.0, 84.0, 153.0, 306.0, 583.0, 1343.0, 3120.0, 9160.0, 34207.0, 220869.0, 632772.0, 113440.0, 21449.0, 6488.0, 2405.0, 965.0, 460.0, 236.0, 123.0, 61.0, 52.0, 24.0, 31.0, 23.0, 15.0, 8.0, 6.0, 9.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.007965087890625, -0.007745921611785889, -0.007526755332946777, -0.007307589054107666, -0.007088422775268555, -0.006869256496429443, -0.006650090217590332, -0.006430923938751221, -0.006211757659912109, -0.005992591381072998, -0.005773425102233887, -0.005554258823394775, -0.005335092544555664, -0.005115926265716553, -0.004896759986877441, -0.00467759370803833, -0.004458427429199219, -0.004239261150360107, -0.004020094871520996, -0.0038009285926818848, -0.0035817623138427734, -0.003362596035003662, -0.0031434297561645508, -0.0029242634773254395, -0.002705097198486328, -0.002485930919647217, -0.0022667646408081055, -0.002047598361968994, -0.0018284320831298828, -0.0016092658042907715, -0.0013900995254516602, -0.0011709332466125488, -0.0009517669677734375, -0.0007326006889343262, -0.0005134344100952148, -0.0002942681312561035, -7.510185241699219e-05, 0.00014406442642211914, 0.00036323070526123047, 0.0005823969841003418, 0.0008015632629394531, 0.0010207295417785645, 0.0012398958206176758, 0.0014590620994567871, 0.0016782283782958984, 0.0018973946571350098, 0.002116560935974121, 0.0023357272148132324, 0.0025548934936523438, 0.002774059772491455, 0.0029932260513305664, 0.0032123923301696777, 0.003431558609008789, 0.0036507248878479004, 0.0038698911666870117, 0.004089057445526123, 0.004308223724365234, 0.004527390003204346, 0.004746556282043457, 0.004965722560882568, 0.00518488883972168, 0.005404055118560791, 0.005623221397399902, 0.005842387676239014, 0.006061553955078125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 6.0, 8.0, 10.0, 13.0, 13.0, 31.0, 28.0, 36.0, 38.0, 39.0, 62.0, 56.0, 45.0, 48.0, 61.0, 66.0, 110.0, 61.0, 47.0, 34.0, 44.0, 33.0, 24.0, 19.0, 16.0, 9.0, 9.0, 5.0, 3.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8477439880371094e-06, -1.7862766981124878e-06, -1.7248094081878662e-06, -1.6633421182632446e-06, -1.601874828338623e-06, -1.5404075384140015e-06, -1.4789402484893799e-06, -1.4174729585647583e-06, -1.3560056686401367e-06, -1.2945383787155151e-06, -1.2330710887908936e-06, -1.171603798866272e-06, -1.1101365089416504e-06, -1.0486692190170288e-06, -9.872019290924072e-07, -9.257346391677856e-07, -8.642673492431641e-07, -8.028000593185425e-07, -7.413327693939209e-07, -6.798654794692993e-07, -6.183981895446777e-07, -5.569308996200562e-07, -4.954636096954346e-07, -4.33996319770813e-07, -3.725290298461914e-07, -3.110617399215698e-07, -2.4959444999694824e-07, -1.8812716007232666e-07, -1.2665987014770508e-07, -6.51925802230835e-08, -3.725290298461914e-09, 5.774199962615967e-08, 1.1920928955078125e-07, 1.8067657947540283e-07, 2.421438694000244e-07, 3.03611159324646e-07, 3.650784492492676e-07, 4.2654573917388916e-07, 4.880130290985107e-07, 5.494803190231323e-07, 6.109476089477539e-07, 6.724148988723755e-07, 7.338821887969971e-07, 7.953494787216187e-07, 8.568167686462402e-07, 9.182840585708618e-07, 9.797513484954834e-07, 1.041218638420105e-06, 1.1026859283447266e-06, 1.1641532182693481e-06, 1.2256205081939697e-06, 1.2870877981185913e-06, 1.3485550880432129e-06, 1.4100223779678345e-06, 1.471489667892456e-06, 1.5329569578170776e-06, 1.5944242477416992e-06, 1.6558915376663208e-06, 1.7173588275909424e-06, 1.778826117515564e-06, 1.8402934074401855e-06, 1.9017606973648071e-06, 1.9632279872894287e-06, 2.0246952772140503e-06, 2.086162567138672e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 9.0, 22.0, 21.0, 32.0, 61.0, 69.0, 134.0, 228.0, 412.0, 760.0, 1579.0, 3876.0, 12547.0, 63221.0, 618163.0, 300099.0, 33881.0, 8123.0, 2721.0, 1135.0, 602.0, 332.0, 205.0, 117.0, 77.0, 33.0, 29.0, 16.0, 10.0, 13.0, 5.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00989532470703125, -0.009584426879882812, -0.009273529052734375, -0.008962631225585938, -0.0086517333984375, -0.008340835571289062, -0.008029937744140625, -0.0077190399169921875, -0.00740814208984375, -0.0070972442626953125, -0.006786346435546875, -0.0064754486083984375, -0.00616455078125, -0.0058536529541015625, -0.005542755126953125, -0.0052318572998046875, -0.00492095947265625, -0.0046100616455078125, -0.004299163818359375, -0.0039882659912109375, -0.0036773681640625, -0.0033664703369140625, -0.003055572509765625, -0.0027446746826171875, -0.00243377685546875, -0.0021228790283203125, -0.001811981201171875, -0.0015010833740234375, -0.001190185546875, -0.0008792877197265625, -0.000568389892578125, -0.0002574920654296875, 5.340576171875e-05, 0.0003643035888671875, 0.000675201416015625, 0.0009860992431640625, 0.0012969970703125, 0.0016078948974609375, 0.001918792724609375, 0.0022296905517578125, 0.00254058837890625, 0.0028514862060546875, 0.003162384033203125, 0.0034732818603515625, 0.0037841796875, 0.0040950775146484375, 0.004405975341796875, 0.0047168731689453125, 0.00502777099609375, 0.0053386688232421875, 0.005649566650390625, 0.0059604644775390625, 0.0062713623046875, 0.0065822601318359375, 0.006893157958984375, 0.0072040557861328125, 0.00751495361328125, 0.007825851440429688, 0.008136749267578125, 0.008447647094726562, 0.008758544921875, 0.009069442749023438, 0.009380340576171875, 0.009691238403320312, 0.01000213623046875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 14.0, 8.0, 10.0, 23.0, 25.0, 55.0, 64.0, 99.0, 140.0, 155.0, 110.0, 99.0, 69.0, 36.0, 36.0, 10.0, 20.0, 8.0, 6.0, 4.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0070648193359375, -0.006839931011199951, -0.006615042686462402, -0.0063901543617248535, -0.006165266036987305, -0.005940377712249756, -0.005715489387512207, -0.005490601062774658, -0.005265712738037109, -0.0050408244132995605, -0.004815936088562012, -0.004591047763824463, -0.004366159439086914, -0.004141271114349365, -0.003916382789611816, -0.0036914944648742676, -0.0034666061401367188, -0.00324171781539917, -0.003016829490661621, -0.0027919411659240723, -0.0025670528411865234, -0.0023421645164489746, -0.0021172761917114258, -0.001892387866973877, -0.0016674995422363281, -0.0014426112174987793, -0.0012177228927612305, -0.0009928345680236816, -0.0007679462432861328, -0.000543057918548584, -0.00031816959381103516, -9.328126907348633e-05, 0.0001316070556640625, 0.00035649538040161133, 0.0005813837051391602, 0.000806272029876709, 0.0010311603546142578, 0.0012560486793518066, 0.0014809370040893555, 0.0017058253288269043, 0.0019307136535644531, 0.002155601978302002, 0.0023804903030395508, 0.0026053786277770996, 0.0028302669525146484, 0.0030551552772521973, 0.003280043601989746, 0.003504931926727295, 0.0037298202514648438, 0.003954708576202393, 0.004179596900939941, 0.00440448522567749, 0.004629373550415039, 0.004854261875152588, 0.005079150199890137, 0.0053040385246276855, 0.005528926849365234, 0.005753815174102783, 0.005978703498840332, 0.006203591823577881, 0.00642848014831543, 0.0066533684730529785, 0.006878256797790527, 0.007103145122528076, 0.007328033447265625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 52.0, 437.0, 463.0, 45.0, 8.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5087988972663879, -0.498422771692276, -0.48804667592048645, -0.4776705503463745, -0.46729445457458496, -0.456918329000473, -0.4465422034263611, -0.43616610765457153, -0.4257899820804596, -0.41541385650634766, -0.4050377607345581, -0.39466163516044617, -0.3842855393886566, -0.3739094138145447, -0.3635333180427551, -0.3531571924686432, -0.34278106689453125, -0.3324049413204193, -0.32202884554862976, -0.3116527199745178, -0.30127662420272827, -0.29090049862861633, -0.2805243730545044, -0.27014827728271484, -0.2597721815109253, -0.24939607083797455, -0.2390199601650238, -0.22864383459091187, -0.21826772391796112, -0.20789161324501038, -0.19751550257205963, -0.1871393918991089, -0.17676326632499695, -0.1663871556520462, -0.15601104497909546, -0.14563491940498352, -0.13525880873203278, -0.12488269805908203, -0.11450658738613129, -0.10413046926259995, -0.0937543585896492, -0.08337824791669846, -0.07300212979316711, -0.06262601912021637, -0.05224990472197533, -0.04187379032373428, -0.03149767965078354, -0.021121561527252197, -0.010745450854301453, -0.00036933738738298416, 0.010006776079535484, 0.020382888615131378, 0.03075900301337242, 0.041135117411613464, 0.05151122808456421, 0.06188734620809555, 0.0722634568810463, 0.08263956755399704, 0.09301568567752838, 0.10339179635047913, 0.11376790702342987, 0.12414402514696121, 0.13452014327049255, 0.1448962539434433, 0.15527236461639404]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 15.0, 9.0, 12.0, 11.0, 11.0, 27.0, 32.0, 35.0, 37.0, 44.0, 56.0, 67.0, 69.0, 53.0, 46.0, 50.0, 68.0, 47.0, 47.0, 57.0, 35.0, 35.0, 27.0, 33.0, 23.0, 13.0, 12.0, 8.0, 7.0, 3.0, 3.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0491107702255249, -0.04739895462989807, -0.04568713530898094, -0.04397531598806381, -0.04226350039243698, -0.04055168479681015, -0.03883986547589302, -0.03712804615497589, -0.03541623055934906, -0.03370441496372223, -0.0319925956428051, -0.03028077818453312, -0.02856896072626114, -0.02685714326798916, -0.02514532580971718, -0.023433508351445198, -0.021721690893173218, -0.020009873434901237, -0.018298055976629257, -0.016586238518357277, -0.014874421060085297, -0.013162603601813316, -0.011450786143541336, -0.009738968685269356, -0.008027151226997375, -0.006315333768725395, -0.004603516310453415, -0.0028916988521814346, -0.0011798813939094543, 0.0005319360643625259, 0.0022437535226345062, 0.0039555709809064865, 0.005667388439178467, 0.007379205897450447, 0.009091023355722427, 0.010802840813994408, 0.012514658272266388, 0.014226475730538368, 0.01593829318881035, 0.01765011064708233, 0.01936192810535431, 0.02107374556362629, 0.02278556302189827, 0.02449738048017025, 0.02620919793844223, 0.02792101539671421, 0.02963283285498619, 0.03134465217590332, 0.03305646777153015, 0.03476828336715698, 0.03648010268807411, 0.03819192200899124, 0.03990373760461807, 0.041615553200244904, 0.04332737252116203, 0.04503919184207916, 0.046751007437705994, 0.048462823033332825, 0.050174642354249954, 0.051886461675167084, 0.053598277270793915, 0.055310092866420746, 0.057021912187337875, 0.058733731508255005, 0.060445547103881836]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 5.0, 3.0, 14.0, 18.0, 22.0, 40.0, 67.0, 94.0, 176.0, 291.0, 690.0, 1688.0, 5250.0, 22088.0, 211442.0, 3821694.0, 109224.0, 15567.0, 3601.0, 1225.0, 484.0, 232.0, 165.0, 80.0, 40.0, 26.0, 27.0, 14.0, 9.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0299072265625, -0.029062271118164062, -0.028217315673828125, -0.027372360229492188, -0.02652740478515625, -0.025682449340820312, -0.024837493896484375, -0.023992538452148438, -0.0231475830078125, -0.022302627563476562, -0.021457672119140625, -0.020612716674804688, -0.01976776123046875, -0.018922805786132812, -0.018077850341796875, -0.017232894897460938, -0.016387939453125, -0.015542984008789062, -0.014698028564453125, -0.013853073120117188, -0.01300811767578125, -0.012163162231445312, -0.011318206787109375, -0.010473251342773438, -0.0096282958984375, -0.008783340454101562, -0.007938385009765625, -0.0070934295654296875, -0.00624847412109375, -0.0054035186767578125, -0.004558563232421875, -0.0037136077880859375, -0.00286865234375, -0.0020236968994140625, -0.001178741455078125, -0.0003337860107421875, 0.00051116943359375, 0.0013561248779296875, 0.002201080322265625, 0.0030460357666015625, 0.0038909912109375, 0.0047359466552734375, 0.005580902099609375, 0.0064258575439453125, 0.00727081298828125, 0.008115768432617188, 0.008960723876953125, 0.009805679321289062, 0.010650634765625, 0.011495590209960938, 0.012340545654296875, 0.013185501098632812, 0.01403045654296875, 0.014875411987304688, 0.015720367431640625, 0.016565322875976562, 0.0174102783203125, 0.018255233764648438, 0.019100189208984375, 0.019945144653320312, 0.02079010009765625, 0.021635055541992188, 0.022480010986328125, 0.023324966430664062, 0.024169921875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 8.0, 12.0, 18.0, 27.0, 28.0, 31.0, 38.0, 67.0, 59.0, 78.0, 69.0, 81.0, 91.0, 72.0, 66.0, 61.0, 59.0, 42.0, 25.0, 27.0, 14.0, 13.0, 11.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007904052734375, -0.007662057876586914, -0.007420063018798828, -0.007178068161010742, -0.006936073303222656, -0.00669407844543457, -0.006452083587646484, -0.0062100887298583984, -0.0059680938720703125, -0.0057260990142822266, -0.005484104156494141, -0.005242109298706055, -0.005000114440917969, -0.004758119583129883, -0.004516124725341797, -0.004274129867553711, -0.004032135009765625, -0.003790140151977539, -0.003548145294189453, -0.003306150436401367, -0.0030641555786132812, -0.0028221607208251953, -0.0025801658630371094, -0.0023381710052490234, -0.0020961761474609375, -0.0018541812896728516, -0.0016121864318847656, -0.0013701915740966797, -0.0011281967163085938, -0.0008862018585205078, -0.0006442070007324219, -0.00040221214294433594, -0.00016021728515625, 8.177757263183594e-05, 0.0003237724304199219, 0.0005657672882080078, 0.0008077621459960938, 0.0010497570037841797, 0.0012917518615722656, 0.0015337467193603516, 0.0017757415771484375, 0.0020177364349365234, 0.0022597312927246094, 0.0025017261505126953, 0.0027437210083007812, 0.002985715866088867, 0.003227710723876953, 0.003469705581665039, 0.003711700439453125, 0.003953695297241211, 0.004195690155029297, 0.004437685012817383, 0.004679679870605469, 0.004921674728393555, 0.005163669586181641, 0.0054056644439697266, 0.0056476593017578125, 0.0058896541595458984, 0.006131649017333984, 0.00637364387512207, 0.006615638732910156, 0.006857633590698242, 0.007099628448486328, 0.007341623306274414, 0.0075836181640625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 12.0, 21.0, 22.0, 25.0, 50.0, 71.0, 118.0, 227.0, 530.0, 1854.0, 10407.0, 141899.0, 3918529.0, 108626.0, 9175.0, 1603.0, 524.0, 210.0, 130.0, 81.0, 53.0, 43.0, 17.0, 17.0, 12.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03717041015625, -0.03609180450439453, -0.03501319885253906, -0.033934593200683594, -0.032855987548828125, -0.031777381896972656, -0.030698776245117188, -0.02962017059326172, -0.02854156494140625, -0.02746295928955078, -0.026384353637695312, -0.025305747985839844, -0.024227142333984375, -0.023148536682128906, -0.022069931030273438, -0.02099132537841797, -0.0199127197265625, -0.01883411407470703, -0.017755508422851562, -0.016676902770996094, -0.015598297119140625, -0.014519691467285156, -0.013441085815429688, -0.012362480163574219, -0.01128387451171875, -0.010205268859863281, -0.009126663208007812, -0.008048057556152344, -0.006969451904296875, -0.005890846252441406, -0.0048122406005859375, -0.0037336349487304688, -0.002655029296875, -0.0015764236450195312, -0.0004978179931640625, 0.0005807876586914062, 0.001659393310546875, 0.0027379989624023438, 0.0038166046142578125, 0.004895210266113281, 0.00597381591796875, 0.007052421569824219, 0.008131027221679688, 0.009209632873535156, 0.010288238525390625, 0.011366844177246094, 0.012445449829101562, 0.013524055480957031, 0.0146026611328125, 0.01568126678466797, 0.016759872436523438, 0.017838478088378906, 0.018917083740234375, 0.019995689392089844, 0.021074295043945312, 0.02215290069580078, 0.02323150634765625, 0.02431011199951172, 0.025388717651367188, 0.026467323303222656, 0.027545928955078125, 0.028624534606933594, 0.029703140258789062, 0.03078174591064453, 0.0318603515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 3.0, 6.0, 14.0, 16.0, 15.0, 29.0, 30.0, 45.0, 70.0, 89.0, 131.0, 210.0, 517.0, 1094.0, 900.0, 375.0, 174.0, 96.0, 63.0, 52.0, 34.0, 29.0, 18.0, 22.0, 7.0, 12.0, 6.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01049041748046875, -0.010084152221679688, -0.009677886962890625, -0.009271621704101562, -0.0088653564453125, -0.008459091186523438, -0.008052825927734375, -0.0076465606689453125, -0.00724029541015625, -0.0068340301513671875, -0.006427764892578125, -0.0060214996337890625, -0.005615234375, -0.0052089691162109375, -0.004802703857421875, -0.0043964385986328125, -0.00399017333984375, -0.0035839080810546875, -0.003177642822265625, -0.0027713775634765625, -0.0023651123046875, -0.0019588470458984375, -0.001552581787109375, -0.0011463165283203125, -0.00074005126953125, -0.0003337860107421875, 7.2479248046875e-05, 0.0004787445068359375, 0.000885009765625, 0.0012912750244140625, 0.001697540283203125, 0.0021038055419921875, 0.00251007080078125, 0.0029163360595703125, 0.003322601318359375, 0.0037288665771484375, 0.0041351318359375, 0.0045413970947265625, 0.004947662353515625, 0.0053539276123046875, 0.00576019287109375, 0.0061664581298828125, 0.006572723388671875, 0.0069789886474609375, 0.00738525390625, 0.0077915191650390625, 0.008197784423828125, 0.008604049682617188, 0.00901031494140625, 0.009416580200195312, 0.009822845458984375, 0.010229110717773438, 0.0106353759765625, 0.011041641235351562, 0.011447906494140625, 0.011854171752929688, 0.01226043701171875, 0.012666702270507812, 0.013072967529296875, 0.013479232788085938, 0.013885498046875, 0.014291763305664062, 0.014698028564453125, 0.015104293823242188, 0.01551055908203125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 12.0, 48.0, 149.0, 287.0, 275.0, 110.0, 55.0, 28.0, 13.0, 9.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09855466336011887, -0.09514329582452774, -0.09173192083835602, -0.08832055330276489, -0.08490918576717377, -0.08149781823158264, -0.07808645069599152, -0.0746750757098198, -0.07126370817422867, -0.06785234063863754, -0.06444096565246582, -0.061029598116874695, -0.05761823058128357, -0.054206863045692444, -0.05079549178481102, -0.047384120523929596, -0.04397275298833847, -0.040561385452747345, -0.03715001419186592, -0.0337386429309845, -0.03032727539539337, -0.026915905997157097, -0.023504536598920822, -0.020093167200684547, -0.016681797802448273, -0.013270428404211998, -0.009859059005975723, -0.0064476896077394485, -0.003036320209503174, 0.0003750491887331009, 0.0037864185869693756, 0.00719778798520565, 0.010609157383441925, 0.0140205267816782, 0.017431896179914474, 0.02084326557815075, 0.024254634976387024, 0.0276660043746233, 0.031077373772859573, 0.034488745033741, 0.03790011256933212, 0.04131148010492325, 0.04472285136580467, 0.048134222626686096, 0.05154559016227722, 0.05495695769786835, 0.05836832895874977, 0.061779700219631195, 0.06519106775522232, 0.06860243529081345, 0.07201381027698517, 0.0754251778125763, 0.07883654534816742, 0.08224791288375854, 0.08565928041934967, 0.08907065540552139, 0.09248202294111252, 0.09589339047670364, 0.09930476546287537, 0.10271613299846649, 0.10612750053405762, 0.10953886806964874, 0.11295023560523987, 0.11636161059141159, 0.11977297812700272]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 6.0, 8.0, 6.0, 12.0, 5.0, 16.0, 21.0, 18.0, 19.0, 24.0, 36.0, 31.0, 35.0, 40.0, 45.0, 38.0, 42.0, 54.0, 44.0, 40.0, 52.0, 50.0, 48.0, 40.0, 32.0, 44.0, 30.0, 31.0, 25.0, 18.0, 23.0, 15.0, 10.0, 6.0, 9.0, 4.0, 7.0, 2.0, 4.0, 2.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.027832746505737305, -0.02683647722005844, -0.025840207934379578, -0.024843938648700714, -0.02384766936302185, -0.022851400077342987, -0.021855130791664124, -0.02085886150598526, -0.019862592220306396, -0.018866322934627533, -0.01787005364894867, -0.016873784363269806, -0.015877515077590942, -0.014881245791912079, -0.013884976506233215, -0.012888707220554352, -0.011892437934875488, -0.010896168649196625, -0.009899899363517761, -0.008903630077838898, -0.007907360792160034, -0.006911091506481171, -0.005914822220802307, -0.004918552935123444, -0.00392228364944458, -0.0029260143637657166, -0.001929745078086853, -0.0009334757924079895, 6.279349327087402e-05, 0.0010590627789497375, 0.002055332064628601, 0.0030516013503074646, 0.004047870635986328, 0.005044139921665192, 0.006040409207344055, 0.007036678493022919, 0.008032947778701782, 0.009029217064380646, 0.01002548635005951, 0.011021755635738373, 0.012018024921417236, 0.0130142942070961, 0.014010563492774963, 0.015006832778453827, 0.01600310206413269, 0.016999371349811554, 0.017995640635490417, 0.01899190992116928, 0.019988179206848145, 0.020984448492527008, 0.02198071777820587, 0.022976987063884735, 0.0239732563495636, 0.024969525635242462, 0.025965794920921326, 0.02696206420660019, 0.027958333492279053, 0.028954602777957916, 0.02995087206363678, 0.030947141349315643, 0.03194341063499451, 0.03293967992067337, 0.033935949206352234, 0.0349322184920311, 0.03592848777770996]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 11.0, 14.0, 22.0, 35.0, 56.0, 70.0, 112.0, 205.0, 391.0, 739.0, 2024.0, 6273.0, 24193.0, 118649.0, 569674.0, 262367.0, 47182.0, 11059.0, 3178.0, 1133.0, 489.0, 241.0, 147.0, 104.0, 57.0, 33.0, 33.0, 17.0, 8.0, 13.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0267791748046875, -0.02584671974182129, -0.024914264678955078, -0.023981809616088867, -0.023049354553222656, -0.022116899490356445, -0.021184444427490234, -0.020251989364624023, -0.019319534301757812, -0.0183870792388916, -0.01745462417602539, -0.01652216911315918, -0.015589714050292969, -0.014657258987426758, -0.013724803924560547, -0.012792348861694336, -0.011859893798828125, -0.010927438735961914, -0.009994983673095703, -0.009062528610229492, -0.008130073547363281, -0.00719761848449707, -0.006265163421630859, -0.0053327083587646484, -0.0044002532958984375, -0.0034677982330322266, -0.0025353431701660156, -0.0016028881072998047, -0.0006704330444335938, 0.0002620220184326172, 0.0011944770812988281, 0.002126932144165039, 0.00305938720703125, 0.003991842269897461, 0.004924297332763672, 0.005856752395629883, 0.006789207458496094, 0.007721662521362305, 0.008654117584228516, 0.009586572647094727, 0.010519027709960938, 0.011451482772827148, 0.01238393783569336, 0.01331639289855957, 0.014248847961425781, 0.015181303024291992, 0.016113758087158203, 0.017046213150024414, 0.017978668212890625, 0.018911123275756836, 0.019843578338623047, 0.020776033401489258, 0.02170848846435547, 0.02264094352722168, 0.02357339859008789, 0.0245058536529541, 0.025438308715820312, 0.026370763778686523, 0.027303218841552734, 0.028235673904418945, 0.029168128967285156, 0.030100584030151367, 0.031033039093017578, 0.03196549415588379, 0.03289794921875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 9.0, 22.0, 21.0, 25.0, 41.0, 40.0, 69.0, 68.0, 70.0, 93.0, 79.0, 80.0, 71.0, 70.0, 65.0, 38.0, 52.0, 30.0, 26.0, 13.0, 10.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007198333740234375, -0.006962597370147705, -0.006726861000061035, -0.006491124629974365, -0.006255388259887695, -0.006019651889801025, -0.0057839155197143555, -0.0055481791496276855, -0.005312442779541016, -0.005076706409454346, -0.004840970039367676, -0.004605233669281006, -0.004369497299194336, -0.004133760929107666, -0.003898024559020996, -0.003662288188934326, -0.0034265518188476562, -0.0031908154487609863, -0.0029550790786743164, -0.0027193427085876465, -0.0024836063385009766, -0.0022478699684143066, -0.0020121335983276367, -0.0017763972282409668, -0.0015406608581542969, -0.001304924488067627, -0.001069188117980957, -0.0008334517478942871, -0.0005977153778076172, -0.00036197900772094727, -0.00012624263763427734, 0.00010949373245239258, 0.0003452301025390625, 0.0005809664726257324, 0.0008167028427124023, 0.0010524392127990723, 0.0012881755828857422, 0.0015239119529724121, 0.001759648323059082, 0.001995384693145752, 0.002231121063232422, 0.002466857433319092, 0.0027025938034057617, 0.0029383301734924316, 0.0031740665435791016, 0.0034098029136657715, 0.0036455392837524414, 0.0038812756538391113, 0.004117012023925781, 0.004352748394012451, 0.004588484764099121, 0.004824221134185791, 0.005059957504272461, 0.005295693874359131, 0.005531430244445801, 0.005767166614532471, 0.006002902984619141, 0.0062386393547058105, 0.0064743757247924805, 0.00671011209487915, 0.00694584846496582, 0.00718158483505249, 0.00741732120513916, 0.00765305757522583, 0.0078887939453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 7.0, 11.0, 11.0, 19.0, 16.0, 31.0, 39.0, 54.0, 66.0, 109.0, 166.0, 284.0, 454.0, 775.0, 1501.0, 3258.0, 9076.0, 28911.0, 114708.0, 514264.0, 286666.0, 60337.0, 16953.0, 5641.0, 2363.0, 1143.0, 601.0, 334.0, 233.0, 163.0, 99.0, 71.0, 48.0, 43.0, 27.0, 20.0, 13.0, 15.0, 7.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02099609375, -0.02033543586730957, -0.01967477798461914, -0.01901412010192871, -0.01835346221923828, -0.01769280433654785, -0.017032146453857422, -0.016371488571166992, -0.015710830688476562, -0.015050172805786133, -0.014389514923095703, -0.013728857040405273, -0.013068199157714844, -0.012407541275024414, -0.011746883392333984, -0.011086225509643555, -0.010425567626953125, -0.009764909744262695, -0.009104251861572266, -0.008443593978881836, -0.007782936096191406, -0.0071222782135009766, -0.006461620330810547, -0.005800962448120117, -0.0051403045654296875, -0.004479646682739258, -0.003818988800048828, -0.0031583309173583984, -0.0024976730346679688, -0.001837015151977539, -0.0011763572692871094, -0.0005156993865966797, 0.00014495849609375, 0.0008056163787841797, 0.0014662742614746094, 0.002126932144165039, 0.0027875900268554688, 0.0034482479095458984, 0.004108905792236328, 0.004769563674926758, 0.0054302215576171875, 0.006090879440307617, 0.006751537322998047, 0.0074121952056884766, 0.008072853088378906, 0.008733510971069336, 0.009394168853759766, 0.010054826736450195, 0.010715484619140625, 0.011376142501831055, 0.012036800384521484, 0.012697458267211914, 0.013358116149902344, 0.014018774032592773, 0.014679431915283203, 0.015340089797973633, 0.016000747680664062, 0.016661405563354492, 0.017322063446044922, 0.01798272132873535, 0.01864337921142578, 0.01930403709411621, 0.01996469497680664, 0.02062535285949707, 0.0212860107421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 6.0, 6.0, 3.0, 10.0, 13.0, 14.0, 10.0, 26.0, 23.0, 30.0, 28.0, 37.0, 31.0, 33.0, 34.0, 36.0, 37.0, 57.0, 50.0, 47.0, 58.0, 37.0, 37.0, 35.0, 37.0, 38.0, 23.0, 33.0, 29.0, 23.0, 17.0, 15.0, 13.0, 14.0, 11.0, 10.0, 8.0, 4.0, 4.0, 10.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.01244354248046875, -0.012094616889953613, -0.011745691299438477, -0.01139676570892334, -0.011047840118408203, -0.010698914527893066, -0.01034998893737793, -0.010001063346862793, -0.009652137756347656, -0.00930321216583252, -0.008954286575317383, -0.008605360984802246, -0.00825643539428711, -0.007907509803771973, -0.007558584213256836, -0.007209658622741699, -0.0068607330322265625, -0.006511807441711426, -0.006162881851196289, -0.005813956260681152, -0.005465030670166016, -0.005116105079650879, -0.004767179489135742, -0.0044182538986206055, -0.004069328308105469, -0.003720402717590332, -0.0033714771270751953, -0.0030225515365600586, -0.002673625946044922, -0.002324700355529785, -0.0019757747650146484, -0.0016268491744995117, -0.001277923583984375, -0.0009289979934692383, -0.0005800724029541016, -0.00023114681243896484, 0.00011777877807617188, 0.0004667043685913086, 0.0008156299591064453, 0.001164555549621582, 0.0015134811401367188, 0.0018624067306518555, 0.002211332321166992, 0.002560257911682129, 0.0029091835021972656, 0.0032581090927124023, 0.003607034683227539, 0.003955960273742676, 0.0043048858642578125, 0.004653811454772949, 0.005002737045288086, 0.005351662635803223, 0.005700588226318359, 0.006049513816833496, 0.006398439407348633, 0.0067473649978637695, 0.007096290588378906, 0.007445216178894043, 0.00779414176940918, 0.008143067359924316, 0.008491992950439453, 0.00884091854095459, 0.009189844131469727, 0.009538769721984863, 0.0098876953125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 14.0, 3.0, 8.0, 5.0, 7.0, 5.0, 12.0, 14.0, 18.0, 26.0, 35.0, 41.0, 53.0, 104.0, 208.0, 355.0, 768.0, 1835.0, 5211.0, 20825.0, 175882.0, 713976.0, 106916.0, 15106.0, 4127.0, 1483.0, 662.0, 299.0, 161.0, 106.0, 77.0, 52.0, 30.0, 36.0, 23.0, 17.0, 10.0, 12.0, 6.0, 8.0, 9.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005889892578125, -0.005689561367034912, -0.005489230155944824, -0.005288898944854736, -0.0050885677337646484, -0.0048882365226745605, -0.004687905311584473, -0.004487574100494385, -0.004287242889404297, -0.004086911678314209, -0.003886580467224121, -0.003686249256134033, -0.0034859180450439453, -0.0032855868339538574, -0.0030852556228637695, -0.0028849244117736816, -0.0026845932006835938, -0.002484261989593506, -0.002283930778503418, -0.00208359956741333, -0.0018832683563232422, -0.0016829371452331543, -0.0014826059341430664, -0.0012822747230529785, -0.0010819435119628906, -0.0008816123008728027, -0.0006812810897827148, -0.00048094987869262695, -0.00028061866760253906, -8.028745651245117e-05, 0.00012004375457763672, 0.0003203749656677246, 0.0005207061767578125, 0.0007210373878479004, 0.0009213685989379883, 0.0011216998100280762, 0.001322031021118164, 0.001522362232208252, 0.0017226934432983398, 0.0019230246543884277, 0.0021233558654785156, 0.0023236870765686035, 0.0025240182876586914, 0.0027243494987487793, 0.002924680709838867, 0.003125011920928955, 0.003325343132019043, 0.003525674343109131, 0.0037260055541992188, 0.003926336765289307, 0.0041266679763793945, 0.004326999187469482, 0.00452733039855957, 0.004727661609649658, 0.004927992820739746, 0.005128324031829834, 0.005328655242919922, 0.00552898645401001, 0.005729317665100098, 0.0059296488761901855, 0.0061299800872802734, 0.006330311298370361, 0.006530642509460449, 0.006730973720550537, 0.006931304931640625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 6.0, 7.0, 5.0, 0.0, 10.0, 10.0, 14.0, 12.0, 19.0, 24.0, 26.0, 30.0, 38.0, 37.0, 0.0, 53.0, 53.0, 63.0, 45.0, 61.0, 50.0, 42.0, 42.0, 52.0, 0.0, 40.0, 44.0, 42.0, 40.0, 24.0, 27.0, 16.0, 13.0, 16.0, 7.0, 0.0, 8.0, 7.0, 9.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.430511474609375e-06, -1.3764947652816772e-06, -1.3224780559539795e-06, -1.2684613466262817e-06, -1.214444637298584e-06, -1.1604279279708862e-06, -1.1064112186431885e-06, -1.0523945093154907e-06, -9.98377799987793e-07, -9.443610906600952e-07, -8.903443813323975e-07, -8.363276720046997e-07, -7.82310962677002e-07, -7.282942533493042e-07, -6.742775440216064e-07, -6.202608346939087e-07, -5.662441253662109e-07, -5.122274160385132e-07, -4.5821070671081543e-07, -4.041939973831177e-07, -3.501772880554199e-07, -2.9616057872772217e-07, -2.421438694000244e-07, -1.8812716007232666e-07, -1.341104507446289e-07, -8.009374141693115e-08, -2.60770320892334e-08, 2.7939677238464355e-08, 8.195638656616211e-08, 1.3597309589385986e-07, 1.8998980522155762e-07, 2.4400651454925537e-07, 2.980232238769531e-07, 3.520399332046509e-07, 4.0605664253234863e-07, 4.600733518600464e-07, 5.140900611877441e-07, 5.681067705154419e-07, 6.221234798431396e-07, 6.761401891708374e-07, 7.301568984985352e-07, 7.841736078262329e-07, 8.381903171539307e-07, 8.922070264816284e-07, 9.462237358093262e-07, 1.000240445137024e-06, 1.0542571544647217e-06, 1.1082738637924194e-06, 1.1622905731201172e-06, 1.216307282447815e-06, 1.2703239917755127e-06, 1.3243407011032104e-06, 1.3783574104309082e-06, 1.432374119758606e-06, 1.4863908290863037e-06, 1.5404075384140015e-06, 1.5944242477416992e-06, 1.648440957069397e-06, 1.7024576663970947e-06, 1.7564743757247925e-06, 1.8104910850524902e-06, 1.864507794380188e-06, 1.9185245037078857e-06, 1.9725412130355835e-06, 2.0265579223632812e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 8.0, 9.0, 14.0, 20.0, 25.0, 26.0, 66.0, 107.0, 189.0, 394.0, 886.0, 2258.0, 9477.0, 107040.0, 853129.0, 64301.0, 7260.0, 1926.0, 731.0, 303.0, 154.0, 89.0, 52.0, 33.0, 13.0, 10.0, 6.0, 4.0, 7.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01078033447265625, -0.010457754135131836, -0.010135173797607422, -0.009812593460083008, -0.009490013122558594, -0.00916743278503418, -0.008844852447509766, -0.008522272109985352, -0.008199691772460938, -0.007877111434936523, -0.007554531097412109, -0.007231950759887695, -0.006909370422363281, -0.006586790084838867, -0.006264209747314453, -0.005941629409790039, -0.005619049072265625, -0.005296468734741211, -0.004973888397216797, -0.004651308059692383, -0.004328727722167969, -0.004006147384643555, -0.0036835670471191406, -0.0033609867095947266, -0.0030384063720703125, -0.0027158260345458984, -0.0023932456970214844, -0.0020706653594970703, -0.0017480850219726562, -0.0014255046844482422, -0.0011029243469238281, -0.0007803440093994141, -0.000457763671875, -0.00013518333435058594, 0.00018739700317382812, 0.0005099773406982422, 0.0008325576782226562, 0.0011551380157470703, 0.0014777183532714844, 0.0018002986907958984, 0.0021228790283203125, 0.0024454593658447266, 0.0027680397033691406, 0.0030906200408935547, 0.0034132003784179688, 0.003735780715942383, 0.004058361053466797, 0.004380941390991211, 0.004703521728515625, 0.005026102066040039, 0.005348682403564453, 0.005671262741088867, 0.005993843078613281, 0.006316423416137695, 0.006639003753662109, 0.0069615840911865234, 0.0072841644287109375, 0.0076067447662353516, 0.007929325103759766, 0.00825190544128418, 0.008574485778808594, 0.008897066116333008, 0.009219646453857422, 0.009542226791381836, 0.00986480712890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 9.0, 3.0, 5.0, 18.0, 27.0, 30.0, 60.0, 91.0, 151.0, 152.0, 152.0, 110.0, 73.0, 44.0, 28.0, 18.0, 12.0, 5.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00650787353515625, -0.0063343048095703125, -0.006160736083984375, -0.0059871673583984375, -0.0058135986328125, -0.0056400299072265625, -0.005466461181640625, -0.0052928924560546875, -0.00511932373046875, -0.0049457550048828125, -0.004772186279296875, -0.0045986175537109375, -0.004425048828125, -0.0042514801025390625, -0.004077911376953125, -0.0039043426513671875, -0.00373077392578125, -0.0035572052001953125, -0.003383636474609375, -0.0032100677490234375, -0.0030364990234375, -0.0028629302978515625, -0.002689361572265625, -0.0025157928466796875, -0.00234222412109375, -0.0021686553955078125, -0.001995086669921875, -0.0018215179443359375, -0.00164794921875, -0.0014743804931640625, -0.001300811767578125, -0.0011272430419921875, -0.00095367431640625, -0.0007801055908203125, -0.000606536865234375, -0.0004329681396484375, -0.0002593994140625, -8.58306884765625e-05, 8.7738037109375e-05, 0.0002613067626953125, 0.00043487548828125, 0.0006084442138671875, 0.000782012939453125, 0.0009555816650390625, 0.001129150390625, 0.0013027191162109375, 0.001476287841796875, 0.0016498565673828125, 0.00182342529296875, 0.0019969940185546875, 0.002170562744140625, 0.0023441314697265625, 0.0025177001953125, 0.0026912689208984375, 0.002864837646484375, 0.0030384063720703125, 0.00321197509765625, 0.0033855438232421875, 0.003559112548828125, 0.0037326812744140625, 0.00390625, 0.0040798187255859375, 0.004253387451171875, 0.0044269561767578125, 0.00460052490234375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 10.0, 70.0, 572.0, 314.0, 33.0, 9.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31873905658721924, -0.31008777022361755, -0.30143651366233826, -0.2927852272987366, -0.2841339409351349, -0.2754826843738556, -0.2668313980102539, -0.2581801116466522, -0.24952885508537292, -0.24087758362293243, -0.23222629725933075, -0.22357502579689026, -0.21492375433444977, -0.20627248287200928, -0.1976211965084076, -0.1889699250459671, -0.18031863868236542, -0.17166736721992493, -0.16301608085632324, -0.15436480939388275, -0.14571353793144226, -0.13706225156784058, -0.12841098010540009, -0.1197597086429596, -0.11110842972993851, -0.10245715081691742, -0.09380587935447693, -0.08515460044145584, -0.07650332152843475, -0.06785205006599426, -0.059200771152973175, -0.050549495965242386, -0.04189823567867279, -0.033246960490942, -0.024595683440566063, -0.015944406390190125, -0.007293131202459335, 0.0013581439852714539, 0.010009422898292542, 0.01866069808602333, 0.02731197327375412, 0.03596324846148491, 0.0446145236492157, 0.053265802562236786, 0.061917077749967575, 0.07056835293769836, 0.07921963185071945, 0.08787091076374054, 0.09652218222618103, 0.10517346113920212, 0.11382473260164261, 0.1224760115146637, 0.1311272829771042, 0.13977855443954468, 0.14842984080314636, 0.15708111226558685, 0.16573238372802734, 0.17438365519046783, 0.18303494155406952, 0.19168621301651, 0.2003374844789505, 0.208988755941391, 0.21764004230499268, 0.22629131376743317, 0.23494260013103485]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 4.0, 7.0, 12.0, 9.0, 8.0, 14.0, 21.0, 20.0, 23.0, 24.0, 40.0, 32.0, 36.0, 47.0, 55.0, 40.0, 49.0, 43.0, 42.0, 48.0, 44.0, 50.0, 43.0, 42.0, 47.0, 34.0, 25.0, 23.0, 26.0, 16.0, 14.0, 18.0, 9.0, 10.0, 4.0, 8.0, 4.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031600356101989746, -0.030321698635816574, -0.029043039306998253, -0.02776437997817993, -0.02648572251200676, -0.025207065045833588, -0.023928405717015266, -0.022649746388196945, -0.021371088922023773, -0.0200924314558506, -0.01881377212703228, -0.01753511279821396, -0.016256455332040787, -0.01497779693454504, -0.013699138537049294, -0.012420480139553547, -0.0111418217420578, -0.009863163344562054, -0.008584504947066307, -0.0073058465495705605, -0.006027188152074814, -0.004748529754579067, -0.0034698713570833206, -0.002191212959587574, -0.0009125545620918274, 0.0003661038354039192, 0.0016447622328996658, 0.0029234206303954124, 0.004202079027891159, 0.005480737425386906, 0.006759395822882652, 0.008038054220378399, 0.009316712617874146, 0.010595371015369892, 0.011874029412865639, 0.013152687810361385, 0.014431346207857132, 0.015710003674030304, 0.016988663002848625, 0.018267322331666946, 0.01954597979784012, 0.02082463726401329, 0.02210329659283161, 0.023381955921649933, 0.024660613387823105, 0.025939270853996277, 0.027217930182814598, 0.02849658951163292, 0.02977524697780609, 0.031053904443979263, 0.032332561910152435, 0.033611223101615906, 0.03488988056778908, 0.03616853803396225, 0.03744719922542572, 0.03872585669159889, 0.040004514157772064, 0.041283171623945236, 0.04256182909011841, 0.04384049028158188, 0.04511914774775505, 0.04639780521392822, 0.04767646640539169, 0.048955123871564865, 0.05023378133773804]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 8.0, 10.0, 8.0, 15.0, 17.0, 19.0, 25.0, 20.0, 45.0, 46.0, 80.0, 115.0, 156.0, 279.0, 477.0, 886.0, 1754.0, 4164.0, 10099.0, 30317.0, 132793.0, 2951413.0, 963189.0, 66001.0, 19889.0, 6987.0, 2780.0, 1195.0, 599.0, 285.0, 200.0, 113.0, 89.0, 62.0, 43.0, 33.0, 21.0, 10.0, 11.0, 9.0, 5.0, 3.0, 7.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.015289306640625, -0.01486217975616455, -0.014435052871704102, -0.014007925987243652, -0.013580799102783203, -0.013153672218322754, -0.012726545333862305, -0.012299418449401855, -0.011872291564941406, -0.011445164680480957, -0.011018037796020508, -0.010590910911560059, -0.01016378402709961, -0.00973665714263916, -0.009309530258178711, -0.008882403373718262, -0.008455276489257812, -0.008028149604797363, -0.007601022720336914, -0.007173895835876465, -0.006746768951416016, -0.006319642066955566, -0.005892515182495117, -0.005465388298034668, -0.005038261413574219, -0.0046111345291137695, -0.00418400764465332, -0.003756880760192871, -0.003329753875732422, -0.0029026269912719727, -0.0024755001068115234, -0.0020483732223510742, -0.001621246337890625, -0.0011941194534301758, -0.0007669925689697266, -0.00033986568450927734, 8.726119995117188e-05, 0.0005143880844116211, 0.0009415149688720703, 0.0013686418533325195, 0.0017957687377929688, 0.002222895622253418, 0.002650022506713867, 0.0030771493911743164, 0.0035042762756347656, 0.003931403160095215, 0.004358530044555664, 0.004785656929016113, 0.0052127838134765625, 0.005639910697937012, 0.006067037582397461, 0.00649416446685791, 0.006921291351318359, 0.007348418235778809, 0.007775545120239258, 0.008202672004699707, 0.008629798889160156, 0.009056925773620605, 0.009484052658081055, 0.009911179542541504, 0.010338306427001953, 0.010765433311462402, 0.011192560195922852, 0.0116196870803833, 0.01204681396484375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 12.0, 23.0, 27.0, 27.0, 43.0, 47.0, 85.0, 90.0, 85.0, 71.0, 84.0, 86.0, 72.0, 64.0, 58.0, 33.0, 23.0, 22.0, 20.0, 14.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00939178466796875, -0.009120821952819824, -0.008849859237670898, -0.008578896522521973, -0.008307933807373047, -0.008036971092224121, -0.007766008377075195, -0.0074950456619262695, -0.007224082946777344, -0.006953120231628418, -0.006682157516479492, -0.006411194801330566, -0.006140232086181641, -0.005869269371032715, -0.005598306655883789, -0.005327343940734863, -0.0050563812255859375, -0.004785418510437012, -0.004514455795288086, -0.00424349308013916, -0.003972530364990234, -0.0037015676498413086, -0.003430604934692383, -0.003159642219543457, -0.0028886795043945312, -0.0026177167892456055, -0.0023467540740966797, -0.002075791358947754, -0.0018048286437988281, -0.0015338659286499023, -0.0012629032135009766, -0.0009919404983520508, -0.000720977783203125, -0.0004500150680541992, -0.00017905235290527344, 9.191036224365234e-05, 0.0003628730773925781, 0.0006338357925415039, 0.0009047985076904297, 0.0011757612228393555, 0.0014467239379882812, 0.001717686653137207, 0.001988649368286133, 0.0022596120834350586, 0.0025305747985839844, 0.00280153751373291, 0.003072500228881836, 0.0033434629440307617, 0.0036144256591796875, 0.0038853883743286133, 0.004156351089477539, 0.004427313804626465, 0.004698276519775391, 0.004969239234924316, 0.005240201950073242, 0.005511164665222168, 0.005782127380371094, 0.0060530900955200195, 0.006324052810668945, 0.006595015525817871, 0.006865978240966797, 0.007136940956115723, 0.0074079036712646484, 0.007678866386413574, 0.0079498291015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 9.0, 13.0, 5.0, 11.0, 21.0, 31.0, 38.0, 56.0, 82.0, 130.0, 295.0, 653.0, 1816.0, 5705.0, 22015.0, 164401.0, 3770109.0, 195077.0, 24227.0, 6068.0, 1989.0, 751.0, 308.0, 159.0, 105.0, 55.0, 41.0, 31.0, 19.0, 16.0, 11.0, 7.0, 7.0, 6.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0223388671875, -0.02171015739440918, -0.02108144760131836, -0.02045273780822754, -0.01982402801513672, -0.0191953182220459, -0.018566608428955078, -0.017937898635864258, -0.017309188842773438, -0.016680479049682617, -0.016051769256591797, -0.015423059463500977, -0.014794349670410156, -0.014165639877319336, -0.013536930084228516, -0.012908220291137695, -0.012279510498046875, -0.011650800704956055, -0.011022090911865234, -0.010393381118774414, -0.009764671325683594, -0.009135961532592773, -0.008507251739501953, -0.007878541946411133, -0.0072498321533203125, -0.006621122360229492, -0.005992412567138672, -0.0053637027740478516, -0.004734992980957031, -0.004106283187866211, -0.0034775733947753906, -0.0028488636016845703, -0.00222015380859375, -0.0015914440155029297, -0.0009627342224121094, -0.00033402442932128906, 0.00029468536376953125, 0.0009233951568603516, 0.0015521049499511719, 0.002180814743041992, 0.0028095245361328125, 0.003438234329223633, 0.004066944122314453, 0.0046956539154052734, 0.005324363708496094, 0.005953073501586914, 0.006581783294677734, 0.007210493087768555, 0.007839202880859375, 0.008467912673950195, 0.009096622467041016, 0.009725332260131836, 0.010354042053222656, 0.010982751846313477, 0.011611461639404297, 0.012240171432495117, 0.012868881225585938, 0.013497591018676758, 0.014126300811767578, 0.014755010604858398, 0.015383720397949219, 0.01601243019104004, 0.01664113998413086, 0.01726984977722168, 0.0178985595703125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 7.0, 8.0, 4.0, 12.0, 9.0, 9.0, 12.0, 28.0, 40.0, 39.0, 49.0, 69.0, 89.0, 169.0, 390.0, 866.0, 1128.0, 541.0, 224.0, 100.0, 73.0, 41.0, 41.0, 25.0, 24.0, 14.0, 14.0, 11.0, 5.0, 5.0, 6.0, 5.0, 2.0, 3.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0097198486328125, -0.009374260902404785, -0.00902867317199707, -0.008683085441589355, -0.00833749771118164, -0.007991909980773926, -0.007646322250366211, -0.007300734519958496, -0.006955146789550781, -0.006609559059143066, -0.0062639713287353516, -0.005918383598327637, -0.005572795867919922, -0.005227208137512207, -0.004881620407104492, -0.004536032676696777, -0.0041904449462890625, -0.0038448572158813477, -0.003499269485473633, -0.003153681755065918, -0.002808094024658203, -0.0024625062942504883, -0.0021169185638427734, -0.0017713308334350586, -0.0014257431030273438, -0.001080155372619629, -0.0007345676422119141, -0.0003889799118041992, -4.3392181396484375e-05, 0.00030219554901123047, 0.0006477832794189453, 0.0009933710098266602, 0.001338958740234375, 0.0016845464706420898, 0.0020301342010498047, 0.0023757219314575195, 0.0027213096618652344, 0.0030668973922729492, 0.003412485122680664, 0.003758072853088379, 0.004103660583496094, 0.004449248313903809, 0.0047948360443115234, 0.005140423774719238, 0.005486011505126953, 0.005831599235534668, 0.006177186965942383, 0.006522774696350098, 0.0068683624267578125, 0.007213950157165527, 0.007559537887573242, 0.007905125617980957, 0.008250713348388672, 0.008596301078796387, 0.008941888809204102, 0.009287476539611816, 0.009633064270019531, 0.009978652000427246, 0.010324239730834961, 0.010669827461242676, 0.01101541519165039, 0.011361002922058105, 0.01170659065246582, 0.012052178382873535, 0.01239776611328125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 9.0, 13.0, 22.0, 40.0, 116.0, 159.0, 240.0, 192.0, 108.0, 53.0, 15.0, 11.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07353758066892624, -0.07120957970619202, -0.0688815712928772, -0.06655357033014297, -0.06422556936740875, -0.06189756095409393, -0.05956955999135971, -0.05724155530333519, -0.05491355061531067, -0.05258554592728615, -0.050257544964551926, -0.047929540276527405, -0.045601535588502884, -0.04327353090047836, -0.04094552993774414, -0.03861752524971962, -0.0362895242869854, -0.033961519598960876, -0.031633518636226654, -0.029305513948202133, -0.026977509260177612, -0.02464950643479824, -0.02232150360941887, -0.019993498921394348, -0.017665496096014977, -0.01533749233931303, -0.013009488582611084, -0.010681485757231712, -0.008353482000529766, -0.00602547824382782, -0.003697475418448448, -0.0013694707304239273, 0.0009585320949554443, 0.003286535618826747, 0.0056145391426980495, 0.007942542433738708, 0.010270546190440655, 0.012598549947142601, 0.014926552772521973, 0.017254557460546494, 0.019582560285925865, 0.021910563111305237, 0.024238567799329758, 0.02656657062470913, 0.0288945734500885, 0.031222578138113022, 0.03355058282613754, 0.035878583788871765, 0.038206588476896286, 0.04053459316492081, 0.04286259412765503, 0.04519059881567955, 0.04751860350370407, 0.04984660446643829, 0.052174609154462814, 0.054502613842487335, 0.05683061480522156, 0.05915861949324608, 0.0614866204559803, 0.06381462514400482, 0.06614262610673904, 0.06847063452005386, 0.07079863548278809, 0.0731266438961029, 0.07545464485883713]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 4.0, 12.0, 10.0, 5.0, 11.0, 13.0, 7.0, 16.0, 16.0, 24.0, 23.0, 29.0, 29.0, 24.0, 29.0, 34.0, 36.0, 42.0, 36.0, 36.0, 50.0, 41.0, 51.0, 44.0, 41.0, 40.0, 28.0, 40.0, 31.0, 28.0, 17.0, 23.0, 19.0, 21.0, 11.0, 12.0, 12.0, 8.0, 9.0, 8.0, 10.0, 1.0, 6.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0], "bins": [-0.027862370014190674, -0.027080954983830452, -0.02629953995347023, -0.025518124923110008, -0.024736709892749786, -0.023955294862389565, -0.023173879832029343, -0.02239246480166912, -0.0216110497713089, -0.020829634740948677, -0.020048219710588455, -0.019266804680228233, -0.01848538964986801, -0.01770397461950779, -0.016922559589147568, -0.016141144558787346, -0.015359729528427124, -0.014578314498066902, -0.01379689946770668, -0.013015484437346458, -0.012234069406986237, -0.011452654376626015, -0.010671239346265793, -0.009889824315905571, -0.009108409285545349, -0.008326994255185127, -0.007545579224824905, -0.0067641641944646835, -0.005982749164104462, -0.00520133413374424, -0.004419919103384018, -0.003638504073023796, -0.0028570890426635742, -0.0020756740123033524, -0.0012942589819431305, -0.0005128439515829086, 0.00026857107877731323, 0.001049986109137535, 0.001831401139497757, 0.002612816169857979, 0.0033942312002182007, 0.0041756462305784225, 0.004957061260938644, 0.005738476291298866, 0.006519891321659088, 0.00730130635201931, 0.008082721382379532, 0.008864136412739754, 0.009645551443099976, 0.010426966473460197, 0.01120838150382042, 0.011989796534180641, 0.012771211564540863, 0.013552626594901085, 0.014334041625261307, 0.015115456655621529, 0.01589687168598175, 0.016678286716341972, 0.017459701746702194, 0.018241116777062416, 0.019022531807422638, 0.01980394683778286, 0.02058536186814308, 0.021366776898503304, 0.022148191928863525]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 8.0, 13.0, 14.0, 24.0, 26.0, 42.0, 94.0, 136.0, 227.0, 449.0, 1157.0, 3312.0, 11949.0, 63801.0, 455578.0, 434116.0, 60812.0, 11482.0, 3164.0, 1073.0, 479.0, 226.0, 134.0, 78.0, 42.0, 41.0, 23.0, 15.0, 6.0, 12.0, 5.0, 4.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0265350341796875, -0.025730609893798828, -0.024926185607910156, -0.024121761322021484, -0.023317337036132812, -0.02251291275024414, -0.02170848846435547, -0.020904064178466797, -0.020099639892578125, -0.019295215606689453, -0.01849079132080078, -0.01768636703491211, -0.016881942749023438, -0.016077518463134766, -0.015273094177246094, -0.014468669891357422, -0.01366424560546875, -0.012859821319580078, -0.012055397033691406, -0.011250972747802734, -0.010446548461914062, -0.00964212417602539, -0.008837699890136719, -0.008033275604248047, -0.007228851318359375, -0.006424427032470703, -0.005620002746582031, -0.004815578460693359, -0.0040111541748046875, -0.0032067298889160156, -0.0024023056030273438, -0.0015978813171386719, -0.00079345703125, 1.0967254638671875e-05, 0.0008153915405273438, 0.0016198158264160156, 0.0024242401123046875, 0.0032286643981933594, 0.004033088684082031, 0.004837512969970703, 0.005641937255859375, 0.006446361541748047, 0.007250785827636719, 0.00805521011352539, 0.008859634399414062, 0.009664058685302734, 0.010468482971191406, 0.011272907257080078, 0.01207733154296875, 0.012881755828857422, 0.013686180114746094, 0.014490604400634766, 0.015295028686523438, 0.01609945297241211, 0.01690387725830078, 0.017708301544189453, 0.018512725830078125, 0.019317150115966797, 0.02012157440185547, 0.02092599868774414, 0.021730422973632812, 0.022534847259521484, 0.023339271545410156, 0.024143695831298828, 0.0249481201171875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 8.0, 13.0, 15.0, 34.0, 28.0, 40.0, 75.0, 79.0, 79.0, 73.0, 89.0, 84.0, 76.0, 58.0, 66.0, 54.0, 47.0, 28.0, 22.0, 19.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.008392333984375, -0.00814288854598999, -0.00789344310760498, -0.007643997669219971, -0.007394552230834961, -0.007145106792449951, -0.006895661354064941, -0.006646215915679932, -0.006396770477294922, -0.006147325038909912, -0.005897879600524902, -0.005648434162139893, -0.005398988723754883, -0.005149543285369873, -0.004900097846984863, -0.0046506524085998535, -0.004401206970214844, -0.004151761531829834, -0.0039023160934448242, -0.0036528706550598145, -0.0034034252166748047, -0.003153979778289795, -0.002904534339904785, -0.0026550889015197754, -0.0024056434631347656, -0.002156198024749756, -0.001906752586364746, -0.0016573071479797363, -0.0014078617095947266, -0.0011584162712097168, -0.000908970832824707, -0.0006595253944396973, -0.0004100799560546875, -0.00016063451766967773, 8.881092071533203e-05, 0.0003382563591003418, 0.0005877017974853516, 0.0008371472358703613, 0.001086592674255371, 0.0013360381126403809, 0.0015854835510253906, 0.0018349289894104004, 0.00208437442779541, 0.00233381986618042, 0.0025832653045654297, 0.0028327107429504395, 0.0030821561813354492, 0.003331601619720459, 0.0035810470581054688, 0.0038304924964904785, 0.004079937934875488, 0.004329383373260498, 0.004578828811645508, 0.004828274250030518, 0.005077719688415527, 0.005327165126800537, 0.005576610565185547, 0.005826056003570557, 0.006075501441955566, 0.006324946880340576, 0.006574392318725586, 0.006823837757110596, 0.0070732831954956055, 0.007322728633880615, 0.007572174072265625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 7.0, 15.0, 11.0, 15.0, 28.0, 44.0, 48.0, 65.0, 75.0, 114.0, 171.0, 215.0, 324.0, 489.0, 879.0, 1633.0, 3747.0, 9632.0, 29699.0, 108193.0, 473545.0, 314844.0, 70466.0, 20671.0, 7260.0, 2857.0, 1350.0, 703.0, 418.0, 288.0, 196.0, 149.0, 102.0, 83.0, 57.0, 50.0, 25.0, 28.0, 18.0, 8.0, 11.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.015899658203125, -0.015384197235107422, -0.014868736267089844, -0.014353275299072266, -0.013837814331054688, -0.01332235336303711, -0.012806892395019531, -0.012291431427001953, -0.011775970458984375, -0.011260509490966797, -0.010745048522949219, -0.01022958755493164, -0.009714126586914062, -0.009198665618896484, -0.008683204650878906, -0.008167743682861328, -0.00765228271484375, -0.007136821746826172, -0.006621360778808594, -0.006105899810791016, -0.0055904388427734375, -0.005074977874755859, -0.004559516906738281, -0.004044055938720703, -0.003528594970703125, -0.003013134002685547, -0.0024976730346679688, -0.0019822120666503906, -0.0014667510986328125, -0.0009512901306152344, -0.00043582916259765625, 7.963180541992188e-05, 0.0005950927734375, 0.0011105537414550781, 0.0016260147094726562, 0.0021414756774902344, 0.0026569366455078125, 0.0031723976135253906, 0.0036878585815429688, 0.004203319549560547, 0.004718780517578125, 0.005234241485595703, 0.005749702453613281, 0.006265163421630859, 0.0067806243896484375, 0.007296085357666016, 0.007811546325683594, 0.008327007293701172, 0.00884246826171875, 0.009357929229736328, 0.009873390197753906, 0.010388851165771484, 0.010904312133789062, 0.01141977310180664, 0.011935234069824219, 0.012450695037841797, 0.012966156005859375, 0.013481616973876953, 0.013997077941894531, 0.01451253890991211, 0.015027999877929688, 0.015543460845947266, 0.016058921813964844, 0.016574382781982422, 0.01708984375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 5.0, 6.0, 7.0, 8.0, 11.0, 15.0, 17.0, 17.0, 23.0, 19.0, 30.0, 33.0, 39.0, 44.0, 34.0, 50.0, 41.0, 41.0, 44.0, 40.0, 38.0, 37.0, 50.0, 41.0, 35.0, 34.0, 39.0, 32.0, 26.0, 20.0, 23.0, 21.0, 15.0, 11.0, 15.0, 7.0, 11.0, 7.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.01308441162109375, -0.01271212100982666, -0.01233983039855957, -0.01196753978729248, -0.01159524917602539, -0.0112229585647583, -0.010850667953491211, -0.010478377342224121, -0.010106086730957031, -0.009733796119689941, -0.009361505508422852, -0.008989214897155762, -0.008616924285888672, -0.008244633674621582, -0.007872343063354492, -0.007500052452087402, -0.0071277618408203125, -0.006755471229553223, -0.006383180618286133, -0.006010890007019043, -0.005638599395751953, -0.005266308784484863, -0.0048940181732177734, -0.004521727561950684, -0.004149436950683594, -0.003777146339416504, -0.003404855728149414, -0.0030325651168823242, -0.0026602745056152344, -0.0022879838943481445, -0.0019156932830810547, -0.0015434026718139648, -0.001171112060546875, -0.0007988214492797852, -0.0004265308380126953, -5.424022674560547e-05, 0.0003180503845214844, 0.0006903409957885742, 0.001062631607055664, 0.001434922218322754, 0.0018072128295898438, 0.0021795034408569336, 0.0025517940521240234, 0.0029240846633911133, 0.003296375274658203, 0.003668665885925293, 0.004040956497192383, 0.004413247108459473, 0.0047855377197265625, 0.005157828330993652, 0.005530118942260742, 0.005902409553527832, 0.006274700164794922, 0.006646990776062012, 0.0070192813873291016, 0.007391571998596191, 0.007763862609863281, 0.008136153221130371, 0.008508443832397461, 0.00888073444366455, 0.00925302505493164, 0.00962531566619873, 0.00999760627746582, 0.01036989688873291, 0.0107421875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 8.0, 3.0, 16.0, 9.0, 15.0, 21.0, 45.0, 42.0, 83.0, 114.0, 232.0, 376.0, 719.0, 1464.0, 3360.0, 9858.0, 33861.0, 161718.0, 577134.0, 200561.0, 40370.0, 11116.0, 3912.0, 1645.0, 821.0, 456.0, 209.0, 135.0, 80.0, 50.0, 41.0, 20.0, 15.0, 16.0, 9.0, 6.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031604766845703125, -0.0030498206615448, -0.002939164638519287, -0.0028285086154937744, -0.0027178525924682617, -0.002607196569442749, -0.0024965405464172363, -0.0023858845233917236, -0.002275228500366211, -0.0021645724773406982, -0.0020539164543151855, -0.0019432604312896729, -0.0018326044082641602, -0.0017219483852386475, -0.0016112923622131348, -0.001500636339187622, -0.0013899803161621094, -0.0012793242931365967, -0.001168668270111084, -0.0010580122470855713, -0.0009473562240600586, -0.0008367002010345459, -0.0007260441780090332, -0.0006153881549835205, -0.0005047321319580078, -0.0003940761089324951, -0.0002834200859069824, -0.00017276406288146973, -6.210803985595703e-05, 4.8547983169555664e-05, 0.00015920400619506836, 0.00026986002922058105, 0.00038051605224609375, 0.0004911720752716064, 0.0006018280982971191, 0.0007124841213226318, 0.0008231401443481445, 0.0009337961673736572, 0.00104445219039917, 0.0011551082134246826, 0.0012657642364501953, 0.001376420259475708, 0.0014870762825012207, 0.0015977323055267334, 0.001708388328552246, 0.0018190443515777588, 0.0019297003746032715, 0.002040356397628784, 0.002151012420654297, 0.0022616684436798096, 0.0023723244667053223, 0.002482980489730835, 0.0025936365127563477, 0.0027042925357818604, 0.002814948558807373, 0.0029256045818328857, 0.0030362606048583984, 0.003146916627883911, 0.003257572650909424, 0.0033682286739349365, 0.0034788846969604492, 0.003589540719985962, 0.0037001967430114746, 0.0038108527660369873, 0.0039215087890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 9.0, 5.0, 0.0, 10.0, 11.0, 15.0, 15.0, 0.0, 24.0, 33.0, 47.0, 0.0, 45.0, 51.0, 51.0, 0.0, 50.0, 64.0, 70.0, 0.0, 55.0, 70.0, 56.0, 66.0, 0.0, 58.0, 44.0, 28.0, 0.0, 29.0, 20.0, 26.0, 0.0, 18.0, 6.0, 9.0, 0.0, 9.0, 3.0, 2.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3709068298339844e-06, -1.325272023677826e-06, -1.2796372175216675e-06, -1.234002411365509e-06, -1.1883676052093506e-06, -1.1427327990531921e-06, -1.0970979928970337e-06, -1.0514631867408752e-06, -1.0058283805847168e-06, -9.601935744285583e-07, -9.145587682723999e-07, -8.689239621162415e-07, -8.23289155960083e-07, -7.776543498039246e-07, -7.320195436477661e-07, -6.863847374916077e-07, -6.407499313354492e-07, -5.951151251792908e-07, -5.494803190231323e-07, -5.038455128669739e-07, -4.5821070671081543e-07, -4.12575900554657e-07, -3.6694109439849854e-07, -3.213062882423401e-07, -2.7567148208618164e-07, -2.300366759300232e-07, -1.8440186977386475e-07, -1.387670636177063e-07, -9.313225746154785e-08, -4.7497451305389404e-08, -1.862645149230957e-09, 4.377216100692749e-08, 8.940696716308594e-08, 1.3504177331924438e-07, 1.8067657947540283e-07, 2.2631138563156128e-07, 2.7194619178771973e-07, 3.175809979438782e-07, 3.632158041000366e-07, 4.0885061025619507e-07, 4.544854164123535e-07, 5.00120222568512e-07, 5.457550287246704e-07, 5.913898348808289e-07, 6.370246410369873e-07, 6.826594471931458e-07, 7.282942533493042e-07, 7.739290595054626e-07, 8.195638656616211e-07, 8.651986718177795e-07, 9.10833477973938e-07, 9.564682841300964e-07, 1.0021030902862549e-06, 1.0477378964424133e-06, 1.0933727025985718e-06, 1.1390075087547302e-06, 1.1846423149108887e-06, 1.2302771210670471e-06, 1.2759119272232056e-06, 1.321546733379364e-06, 1.3671815395355225e-06, 1.412816345691681e-06, 1.4584511518478394e-06, 1.5040859580039978e-06, 1.5497207641601562e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 3.0, 10.0, 9.0, 10.0, 18.0, 17.0, 21.0, 34.0, 47.0, 48.0, 83.0, 97.0, 116.0, 186.0, 313.0, 498.0, 815.0, 1387.0, 2700.0, 5508.0, 12667.0, 34528.0, 117659.0, 417692.0, 323240.0, 84574.0, 26361.0, 10006.0, 4475.0, 2167.0, 1201.0, 718.0, 431.0, 260.0, 169.0, 119.0, 74.0, 72.0, 42.0, 36.0, 25.0, 23.0, 17.0, 14.0, 15.0, 10.0, 12.0, 9.0, 2.0, 1.0, 4.0, 5.0, 4.0, 2.0, 1.0], "bins": [-0.003055572509765625, -0.0029626190662384033, -0.0028696656227111816, -0.00277671217918396, -0.0026837587356567383, -0.0025908052921295166, -0.002497851848602295, -0.0024048984050750732, -0.0023119449615478516, -0.00221899151802063, -0.002126038074493408, -0.0020330846309661865, -0.0019401311874389648, -0.0018471777439117432, -0.0017542243003845215, -0.0016612708568572998, -0.0015683174133300781, -0.0014753639698028564, -0.0013824105262756348, -0.001289457082748413, -0.0011965036392211914, -0.0011035501956939697, -0.001010596752166748, -0.0009176433086395264, -0.0008246898651123047, -0.000731736421585083, -0.0006387829780578613, -0.0005458295345306396, -0.00045287609100341797, -0.0003599226474761963, -0.0002669692039489746, -0.00017401576042175293, -8.106231689453125e-05, 1.189112663269043e-05, 0.00010484457015991211, 0.0001977980136871338, 0.00029075145721435547, 0.00038370490074157715, 0.00047665834426879883, 0.0005696117877960205, 0.0006625652313232422, 0.0007555186748504639, 0.0008484721183776855, 0.0009414255619049072, 0.001034379005432129, 0.0011273324489593506, 0.0012202858924865723, 0.001313239336013794, 0.0014061927795410156, 0.0014991462230682373, 0.001592099666595459, 0.0016850531101226807, 0.0017780065536499023, 0.001870959997177124, 0.0019639134407043457, 0.0020568668842315674, 0.002149820327758789, 0.0022427737712860107, 0.0023357272148132324, 0.002428680658340454, 0.0025216341018676758, 0.0026145875453948975, 0.002707540988922119, 0.002800494432449341, 0.0028934478759765625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 12.0, 14.0, 7.0, 8.0, 13.0, 14.0, 14.0, 22.0, 30.0, 38.0, 33.0, 45.0, 56.0, 43.0, 47.0, 54.0, 61.0, 60.0, 65.0, 57.0, 52.0, 50.0, 28.0, 29.0, 23.0, 19.0, 21.0, 17.0, 7.0, 7.0, 10.0, 8.0, 4.0, 8.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0021610260009765625, -0.002096027135848999, -0.0020310282707214355, -0.001966029405593872, -0.0019010305404663086, -0.0018360316753387451, -0.0017710328102111816, -0.0017060339450836182, -0.0016410350799560547, -0.0015760362148284912, -0.0015110373497009277, -0.0014460384845733643, -0.0013810396194458008, -0.0013160407543182373, -0.0012510418891906738, -0.0011860430240631104, -0.0011210441589355469, -0.0010560452938079834, -0.00099104642868042, -0.0009260475635528564, -0.000861048698425293, -0.0007960498332977295, -0.000731050968170166, -0.0006660521030426025, -0.0006010532379150391, -0.0005360543727874756, -0.0004710555076599121, -0.00040605664253234863, -0.00034105777740478516, -0.0002760589122772217, -0.0002110600471496582, -0.00014606118202209473, -8.106231689453125e-05, -1.6063451766967773e-05, 4.89354133605957e-05, 0.00011393427848815918, 0.00017893314361572266, 0.00024393200874328613, 0.0003089308738708496, 0.0003739297389984131, 0.00043892860412597656, 0.00050392746925354, 0.0005689263343811035, 0.000633925199508667, 0.0006989240646362305, 0.0007639229297637939, 0.0008289217948913574, 0.0008939206600189209, 0.0009589195251464844, 0.0010239183902740479, 0.0010889172554016113, 0.0011539161205291748, 0.0012189149856567383, 0.0012839138507843018, 0.0013489127159118652, 0.0014139115810394287, 0.0014789104461669922, 0.0015439093112945557, 0.0016089081764221191, 0.0016739070415496826, 0.001738905906677246, 0.0018039047718048096, 0.001868903636932373, 0.0019339025020599365, 0.0019989013671875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 9.0, 19.0, 65.0, 114.0, 257.0, 309.0, 132.0, 57.0, 14.0, 12.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0476766973733902, -0.04489632695913315, -0.0421159602701664, -0.03933558985590935, -0.0365552194416523, -0.03377485275268555, -0.030994482338428497, -0.028214111924171448, -0.025433743372559547, -0.022653374820947647, -0.019873004406690598, -0.017092635855078697, -0.014312266372144222, -0.011531896889209747, -0.008751528337597847, -0.005971157923340797, -0.003190789371728897, -0.0004104201216250658, 0.0023699491284787655, 0.005150318145751953, 0.007930687628686428, 0.010711057111620903, 0.013491425663232803, 0.016271796077489853, 0.019052164629101753, 0.021832533180713654, 0.024612903594970703, 0.027393272146582603, 0.030173640698194504, 0.03295401111245155, 0.035734377801418304, 0.038514748215675354, 0.041295118629932404, 0.04407548904418945, 0.046855855733156204, 0.049636226147413254, 0.0524165965616703, 0.055196963250637054, 0.057977333664894104, 0.060757704079151154, 0.0635380744934082, 0.06631844490766525, 0.0690988153219223, 0.07187917828559875, 0.0746595486998558, 0.07743991911411285, 0.0802202895283699, 0.08300065994262695, 0.0857810229063034, 0.08856139332056046, 0.0913417637348175, 0.09412212669849396, 0.09690249711275101, 0.09968286752700806, 0.1024632379412651, 0.10524360835552216, 0.1080239787697792, 0.11080434918403625, 0.1135847195982933, 0.11636509001255035, 0.1191454529762268, 0.12192582339048386, 0.1247061938047409, 0.12748655676841736, 0.130266934633255]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 7.0, 2.0, 13.0, 6.0, 9.0, 11.0, 10.0, 15.0, 20.0, 18.0, 19.0, 31.0, 23.0, 28.0, 29.0, 41.0, 30.0, 34.0, 35.0, 47.0, 38.0, 40.0, 40.0, 47.0, 33.0, 32.0, 30.0, 27.0, 40.0, 27.0, 21.0, 34.0, 28.0, 15.0, 27.0, 19.0, 9.0, 14.0, 14.0, 5.0, 6.0, 9.0, 5.0, 2.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.030215144157409668, -0.029230134561657906, -0.028245124965906143, -0.02726011537015438, -0.02627510577440262, -0.025290096178650856, -0.024305086582899094, -0.02332007698714733, -0.02233506739139557, -0.021350057795643806, -0.020365048199892044, -0.01938003860414028, -0.01839502900838852, -0.017410019412636757, -0.016425009816884995, -0.015440000221133232, -0.01445499062538147, -0.013469981029629707, -0.012484971433877945, -0.011499961838126183, -0.01051495224237442, -0.009529942646622658, -0.008544933050870895, -0.007559923455119133, -0.006574913859367371, -0.005589904263615608, -0.004604894667863846, -0.0036198850721120834, -0.002634875476360321, -0.0016498658806085587, -0.0006648562848567963, 0.0003201533108949661, 0.0013051629066467285, 0.002290172502398491, 0.0032751820981502533, 0.004260191693902016, 0.005245201289653778, 0.0062302108854055405, 0.007215220481157303, 0.008200230076909065, 0.009185239672660828, 0.01017024926841259, 0.011155258864164352, 0.012140268459916115, 0.013125278055667877, 0.01411028765141964, 0.015095297247171402, 0.016080306842923164, 0.017065316438674927, 0.01805032603442669, 0.01903533563017845, 0.020020345225930214, 0.021005354821681976, 0.02199036441743374, 0.0229753740131855, 0.023960383608937263, 0.024945393204689026, 0.02593040280044079, 0.02691541239619255, 0.027900421991944313, 0.028885431587696075, 0.029870441183447838, 0.0308554507791996, 0.03184045851230621, 0.032825469970703125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 10.0, 4.0, 13.0, 10.0, 18.0, 19.0, 25.0, 37.0, 53.0, 89.0, 90.0, 158.0, 293.0, 495.0, 971.0, 2256.0, 5955.0, 19733.0, 92509.0, 2998034.0, 994727.0, 56134.0, 14658.0, 4544.0, 1624.0, 748.0, 371.0, 246.0, 135.0, 96.0, 58.0, 56.0, 42.0, 17.0, 15.0, 13.0, 8.0, 14.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016571044921875, -0.01605081558227539, -0.015530586242675781, -0.015010356903076172, -0.014490127563476562, -0.013969898223876953, -0.013449668884277344, -0.012929439544677734, -0.012409210205078125, -0.011888980865478516, -0.011368751525878906, -0.010848522186279297, -0.010328292846679688, -0.009808063507080078, -0.009287834167480469, -0.00876760482788086, -0.00824737548828125, -0.007727146148681641, -0.007206916809082031, -0.006686687469482422, -0.0061664581298828125, -0.005646228790283203, -0.005125999450683594, -0.004605770111083984, -0.004085540771484375, -0.0035653114318847656, -0.0030450820922851562, -0.002524852752685547, -0.0020046234130859375, -0.0014843940734863281, -0.0009641647338867188, -0.0004439353942871094, 7.62939453125e-05, 0.0005965232849121094, 0.0011167526245117188, 0.0016369819641113281, 0.0021572113037109375, 0.002677440643310547, 0.0031976699829101562, 0.0037178993225097656, 0.004238128662109375, 0.004758358001708984, 0.005278587341308594, 0.005798816680908203, 0.0063190460205078125, 0.006839275360107422, 0.007359504699707031, 0.00787973403930664, 0.00839996337890625, 0.00892019271850586, 0.009440422058105469, 0.009960651397705078, 0.010480880737304688, 0.011001110076904297, 0.011521339416503906, 0.012041568756103516, 0.012561798095703125, 0.013082027435302734, 0.013602256774902344, 0.014122486114501953, 0.014642715454101562, 0.015162944793701172, 0.01568317413330078, 0.01620340347290039, 0.0167236328125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 8.0, 13.0, 25.0, 26.0, 69.0, 47.0, 64.0, 78.0, 110.0, 93.0, 92.0, 78.0, 70.0, 39.0, 53.0, 44.0, 35.0, 29.0, 11.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0093231201171875, -0.009054303169250488, -0.008785486221313477, -0.008516669273376465, -0.008247852325439453, -0.007979035377502441, -0.00771021842956543, -0.007441401481628418, -0.007172584533691406, -0.0069037675857543945, -0.006634950637817383, -0.006366133689880371, -0.006097316741943359, -0.005828499794006348, -0.005559682846069336, -0.005290865898132324, -0.0050220489501953125, -0.004753232002258301, -0.004484415054321289, -0.004215598106384277, -0.003946781158447266, -0.003677964210510254, -0.003409147262573242, -0.0031403303146362305, -0.0028715133666992188, -0.002602696418762207, -0.0023338794708251953, -0.0020650625228881836, -0.0017962455749511719, -0.0015274286270141602, -0.0012586116790771484, -0.0009897947311401367, -0.000720977783203125, -0.0004521608352661133, -0.00018334388732910156, 8.547306060791016e-05, 0.0003542900085449219, 0.0006231069564819336, 0.0008919239044189453, 0.001160740852355957, 0.0014295578002929688, 0.0016983747482299805, 0.001967191696166992, 0.002236008644104004, 0.0025048255920410156, 0.0027736425399780273, 0.003042459487915039, 0.0033112764358520508, 0.0035800933837890625, 0.0038489103317260742, 0.004117727279663086, 0.004386544227600098, 0.004655361175537109, 0.004924178123474121, 0.005192995071411133, 0.0054618120193481445, 0.005730628967285156, 0.005999445915222168, 0.00626826286315918, 0.006537079811096191, 0.006805896759033203, 0.007074713706970215, 0.0073435306549072266, 0.007612347602844238, 0.00788116455078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 11.0, 5.0, 17.0, 31.0, 38.0, 51.0, 74.0, 167.0, 330.0, 851.0, 2184.0, 8688.0, 46561.0, 704681.0, 3322410.0, 89200.0, 13741.0, 3263.0, 1054.0, 422.0, 197.0, 121.0, 71.0, 44.0, 28.0, 15.0, 11.0, 9.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.02142333984375, -0.020889878273010254, -0.020356416702270508, -0.01982295513153076, -0.019289493560791016, -0.01875603199005127, -0.018222570419311523, -0.017689108848571777, -0.01715564727783203, -0.016622185707092285, -0.01608872413635254, -0.015555262565612793, -0.015021800994873047, -0.0144883394241333, -0.013954877853393555, -0.013421416282653809, -0.012887954711914062, -0.012354493141174316, -0.01182103157043457, -0.011287569999694824, -0.010754108428955078, -0.010220646858215332, -0.009687185287475586, -0.00915372371673584, -0.008620262145996094, -0.008086800575256348, -0.0075533390045166016, -0.0070198774337768555, -0.006486415863037109, -0.005952954292297363, -0.005419492721557617, -0.004886031150817871, -0.004352569580078125, -0.003819108009338379, -0.003285646438598633, -0.0027521848678588867, -0.0022187232971191406, -0.0016852617263793945, -0.0011518001556396484, -0.0006183385848999023, -8.487701416015625e-05, 0.00044858455657958984, 0.000982046127319336, 0.001515507698059082, 0.002048969268798828, 0.0025824308395385742, 0.0031158924102783203, 0.0036493539810180664, 0.0041828155517578125, 0.004716277122497559, 0.005249738693237305, 0.005783200263977051, 0.006316661834716797, 0.006850123405456543, 0.007383584976196289, 0.007917046546936035, 0.008450508117675781, 0.008983969688415527, 0.009517431259155273, 0.01005089282989502, 0.010584354400634766, 0.011117815971374512, 0.011651277542114258, 0.012184739112854004, 0.01271820068359375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 8.0, 9.0, 5.0, 17.0, 25.0, 30.0, 27.0, 47.0, 65.0, 83.0, 131.0, 244.0, 578.0, 1269.0, 829.0, 281.0, 132.0, 91.0, 63.0, 42.0, 27.0, 22.0, 14.0, 6.0, 9.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01251220703125, -0.012179851531982422, -0.011847496032714844, -0.011515140533447266, -0.011182785034179688, -0.01085042953491211, -0.010518074035644531, -0.010185718536376953, -0.009853363037109375, -0.009521007537841797, -0.009188652038574219, -0.00885629653930664, -0.008523941040039062, -0.008191585540771484, -0.007859230041503906, -0.007526874542236328, -0.00719451904296875, -0.006862163543701172, -0.006529808044433594, -0.006197452545166016, -0.0058650970458984375, -0.005532741546630859, -0.005200386047363281, -0.004868030548095703, -0.004535675048828125, -0.004203319549560547, -0.0038709640502929688, -0.0035386085510253906, -0.0032062530517578125, -0.0028738975524902344, -0.0025415420532226562, -0.002209186553955078, -0.0018768310546875, -0.0015444755554199219, -0.0012121200561523438, -0.0008797645568847656, -0.0005474090576171875, -0.00021505355834960938, 0.00011730194091796875, 0.0004496574401855469, 0.000782012939453125, 0.0011143684387207031, 0.0014467239379882812, 0.0017790794372558594, 0.0021114349365234375, 0.0024437904357910156, 0.0027761459350585938, 0.003108501434326172, 0.00344085693359375, 0.003773212432861328, 0.004105567932128906, 0.004437923431396484, 0.0047702789306640625, 0.005102634429931641, 0.005434989929199219, 0.005767345428466797, 0.006099700927734375, 0.006432056427001953, 0.006764411926269531, 0.007096767425537109, 0.0074291229248046875, 0.007761478424072266, 0.008093833923339844, 0.008426189422607422, 0.008758544921875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 17.0, 79.0, 579.0, 287.0, 31.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11486508697271347, -0.10841178894042969, -0.1019584909081459, -0.09550519287586212, -0.08905189484357834, -0.08259859681129456, -0.07614530622959137, -0.06969200074672699, -0.0632387101650238, -0.05678541213274002, -0.05033211410045624, -0.043878816068172455, -0.03742551803588867, -0.030972223728895187, -0.024518925696611404, -0.01806562766432762, -0.01161232590675354, -0.005159028340131044, 0.0012942692264914513, 0.00774756632745266, 0.014200864359736443, 0.020654160529375076, 0.02710745856165886, 0.03356075659394264, 0.040014054626226425, 0.04646735265851021, 0.05292065069079399, 0.059373944997787476, 0.06582724303007126, 0.07228054106235504, 0.07873383909463882, 0.08518713712692261, 0.0916404277086258, 0.09809372574090958, 0.10454702377319336, 0.11100032180547714, 0.11745361983776093, 0.12390691041946411, 0.1303602159023285, 0.13681350648403168, 0.14326681196689606, 0.14972010254859924, 0.15617340803146362, 0.1626266986131668, 0.1690800040960312, 0.17553329467773438, 0.18198660016059875, 0.18843989074230194, 0.19489318132400513, 0.2013464719057083, 0.2077997773885727, 0.21425306797027588, 0.22070637345314026, 0.22715966403484344, 0.23361296951770782, 0.240066260099411, 0.2465195655822754, 0.25297287106513977, 0.25942614674568176, 0.26587945222854614, 0.2723327577114105, 0.2787860631942749, 0.2852393388748169, 0.2916926443576813, 0.29814594984054565]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 1.0, 5.0, 6.0, 4.0, 4.0, 12.0, 8.0, 11.0, 23.0, 19.0, 20.0, 21.0, 23.0, 32.0, 37.0, 33.0, 46.0, 38.0, 42.0, 40.0, 49.0, 58.0, 44.0, 45.0, 36.0, 41.0, 40.0, 51.0, 33.0, 23.0, 27.0, 23.0, 18.0, 13.0, 18.0, 12.0, 12.0, 14.0, 6.0, 6.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.026488184928894043, -0.025721199810504913, -0.024954216554760933, -0.024187233299016953, -0.023420248180627823, -0.022653263062238693, -0.021886279806494713, -0.021119296550750732, -0.020352311432361603, -0.019585326313972473, -0.018818343058228493, -0.018051359802484512, -0.017284374684095383, -0.016517389565706253, -0.015750406309962273, -0.014983422122895718, -0.014216437935829163, -0.013449453748762608, -0.012682469561696053, -0.011915485374629498, -0.011148501187562943, -0.010381517000496387, -0.009614532813429832, -0.008847548626363277, -0.008080564439296722, -0.007313580252230167, -0.006546596065163612, -0.005779611878097057, -0.005012627691030502, -0.004245643503963947, -0.0034786593168973923, -0.0027116751298308372, -0.0019446909427642822, -0.0011777067556977272, -0.0004107225686311722, 0.00035626161843538284, 0.0011232458055019379, 0.0018902299925684929, 0.002657214179635048, 0.003424198366701603, 0.004191182553768158, 0.004958166740834713, 0.005725150927901268, 0.006492135114967823, 0.007259119302034378, 0.008026103489100933, 0.008793087676167488, 0.009560071863234043, 0.010327056050300598, 0.011094040237367153, 0.011861024424433708, 0.012628008611500263, 0.013394992798566818, 0.014161976985633373, 0.014928961172699928, 0.01569594442844391, 0.01646292954683304, 0.017229914665222168, 0.01799689792096615, 0.01876388117671013, 0.01953086629509926, 0.020297851413488388, 0.02106483466923237, 0.02183181792497635, 0.02259880304336548]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 10.0, 16.0, 19.0, 27.0, 46.0, 73.0, 97.0, 147.0, 231.0, 424.0, 879.0, 1972.0, 5755.0, 21707.0, 109465.0, 556932.0, 285342.0, 48326.0, 11034.0, 3344.0, 1254.0, 567.0, 331.0, 199.0, 119.0, 67.0, 51.0, 43.0, 24.0, 18.0, 11.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0206146240234375, -0.019944429397583008, -0.019274234771728516, -0.018604040145874023, -0.01793384552001953, -0.01726365089416504, -0.016593456268310547, -0.015923261642456055, -0.015253067016601562, -0.01458287239074707, -0.013912677764892578, -0.013242483139038086, -0.012572288513183594, -0.011902093887329102, -0.01123189926147461, -0.010561704635620117, -0.009891510009765625, -0.009221315383911133, -0.00855112075805664, -0.007880926132202148, -0.007210731506347656, -0.006540536880493164, -0.005870342254638672, -0.00520014762878418, -0.0045299530029296875, -0.0038597583770751953, -0.003189563751220703, -0.002519369125366211, -0.0018491744995117188, -0.0011789798736572266, -0.0005087852478027344, 0.0001614093780517578, 0.00083160400390625, 0.0015017986297607422, 0.0021719932556152344, 0.0028421878814697266, 0.0035123825073242188, 0.004182577133178711, 0.004852771759033203, 0.005522966384887695, 0.0061931610107421875, 0.00686335563659668, 0.007533550262451172, 0.008203744888305664, 0.008873939514160156, 0.009544134140014648, 0.01021432876586914, 0.010884523391723633, 0.011554718017578125, 0.012224912643432617, 0.01289510726928711, 0.013565301895141602, 0.014235496520996094, 0.014905691146850586, 0.015575885772705078, 0.01624608039855957, 0.016916275024414062, 0.017586469650268555, 0.018256664276123047, 0.01892685890197754, 0.01959705352783203, 0.020267248153686523, 0.020937442779541016, 0.021607637405395508, 0.02227783203125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 8.0, 9.0, 8.0, 20.0, 18.0, 53.0, 48.0, 70.0, 69.0, 91.0, 103.0, 111.0, 71.0, 72.0, 61.0, 61.0, 45.0, 39.0, 21.0, 13.0, 9.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0081939697265625, -0.00793921947479248, -0.007684469223022461, -0.007429718971252441, -0.007174968719482422, -0.006920218467712402, -0.006665468215942383, -0.006410717964172363, -0.006155967712402344, -0.005901217460632324, -0.005646467208862305, -0.005391716957092285, -0.005136966705322266, -0.004882216453552246, -0.0046274662017822266, -0.004372715950012207, -0.0041179656982421875, -0.003863215446472168, -0.0036084651947021484, -0.003353714942932129, -0.0030989646911621094, -0.00284421443939209, -0.0025894641876220703, -0.0023347139358520508, -0.0020799636840820312, -0.0018252134323120117, -0.0015704631805419922, -0.0013157129287719727, -0.0010609626770019531, -0.0008062124252319336, -0.0005514621734619141, -0.00029671192169189453, -4.1961669921875e-05, 0.00021278858184814453, 0.00046753883361816406, 0.0007222890853881836, 0.0009770393371582031, 0.0012317895889282227, 0.0014865398406982422, 0.0017412900924682617, 0.0019960403442382812, 0.0022507905960083008, 0.0025055408477783203, 0.00276029109954834, 0.0030150413513183594, 0.003269791603088379, 0.0035245418548583984, 0.003779292106628418, 0.0040340423583984375, 0.004288792610168457, 0.0045435428619384766, 0.004798293113708496, 0.005053043365478516, 0.005307793617248535, 0.005562543869018555, 0.005817294120788574, 0.006072044372558594, 0.006326794624328613, 0.006581544876098633, 0.006836295127868652, 0.007091045379638672, 0.007345795631408691, 0.007600545883178711, 0.00785529613494873, 0.00811004638671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 10.0, 6.0, 5.0, 19.0, 26.0, 49.0, 52.0, 74.0, 81.0, 99.0, 165.0, 255.0, 367.0, 741.0, 1542.0, 3413.0, 8756.0, 23108.0, 68085.0, 218214.0, 434512.0, 192891.0, 60705.0, 21017.0, 7913.0, 3203.0, 1334.0, 702.0, 357.0, 277.0, 161.0, 115.0, 72.0, 57.0, 47.0, 30.0, 29.0, 17.0, 13.0, 8.0, 10.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0108795166015625, -0.010533571243286133, -0.010187625885009766, -0.009841680526733398, -0.009495735168457031, -0.009149789810180664, -0.008803844451904297, -0.00845789909362793, -0.008111953735351562, -0.007766008377075195, -0.007420063018798828, -0.007074117660522461, -0.006728172302246094, -0.0063822269439697266, -0.006036281585693359, -0.005690336227416992, -0.005344390869140625, -0.004998445510864258, -0.004652500152587891, -0.0043065547943115234, -0.003960609436035156, -0.003614664077758789, -0.003268718719482422, -0.0029227733612060547, -0.0025768280029296875, -0.0022308826446533203, -0.0018849372863769531, -0.001538991928100586, -0.0011930465698242188, -0.0008471012115478516, -0.0005011558532714844, -0.0001552104949951172, 0.00019073486328125, 0.0005366802215576172, 0.0008826255798339844, 0.0012285709381103516, 0.0015745162963867188, 0.001920461654663086, 0.002266407012939453, 0.0026123523712158203, 0.0029582977294921875, 0.0033042430877685547, 0.003650188446044922, 0.003996133804321289, 0.004342079162597656, 0.0046880245208740234, 0.005033969879150391, 0.005379915237426758, 0.005725860595703125, 0.006071805953979492, 0.006417751312255859, 0.0067636966705322266, 0.007109642028808594, 0.007455587387084961, 0.007801532745361328, 0.008147478103637695, 0.008493423461914062, 0.00883936882019043, 0.009185314178466797, 0.009531259536743164, 0.009877204895019531, 0.010223150253295898, 0.010569095611572266, 0.010915040969848633, 0.011260986328125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 5.0, 2.0, 14.0, 7.0, 13.0, 21.0, 21.0, 16.0, 15.0, 23.0, 29.0, 31.0, 39.0, 39.0, 34.0, 40.0, 36.0, 33.0, 44.0, 44.0, 43.0, 42.0, 39.0, 33.0, 41.0, 31.0, 26.0, 37.0, 30.0, 20.0, 21.0, 22.0, 18.0, 18.0, 14.0, 16.0, 9.0, 3.0, 9.0, 3.0, 6.0, 7.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0085906982421875, -0.008310079574584961, -0.008029460906982422, -0.007748842239379883, -0.007468223571777344, -0.007187604904174805, -0.006906986236572266, -0.0066263675689697266, -0.0063457489013671875, -0.0060651302337646484, -0.005784511566162109, -0.00550389289855957, -0.005223274230957031, -0.004942655563354492, -0.004662036895751953, -0.004381418228149414, -0.004100799560546875, -0.003820180892944336, -0.003539562225341797, -0.003258943557739258, -0.0029783248901367188, -0.0026977062225341797, -0.0024170875549316406, -0.0021364688873291016, -0.0018558502197265625, -0.0015752315521240234, -0.0012946128845214844, -0.0010139942169189453, -0.0007333755493164062, -0.0004527568817138672, -0.00017213821411132812, 0.00010848045349121094, 0.00038909912109375, 0.0006697177886962891, 0.0009503364562988281, 0.0012309551239013672, 0.0015115737915039062, 0.0017921924591064453, 0.0020728111267089844, 0.0023534297943115234, 0.0026340484619140625, 0.0029146671295166016, 0.0031952857971191406, 0.0034759044647216797, 0.0037565231323242188, 0.004037141799926758, 0.004317760467529297, 0.004598379135131836, 0.004878997802734375, 0.005159616470336914, 0.005440235137939453, 0.005720853805541992, 0.006001472473144531, 0.00628209114074707, 0.006562709808349609, 0.0068433284759521484, 0.0071239471435546875, 0.0074045658111572266, 0.007685184478759766, 0.007965803146362305, 0.008246421813964844, 0.008527040481567383, 0.008807659149169922, 0.009088277816772461, 0.009368896484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 10.0, 16.0, 12.0, 27.0, 31.0, 48.0, 73.0, 145.0, 228.0, 410.0, 737.0, 1613.0, 3244.0, 7635.0, 20192.0, 62150.0, 220204.0, 451842.0, 193512.0, 54827.0, 18235.0, 7105.0, 3059.0, 1461.0, 756.0, 378.0, 221.0, 154.0, 70.0, 58.0, 34.0, 20.0, 17.0, 8.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002475738525390625, -0.0023887157440185547, -0.0023016929626464844, -0.002214670181274414, -0.0021276473999023438, -0.0020406246185302734, -0.001953601837158203, -0.0018665790557861328, -0.0017795562744140625, -0.0016925334930419922, -0.0016055107116699219, -0.0015184879302978516, -0.0014314651489257812, -0.001344442367553711, -0.0012574195861816406, -0.0011703968048095703, -0.0010833740234375, -0.0009963512420654297, -0.0009093284606933594, -0.0008223056793212891, -0.0007352828979492188, -0.0006482601165771484, -0.0005612373352050781, -0.0004742145538330078, -0.0003871917724609375, -0.0003001689910888672, -0.00021314620971679688, -0.00012612342834472656, -3.910064697265625e-05, 4.792213439941406e-05, 0.00013494491577148438, 0.0002219676971435547, 0.000308990478515625, 0.0003960132598876953, 0.0004830360412597656, 0.0005700588226318359, 0.0006570816040039062, 0.0007441043853759766, 0.0008311271667480469, 0.0009181499481201172, 0.0010051727294921875, 0.0010921955108642578, 0.0011792182922363281, 0.0012662410736083984, 0.0013532638549804688, 0.001440286636352539, 0.0015273094177246094, 0.0016143321990966797, 0.00170135498046875, 0.0017883777618408203, 0.0018754005432128906, 0.001962423324584961, 0.0020494461059570312, 0.0021364688873291016, 0.002223491668701172, 0.002310514450073242, 0.0023975372314453125, 0.002484560012817383, 0.002571582794189453, 0.0026586055755615234, 0.0027456283569335938, 0.002832651138305664, 0.0029196739196777344, 0.0030066967010498047, 0.003093719482421875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 9.0, 0.0, 7.0, 8.0, 15.0, 20.0, 12.0, 0.0, 21.0, 35.0, 36.0, 41.0, 41.0, 0.0, 41.0, 48.0, 55.0, 65.0, 57.0, 0.0, 73.0, 66.0, 47.0, 48.0, 0.0, 45.0, 40.0, 36.0, 29.0, 20.0, 0.0, 21.0, 15.0, 9.0, 9.0, 12.0, 0.0, 7.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.430511474609375e-06, -1.3811513781547546e-06, -1.3317912817001343e-06, -1.282431185245514e-06, -1.2330710887908936e-06, -1.1837109923362732e-06, -1.1343508958816528e-06, -1.0849907994270325e-06, -1.0356307029724121e-06, -9.862706065177917e-07, -9.369105100631714e-07, -8.87550413608551e-07, -8.381903171539307e-07, -7.888302206993103e-07, -7.394701242446899e-07, -6.901100277900696e-07, -6.407499313354492e-07, -5.913898348808289e-07, -5.420297384262085e-07, -4.926696419715881e-07, -4.4330954551696777e-07, -3.939494490623474e-07, -3.4458935260772705e-07, -2.952292561531067e-07, -2.4586915969848633e-07, -1.9650906324386597e-07, -1.471489667892456e-07, -9.778887033462524e-08, -4.842877388000488e-08, 9.313225746154785e-10, 5.029141902923584e-08, 9.96515154838562e-08, 1.4901161193847656e-07, 1.9837170839309692e-07, 2.477318048477173e-07, 2.9709190130233765e-07, 3.46451997756958e-07, 3.9581209421157837e-07, 4.4517219066619873e-07, 4.945322871208191e-07, 5.438923835754395e-07, 5.932524800300598e-07, 6.426125764846802e-07, 6.919726729393005e-07, 7.413327693939209e-07, 7.906928658485413e-07, 8.400529623031616e-07, 8.89413058757782e-07, 9.387731552124023e-07, 9.881332516670227e-07, 1.037493348121643e-06, 1.0868534445762634e-06, 1.1362135410308838e-06, 1.1855736374855042e-06, 1.2349337339401245e-06, 1.2842938303947449e-06, 1.3336539268493652e-06, 1.3830140233039856e-06, 1.432374119758606e-06, 1.4817342162132263e-06, 1.5310943126678467e-06, 1.580454409122467e-06, 1.6298145055770874e-06, 1.6791746020317078e-06, 1.7285346984863281e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 8.0, 8.0, 12.0, 21.0, 40.0, 53.0, 93.0, 167.0, 369.0, 842.0, 2182.0, 6579.0, 25198.0, 135756.0, 622561.0, 206397.0, 35073.0, 8530.0, 2689.0, 1063.0, 422.0, 201.0, 116.0, 67.0, 44.0, 24.0, 19.0, 12.0, 7.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0044403076171875, -0.004295229911804199, -0.0041501522064208984, -0.004005074501037598, -0.003859996795654297, -0.003714919090270996, -0.0035698413848876953, -0.0034247636795043945, -0.0032796859741210938, -0.003134608268737793, -0.002989530563354492, -0.0028444528579711914, -0.0026993751525878906, -0.00255429744720459, -0.002409219741821289, -0.0022641420364379883, -0.0021190643310546875, -0.0019739866256713867, -0.001828908920288086, -0.0016838312149047852, -0.0015387535095214844, -0.0013936758041381836, -0.0012485980987548828, -0.001103520393371582, -0.0009584426879882812, -0.0008133649826049805, -0.0006682872772216797, -0.0005232095718383789, -0.0003781318664550781, -0.00023305416107177734, -8.797645568847656e-05, 5.710124969482422e-05, 0.000202178955078125, 0.0003472566604614258, 0.0004923343658447266, 0.0006374120712280273, 0.0007824897766113281, 0.0009275674819946289, 0.0010726451873779297, 0.0012177228927612305, 0.0013628005981445312, 0.001507878303527832, 0.0016529560089111328, 0.0017980337142944336, 0.0019431114196777344, 0.002088189125061035, 0.002233266830444336, 0.0023783445358276367, 0.0025234222412109375, 0.0026684999465942383, 0.002813577651977539, 0.00295865535736084, 0.0031037330627441406, 0.0032488107681274414, 0.003393888473510742, 0.003538966178894043, 0.0036840438842773438, 0.0038291215896606445, 0.003974199295043945, 0.004119277000427246, 0.004264354705810547, 0.004409432411193848, 0.0045545101165771484, 0.004699587821960449, 0.00484466552734375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 7.0, 6.0, 9.0, 15.0, 16.0, 20.0, 22.0, 28.0, 37.0, 38.0, 42.0, 60.0, 66.0, 64.0, 74.0, 60.0, 59.0, 55.0, 58.0, 46.0, 38.0, 34.0, 29.0, 25.0, 22.0, 14.0, 15.0, 10.0, 9.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017786026000976562, -0.0017040818929672241, -0.001629561185836792, -0.0015550404787063599, -0.0014805197715759277, -0.0014059990644454956, -0.0013314783573150635, -0.0012569576501846313, -0.0011824369430541992, -0.001107916235923767, -0.001033395528793335, -0.0009588748216629028, -0.0008843541145324707, -0.0008098334074020386, -0.0007353127002716064, -0.0006607919931411743, -0.0005862712860107422, -0.0005117505788803101, -0.00043722987174987793, -0.0003627091646194458, -0.00028818845748901367, -0.00021366775035858154, -0.00013914704322814941, -6.462633609771729e-05, 9.894371032714844e-06, 8.441507816314697e-05, 0.0001589357852935791, 0.00023345649242401123, 0.00030797719955444336, 0.0003824979066848755, 0.0004570186138153076, 0.0005315393209457397, 0.0006060600280761719, 0.000680580735206604, 0.0007551014423370361, 0.0008296221494674683, 0.0009041428565979004, 0.0009786635637283325, 0.0010531842708587646, 0.0011277049779891968, 0.001202225685119629, 0.001276746392250061, 0.0013512670993804932, 0.0014257878065109253, 0.0015003085136413574, 0.0015748292207717896, 0.0016493499279022217, 0.0017238706350326538, 0.001798391342163086, 0.001872912049293518, 0.0019474327564239502, 0.0020219534635543823, 0.0020964741706848145, 0.0021709948778152466, 0.0022455155849456787, 0.002320036292076111, 0.002394556999206543, 0.002469077706336975, 0.0025435984134674072, 0.0026181191205978394, 0.0026926398277282715, 0.0027671605348587036, 0.0028416812419891357, 0.002916201949119568, 0.00299072265625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 7.0, 21.0, 140.0, 682.0, 143.0, 19.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04277254641056061, -0.036234356462955475, -0.02969617024064064, -0.023157982155680656, -0.016619794070720673, -0.01008160412311554, -0.003543417900800705, 0.0029947683215141296, 0.009532958269119263, 0.016071146354079247, 0.02260933443903923, 0.029147522523999214, 0.0356857106089592, 0.04222390055656433, 0.048762086778879166, 0.055300273001194, 0.06183846294879913, 0.06837665289640427, 0.0749148428440094, 0.08145302534103394, 0.08799121528863907, 0.0945294052362442, 0.10106758773326874, 0.10760577768087387, 0.114143967628479, 0.12068215757608414, 0.12722034752368927, 0.1337585300207138, 0.14029672741889954, 0.14683490991592407, 0.1533730924129486, 0.15991127490997314, 0.16644948720932007, 0.1729876697063446, 0.17952586710453033, 0.18606404960155487, 0.1926022469997406, 0.19914042949676514, 0.20567861199378967, 0.2122167944908142, 0.21875499188899994, 0.22529317438602448, 0.2318313717842102, 0.23836955428123474, 0.24490773677825928, 0.2514459490776062, 0.25798413157463074, 0.2645223140716553, 0.2710604965686798, 0.27759867906570435, 0.2841368615627289, 0.2906750738620758, 0.29721325635910034, 0.3037514388561249, 0.3102896213531494, 0.31682780385017395, 0.3233659863471985, 0.329904168844223, 0.33644235134124756, 0.3429805636405945, 0.349518746137619, 0.35605692863464355, 0.3625951111316681, 0.3691332936286926, 0.37567150592803955]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 8.0, 4.0, 6.0, 5.0, 6.0, 15.0, 10.0, 16.0, 24.0, 15.0, 18.0, 16.0, 19.0, 27.0, 36.0, 24.0, 46.0, 45.0, 45.0, 40.0, 39.0, 36.0, 35.0, 50.0, 63.0, 38.0, 42.0, 33.0, 41.0, 32.0, 38.0, 17.0, 21.0, 17.0, 14.0, 7.0, 8.0, 8.0, 10.0, 7.0, 8.0, 6.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024968445301055908, -0.024116385728120804, -0.0232643261551857, -0.022412266582250595, -0.02156020700931549, -0.020708147436380386, -0.019856087863445282, -0.019004028290510178, -0.018151968717575073, -0.01729990914463997, -0.016447849571704865, -0.01559578999876976, -0.014743730425834656, -0.013891670852899551, -0.013039611279964447, -0.012187551707029343, -0.011335492134094238, -0.010483432561159134, -0.00963137298822403, -0.008779313415288925, -0.00792725384235382, -0.007075194269418716, -0.006223134696483612, -0.005371075123548508, -0.004519015550613403, -0.003666955977678299, -0.0028148964047431946, -0.00196283683180809, -0.0011107772588729858, -0.00025871768593788147, 0.0005933418869972229, 0.0014454014599323273, 0.0022974610328674316, 0.003149520605802536, 0.00400158017873764, 0.004853639751672745, 0.005705699324607849, 0.0065577588975429535, 0.007409818470478058, 0.008261878043413162, 0.009113937616348267, 0.009965997189283371, 0.010818056762218475, 0.01167011633515358, 0.012522175908088684, 0.013374235481023788, 0.014226295053958893, 0.015078354626893997, 0.0159304141998291, 0.016782473772764206, 0.01763453334569931, 0.018486592918634415, 0.01933865249156952, 0.020190712064504623, 0.021042771637439728, 0.021894831210374832, 0.022746890783309937, 0.02359895035624504, 0.024451009929180145, 0.02530306950211525, 0.026155129075050354, 0.02700718864798546, 0.027859248220920563, 0.028711307793855667, 0.02956336736679077]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 9.0, 10.0, 10.0, 6.0, 19.0, 24.0, 22.0, 40.0, 70.0, 94.0, 121.0, 207.0, 369.0, 688.0, 1507.0, 3889.0, 13612.0, 57645.0, 1433656.0, 2579692.0, 79476.0, 15315.0, 4539.0, 1647.0, 655.0, 316.0, 206.0, 115.0, 84.0, 58.0, 45.0, 32.0, 29.0, 18.0, 16.0, 7.0, 6.0, 8.0, 2.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.01291656494140625, -0.012537479400634766, -0.012158393859863281, -0.011779308319091797, -0.011400222778320312, -0.011021137237548828, -0.010642051696777344, -0.01026296615600586, -0.009883880615234375, -0.00950479507446289, -0.009125709533691406, -0.008746623992919922, -0.008367538452148438, -0.007988452911376953, -0.007609367370605469, -0.007230281829833984, -0.0068511962890625, -0.006472110748291016, -0.006093025207519531, -0.005713939666748047, -0.0053348541259765625, -0.004955768585205078, -0.004576683044433594, -0.004197597503662109, -0.003818511962890625, -0.0034394264221191406, -0.0030603408813476562, -0.002681255340576172, -0.0023021697998046875, -0.0019230842590332031, -0.0015439987182617188, -0.0011649131774902344, -0.00078582763671875, -0.0004067420959472656, -2.765655517578125e-05, 0.0003514289855957031, 0.0007305145263671875, 0.0011096000671386719, 0.0014886856079101562, 0.0018677711486816406, 0.002246856689453125, 0.0026259422302246094, 0.0030050277709960938, 0.003384113311767578, 0.0037631988525390625, 0.004142284393310547, 0.004521369934082031, 0.004900455474853516, 0.005279541015625, 0.005658626556396484, 0.006037712097167969, 0.006416797637939453, 0.0067958831787109375, 0.007174968719482422, 0.007554054260253906, 0.00793313980102539, 0.008312225341796875, 0.00869131088256836, 0.009070396423339844, 0.009449481964111328, 0.009828567504882812, 0.010207653045654297, 0.010586738586425781, 0.010965824127197266, 0.01134490966796875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 6.0, 9.0, 9.0, 24.0, 34.0, 39.0, 39.0, 65.0, 66.0, 68.0, 102.0, 111.0, 82.0, 80.0, 54.0, 50.0, 50.0, 39.0, 33.0, 15.0, 15.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007160186767578125, -0.006924092769622803, -0.0066879987716674805, -0.006451904773712158, -0.006215810775756836, -0.005979716777801514, -0.005743622779846191, -0.005507528781890869, -0.005271434783935547, -0.005035340785980225, -0.004799246788024902, -0.00456315279006958, -0.004327058792114258, -0.0040909647941589355, -0.0038548707962036133, -0.003618776798248291, -0.0033826828002929688, -0.0031465888023376465, -0.0029104948043823242, -0.002674400806427002, -0.0024383068084716797, -0.0022022128105163574, -0.001966118812561035, -0.0017300248146057129, -0.0014939308166503906, -0.0012578368186950684, -0.001021742820739746, -0.0007856488227844238, -0.0005495548248291016, -0.0003134608268737793, -7.736682891845703e-05, 0.00015872716903686523, 0.0003948211669921875, 0.0006309151649475098, 0.000867009162902832, 0.0011031031608581543, 0.0013391971588134766, 0.0015752911567687988, 0.001811385154724121, 0.0020474791526794434, 0.0022835731506347656, 0.002519667148590088, 0.00275576114654541, 0.0029918551445007324, 0.0032279491424560547, 0.003464043140411377, 0.0037001371383666992, 0.0039362311363220215, 0.004172325134277344, 0.004408419132232666, 0.004644513130187988, 0.0048806071281433105, 0.005116701126098633, 0.005352795124053955, 0.005588889122009277, 0.0058249831199646, 0.006061077117919922, 0.006297171115875244, 0.006533265113830566, 0.006769359111785889, 0.007005453109741211, 0.007241547107696533, 0.0074776411056518555, 0.007713735103607178, 0.0079498291015625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 11.0, 5.0, 11.0, 15.0, 28.0, 44.0, 57.0, 71.0, 137.0, 243.0, 381.0, 669.0, 1143.0, 2081.0, 3982.0, 7806.0, 17255.0, 44430.0, 152640.0, 1745339.0, 1978934.0, 159609.0, 45219.0, 17631.0, 7831.0, 3917.0, 2046.0, 1144.0, 642.0, 355.0, 232.0, 133.0, 87.0, 39.0, 32.0, 25.0, 17.0, 14.0, 9.0, 5.0, 2.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.006855010986328125, -0.006653487682342529, -0.006451964378356934, -0.006250441074371338, -0.006048917770385742, -0.0058473944664001465, -0.005645871162414551, -0.005444347858428955, -0.005242824554443359, -0.005041301250457764, -0.004839777946472168, -0.004638254642486572, -0.0044367313385009766, -0.004235208034515381, -0.004033684730529785, -0.0038321614265441895, -0.0036306381225585938, -0.003429114818572998, -0.0032275915145874023, -0.0030260682106018066, -0.002824544906616211, -0.0026230216026306152, -0.0024214982986450195, -0.002219974994659424, -0.002018451690673828, -0.0018169283866882324, -0.0016154050827026367, -0.001413881778717041, -0.0012123584747314453, -0.0010108351707458496, -0.0008093118667602539, -0.0006077885627746582, -0.0004062652587890625, -0.0002047419548034668, -3.2186508178710938e-06, 0.0001983046531677246, 0.0003998279571533203, 0.000601351261138916, 0.0008028745651245117, 0.0010043978691101074, 0.0012059211730957031, 0.0014074444770812988, 0.0016089677810668945, 0.0018104910850524902, 0.002012014389038086, 0.0022135376930236816, 0.0024150609970092773, 0.002616584300994873, 0.0028181076049804688, 0.0030196309089660645, 0.00322115421295166, 0.003422677516937256, 0.0036242008209228516, 0.0038257241249084473, 0.004027247428894043, 0.004228770732879639, 0.004430294036865234, 0.00463181734085083, 0.004833340644836426, 0.0050348639488220215, 0.005236387252807617, 0.005437910556793213, 0.005639433860778809, 0.005840957164764404, 0.00604248046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 1.0, 5.0, 5.0, 4.0, 3.0, 7.0, 6.0, 8.0, 13.0, 13.0, 16.0, 16.0, 31.0, 37.0, 42.0, 42.0, 71.0, 107.0, 182.0, 322.0, 648.0, 1072.0, 612.0, 320.0, 160.0, 97.0, 57.0, 34.0, 27.0, 19.0, 18.0, 12.0, 18.0, 13.0, 7.0, 8.0, 2.0, 8.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005779266357421875, -0.005600392818450928, -0.0054215192794799805, -0.005242645740509033, -0.005063772201538086, -0.004884898662567139, -0.004706025123596191, -0.004527151584625244, -0.004348278045654297, -0.00416940450668335, -0.003990530967712402, -0.003811657428741455, -0.003632783889770508, -0.0034539103507995605, -0.0032750368118286133, -0.003096163272857666, -0.0029172897338867188, -0.0027384161949157715, -0.0025595426559448242, -0.002380669116973877, -0.0022017955780029297, -0.0020229220390319824, -0.0018440485000610352, -0.0016651749610900879, -0.0014863014221191406, -0.0013074278831481934, -0.001128554344177246, -0.0009496808052062988, -0.0007708072662353516, -0.0005919337272644043, -0.00041306018829345703, -0.00023418664932250977, -5.53131103515625e-05, 0.00012356042861938477, 0.00030243396759033203, 0.0004813075065612793, 0.0006601810455322266, 0.0008390545845031738, 0.001017928123474121, 0.0011968016624450684, 0.0013756752014160156, 0.0015545487403869629, 0.0017334222793579102, 0.0019122958183288574, 0.0020911693572998047, 0.002270042896270752, 0.0024489164352416992, 0.0026277899742126465, 0.0028066635131835938, 0.002985537052154541, 0.0031644105911254883, 0.0033432841300964355, 0.003522157669067383, 0.00370103120803833, 0.0038799047470092773, 0.004058778285980225, 0.004237651824951172, 0.004416525363922119, 0.004595398902893066, 0.004774272441864014, 0.004953145980834961, 0.005132019519805908, 0.0053108930587768555, 0.005489766597747803, 0.00566864013671875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 5.0, 29.0, 69.0, 273.0, 396.0, 173.0, 37.0, 13.0, 6.0, 2.0, 1.0, 1.0], "bins": [-0.13596530258655548, -0.1335551142692566, -0.1311449110507965, -0.12873472273349762, -0.12632451951503754, -0.12391433119773865, -0.12150413542985916, -0.11909393966197968, -0.11668375134468079, -0.1142735555768013, -0.11186335980892181, -0.10945317149162292, -0.10704297572374344, -0.10463277995586395, -0.10222258418798447, -0.09981238842010498, -0.0974021926522255, -0.09499199688434601, -0.09258180111646652, -0.09017161279916763, -0.08776141703128815, -0.08535122126340866, -0.08294102549552917, -0.08053082972764969, -0.0781206339597702, -0.07571043819189072, -0.07330024242401123, -0.07089005410671234, -0.06847985833883286, -0.06606966257095337, -0.06365946680307388, -0.0612492710351944, -0.058839090168476105, -0.05642889440059662, -0.05401870235800743, -0.051608506590127945, -0.04919831454753876, -0.04678811877965927, -0.044377923011779785, -0.0419677272439003, -0.03955753147602081, -0.03714733570814133, -0.03473714366555214, -0.03232694789767265, -0.029916753992438316, -0.02750656008720398, -0.025096364319324493, -0.022686170414090157, -0.02027597837150097, -0.017865784466266632, -0.01545558962970972, -0.01304539479315281, -0.010635200887918472, -0.008225006982684135, -0.005814812146127224, -0.0034046173095703125, -0.0009944234043359756, 0.0014157709665596485, 0.0038259653374552727, 0.006236159708350897, 0.008646354079246521, 0.011056547984480858, 0.01346674282103777, 0.01587693765759468, 0.018287131562829018]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 8.0, 3.0, 8.0, 10.0, 17.0, 12.0, 15.0, 27.0, 21.0, 39.0, 32.0, 38.0, 36.0, 36.0, 35.0, 39.0, 50.0, 51.0, 39.0, 34.0, 57.0, 56.0, 38.0, 42.0, 37.0, 46.0, 28.0, 26.0, 23.0, 18.0, 20.0, 16.0, 7.0, 8.0, 5.0, 8.0, 3.0, 6.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.019405722618103027, -0.018849719315767288, -0.01829371601343155, -0.01773771271109581, -0.01718170940876007, -0.01662570610642433, -0.016069702804088593, -0.015513699501752853, -0.014957696199417114, -0.014401692897081375, -0.013845689594745636, -0.013289686292409897, -0.012733682990074158, -0.012177679687738419, -0.01162167638540268, -0.01106567308306694, -0.010509669780731201, -0.009953666478395462, -0.009397663176059723, -0.008841659873723984, -0.008285656571388245, -0.0077296532690525055, -0.007173649966716766, -0.006617646664381027, -0.006061643362045288, -0.005505640059709549, -0.00494963675737381, -0.004393633455038071, -0.0038376301527023315, -0.0032816268503665924, -0.0027256235480308533, -0.002169620245695114, -0.001613616943359375, -0.0010576136410236359, -0.0005016103386878967, 5.439296364784241e-05, 0.0006103962659835815, 0.0011663995683193207, 0.0017224028706550598, 0.002278406172990799, 0.002834409475326538, 0.0033904127776622772, 0.003946416079998016, 0.0045024193823337555, 0.005058422684669495, 0.005614425987005234, 0.006170429289340973, 0.006726432591676712, 0.007282435894012451, 0.00783843919634819, 0.00839444249868393, 0.008950445801019669, 0.009506449103355408, 0.010062452405691147, 0.010618455708026886, 0.011174459010362625, 0.011730462312698364, 0.012286465615034103, 0.012842468917369843, 0.013398472219705582, 0.01395447552204132, 0.01451047882437706, 0.015066482126712799, 0.015622485429048538, 0.016178488731384277]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 2.0, 2.0, 6.0, 9.0, 12.0, 11.0, 10.0, 20.0, 31.0, 43.0, 50.0, 87.0, 93.0, 147.0, 248.0, 315.0, 587.0, 1171.0, 2450.0, 6537.0, 21737.0, 87259.0, 435664.0, 384799.0, 76605.0, 19442.0, 6186.0, 2377.0, 1050.0, 526.0, 341.0, 211.0, 151.0, 104.0, 72.0, 52.0, 29.0, 30.0, 25.0, 9.0, 14.0, 13.0, 6.0, 5.0, 6.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.01430511474609375, -0.013857483863830566, -0.013409852981567383, -0.0129622220993042, -0.012514591217041016, -0.012066960334777832, -0.011619329452514648, -0.011171698570251465, -0.010724067687988281, -0.010276436805725098, -0.009828805923461914, -0.00938117504119873, -0.008933544158935547, -0.008485913276672363, -0.00803828239440918, -0.007590651512145996, -0.0071430206298828125, -0.006695389747619629, -0.006247758865356445, -0.005800127983093262, -0.005352497100830078, -0.0049048662185668945, -0.004457235336303711, -0.004009604454040527, -0.0035619735717773438, -0.00311434268951416, -0.0026667118072509766, -0.002219080924987793, -0.0017714500427246094, -0.0013238191604614258, -0.0008761882781982422, -0.0004285573959350586, 1.9073486328125e-05, 0.0004667043685913086, 0.0009143352508544922, 0.0013619661331176758, 0.0018095970153808594, 0.002257227897644043, 0.0027048587799072266, 0.00315248966217041, 0.0036001205444335938, 0.004047751426696777, 0.004495382308959961, 0.0049430131912231445, 0.005390644073486328, 0.005838274955749512, 0.006285905838012695, 0.006733536720275879, 0.0071811676025390625, 0.007628798484802246, 0.00807642936706543, 0.008524060249328613, 0.008971691131591797, 0.00941932201385498, 0.009866952896118164, 0.010314583778381348, 0.010762214660644531, 0.011209845542907715, 0.011657476425170898, 0.012105107307434082, 0.012552738189697266, 0.01300036907196045, 0.013447999954223633, 0.013895630836486816, 0.01434326171875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 20.0, 9.0, 24.0, 37.0, 55.0, 59.0, 87.0, 99.0, 103.0, 111.0, 87.0, 85.0, 60.0, 51.0, 50.0, 30.0, 25.0, 4.0, 1.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.008331298828125, -0.008071184158325195, -0.007811069488525391, -0.007550954818725586, -0.007290840148925781, -0.0070307254791259766, -0.006770610809326172, -0.006510496139526367, -0.0062503814697265625, -0.005990266799926758, -0.005730152130126953, -0.0054700374603271484, -0.005209922790527344, -0.004949808120727539, -0.004689693450927734, -0.00442957878112793, -0.004169464111328125, -0.00390934944152832, -0.0036492347717285156, -0.003389120101928711, -0.0031290054321289062, -0.0028688907623291016, -0.002608776092529297, -0.002348661422729492, -0.0020885467529296875, -0.0018284320831298828, -0.0015683174133300781, -0.0013082027435302734, -0.0010480880737304688, -0.0007879734039306641, -0.0005278587341308594, -0.0002677440643310547, -7.62939453125e-06, 0.0002524852752685547, 0.0005125999450683594, 0.0007727146148681641, 0.0010328292846679688, 0.0012929439544677734, 0.0015530586242675781, 0.0018131732940673828, 0.0020732879638671875, 0.002333402633666992, 0.002593517303466797, 0.0028536319732666016, 0.0031137466430664062, 0.003373861312866211, 0.0036339759826660156, 0.0038940906524658203, 0.004154205322265625, 0.00441431999206543, 0.004674434661865234, 0.004934549331665039, 0.005194664001464844, 0.0054547786712646484, 0.005714893341064453, 0.005975008010864258, 0.0062351226806640625, 0.006495237350463867, 0.006755352020263672, 0.0070154666900634766, 0.007275581359863281, 0.007535696029663086, 0.007795810699462891, 0.008055925369262695, 0.0083160400390625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 4.0, 7.0, 12.0, 18.0, 23.0, 26.0, 48.0, 44.0, 55.0, 123.0, 241.0, 508.0, 1075.0, 2872.0, 8999.0, 32516.0, 138224.0, 541844.0, 247789.0, 53010.0, 13966.0, 4274.0, 1497.0, 609.0, 296.0, 161.0, 107.0, 53.0, 49.0, 25.0, 23.0, 15.0, 12.0, 7.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01073455810546875, -0.010360240936279297, -0.009985923767089844, -0.00961160659790039, -0.009237289428710938, -0.008862972259521484, -0.008488655090332031, -0.008114337921142578, -0.007740020751953125, -0.007365703582763672, -0.006991386413574219, -0.006617069244384766, -0.0062427520751953125, -0.005868434906005859, -0.005494117736816406, -0.005119800567626953, -0.0047454833984375, -0.004371166229248047, -0.003996849060058594, -0.0036225318908691406, -0.0032482147216796875, -0.0028738975524902344, -0.0024995803833007812, -0.002125263214111328, -0.001750946044921875, -0.0013766288757324219, -0.0010023117065429688, -0.0006279945373535156, -0.0002536773681640625, 0.00012063980102539062, 0.0004949569702148438, 0.0008692741394042969, 0.00124359130859375, 0.0016179084777832031, 0.0019922256469726562, 0.0023665428161621094, 0.0027408599853515625, 0.0031151771545410156, 0.0034894943237304688, 0.003863811492919922, 0.004238128662109375, 0.004612445831298828, 0.004986763000488281, 0.005361080169677734, 0.0057353973388671875, 0.006109714508056641, 0.006484031677246094, 0.006858348846435547, 0.007232666015625, 0.007606983184814453, 0.007981300354003906, 0.00835561752319336, 0.008729934692382812, 0.009104251861572266, 0.009478569030761719, 0.009852886199951172, 0.010227203369140625, 0.010601520538330078, 0.010975837707519531, 0.011350154876708984, 0.011724472045898438, 0.01209878921508789, 0.012473106384277344, 0.012847423553466797, 0.01322174072265625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 4.0, 5.0, 16.0, 19.0, 15.0, 14.0, 17.0, 26.0, 27.0, 29.0, 30.0, 38.0, 35.0, 30.0, 40.0, 37.0, 42.0, 50.0, 32.0, 44.0, 36.0, 34.0, 36.0, 36.0, 32.0, 36.0, 38.0, 26.0, 21.0, 24.0, 20.0, 20.0, 14.0, 13.0, 15.0, 14.0, 8.0, 7.0, 5.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0092315673828125, -0.008970677852630615, -0.00870978832244873, -0.008448898792266846, -0.008188009262084961, -0.007927119731903076, -0.007666230201721191, -0.007405340671539307, -0.007144451141357422, -0.006883561611175537, -0.006622672080993652, -0.006361782550811768, -0.006100893020629883, -0.005840003490447998, -0.005579113960266113, -0.0053182244300842285, -0.005057334899902344, -0.004796445369720459, -0.004535555839538574, -0.0042746663093566895, -0.004013776779174805, -0.00375288724899292, -0.003491997718811035, -0.0032311081886291504, -0.0029702186584472656, -0.002709329128265381, -0.002448439598083496, -0.0021875500679016113, -0.0019266605377197266, -0.0016657710075378418, -0.001404881477355957, -0.0011439919471740723, -0.0008831024169921875, -0.0006222128868103027, -0.00036132335662841797, -0.0001004338264465332, 0.00016045570373535156, 0.00042134523391723633, 0.0006822347640991211, 0.0009431242942810059, 0.0012040138244628906, 0.0014649033546447754, 0.0017257928848266602, 0.001986682415008545, 0.0022475719451904297, 0.0025084614753723145, 0.0027693510055541992, 0.003030240535736084, 0.0032911300659179688, 0.0035520195960998535, 0.0038129091262817383, 0.004073798656463623, 0.004334688186645508, 0.004595577716827393, 0.004856467247009277, 0.005117356777191162, 0.005378246307373047, 0.005639135837554932, 0.005900025367736816, 0.006160914897918701, 0.006421804428100586, 0.006682693958282471, 0.0069435834884643555, 0.00720447301864624, 0.007465362548828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 13.0, 30.0, 30.0, 61.0, 97.0, 118.0, 210.0, 326.0, 554.0, 938.0, 1706.0, 3257.0, 6842.0, 15657.0, 41466.0, 129405.0, 374133.0, 314976.0, 99681.0, 33826.0, 13057.0, 5636.0, 2799.0, 1498.0, 849.0, 526.0, 320.0, 162.0, 130.0, 82.0, 52.0, 35.0, 20.0, 12.0, 5.0, 7.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.001972198486328125, -0.001912236213684082, -0.001852273941040039, -0.001792311668395996, -0.0017323493957519531, -0.0016723871231079102, -0.0016124248504638672, -0.0015524625778198242, -0.0014925003051757812, -0.0014325380325317383, -0.0013725757598876953, -0.0013126134872436523, -0.0012526512145996094, -0.0011926889419555664, -0.0011327266693115234, -0.0010727643966674805, -0.0010128021240234375, -0.0009528398513793945, -0.0008928775787353516, -0.0008329153060913086, -0.0007729530334472656, -0.0007129907608032227, -0.0006530284881591797, -0.0005930662155151367, -0.0005331039428710938, -0.0004731416702270508, -0.0004131793975830078, -0.00035321712493896484, -0.0002932548522949219, -0.0002332925796508789, -0.00017333030700683594, -0.00011336803436279297, -5.340576171875e-05, 6.556510925292969e-06, 6.651878356933594e-05, 0.0001264810562133789, 0.00018644332885742188, 0.00024640560150146484, 0.0003063678741455078, 0.0003663301467895508, 0.00042629241943359375, 0.0004862546920776367, 0.0005462169647216797, 0.0006061792373657227, 0.0006661415100097656, 0.0007261037826538086, 0.0007860660552978516, 0.0008460283279418945, 0.0009059906005859375, 0.0009659528732299805, 0.0010259151458740234, 0.0010858774185180664, 0.0011458396911621094, 0.0012058019638061523, 0.0012657642364501953, 0.0013257265090942383, 0.0013856887817382812, 0.0014456510543823242, 0.0015056133270263672, 0.0015655755996704102, 0.0016255378723144531, 0.001685500144958496, 0.001745462417602539, 0.001805424690246582, 0.001865386962890625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 0.0, 3.0, 5.0, 8.0, 0.0, 8.0, 13.0, 8.0, 18.0, 0.0, 42.0, 30.0, 36.0, 0.0, 43.0, 47.0, 53.0, 47.0, 0.0, 55.0, 55.0, 65.0, 0.0, 60.0, 60.0, 50.0, 47.0, 0.0, 39.0, 42.0, 26.0, 24.0, 0.0, 33.0, 17.0, 17.0, 0.0, 10.0, 15.0, 8.0, 9.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.430511474609375e-06, -1.383945345878601e-06, -1.3373792171478271e-06, -1.2908130884170532e-06, -1.2442469596862793e-06, -1.1976808309555054e-06, -1.1511147022247314e-06, -1.1045485734939575e-06, -1.0579824447631836e-06, -1.0114163160324097e-06, -9.648501873016357e-07, -9.182840585708618e-07, -8.717179298400879e-07, -8.25151801109314e-07, -7.7858567237854e-07, -7.320195436477661e-07, -6.854534149169922e-07, -6.388872861862183e-07, -5.923211574554443e-07, -5.457550287246704e-07, -4.991888999938965e-07, -4.5262277126312256e-07, -4.0605664253234863e-07, -3.594905138015747e-07, -3.129243850708008e-07, -2.6635825634002686e-07, -2.1979212760925293e-07, -1.73225998878479e-07, -1.2665987014770508e-07, -8.009374141693115e-08, -3.3527612686157227e-08, 1.30385160446167e-08, 5.960464477539063e-08, 1.0617077350616455e-07, 1.5273690223693848e-07, 1.993030309677124e-07, 2.4586915969848633e-07, 2.9243528842926025e-07, 3.390014171600342e-07, 3.855675458908081e-07, 4.3213367462158203e-07, 4.78699803352356e-07, 5.252659320831299e-07, 5.718320608139038e-07, 6.183981895446777e-07, 6.649643182754517e-07, 7.115304470062256e-07, 7.580965757369995e-07, 8.046627044677734e-07, 8.512288331985474e-07, 8.977949619293213e-07, 9.443610906600952e-07, 9.909272193908691e-07, 1.037493348121643e-06, 1.084059476852417e-06, 1.130625605583191e-06, 1.1771917343139648e-06, 1.2237578630447388e-06, 1.2703239917755127e-06, 1.3168901205062866e-06, 1.3634562492370605e-06, 1.4100223779678345e-06, 1.4565885066986084e-06, 1.5031546354293823e-06, 1.5497207641601562e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 16.0, 20.0, 30.0, 36.0, 63.0, 89.0, 164.0, 323.0, 643.0, 1678.0, 4722.0, 19466.0, 146281.0, 723624.0, 126856.0, 17227.0, 4390.0, 1466.0, 703.0, 324.0, 156.0, 98.0, 51.0, 42.0, 23.0, 14.0, 9.0, 8.0, 1.0, 7.0, 10.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00426483154296875, -0.0041201114654541016, -0.003975391387939453, -0.0038306713104248047, -0.0036859512329101562, -0.003541231155395508, -0.0033965110778808594, -0.003251791000366211, -0.0031070709228515625, -0.002962350845336914, -0.0028176307678222656, -0.002672910690307617, -0.0025281906127929688, -0.0023834705352783203, -0.002238750457763672, -0.0020940303802490234, -0.001949310302734375, -0.0018045902252197266, -0.0016598701477050781, -0.0015151500701904297, -0.0013704299926757812, -0.0012257099151611328, -0.0010809898376464844, -0.0009362697601318359, -0.0007915496826171875, -0.0006468296051025391, -0.0005021095275878906, -0.0003573894500732422, -0.00021266937255859375, -6.794929504394531e-05, 7.677078247070312e-05, 0.00022149085998535156, 0.0003662109375, 0.0005109310150146484, 0.0006556510925292969, 0.0008003711700439453, 0.0009450912475585938, 0.0010898113250732422, 0.0012345314025878906, 0.001379251480102539, 0.0015239715576171875, 0.001668691635131836, 0.0018134117126464844, 0.001958131790161133, 0.0021028518676757812, 0.0022475719451904297, 0.002392292022705078, 0.0025370121002197266, 0.002681732177734375, 0.0028264522552490234, 0.002971172332763672, 0.0031158924102783203, 0.0032606124877929688, 0.003405332565307617, 0.0035500526428222656, 0.003694772720336914, 0.0038394927978515625, 0.003984212875366211, 0.004128932952880859, 0.004273653030395508, 0.004418373107910156, 0.004563093185424805, 0.004707813262939453, 0.0048525333404541016, 0.00499725341796875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 4.0, 7.0, 9.0, 18.0, 36.0, 49.0, 75.0, 102.0, 152.0, 175.0, 111.0, 99.0, 52.0, 38.0, 22.0, 20.0, 8.0, 4.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00274658203125, -0.0026285648345947266, -0.002510547637939453, -0.0023925304412841797, -0.0022745132446289062, -0.002156496047973633, -0.0020384788513183594, -0.001920461654663086, -0.0018024444580078125, -0.001684427261352539, -0.0015664100646972656, -0.0014483928680419922, -0.0013303756713867188, -0.0012123584747314453, -0.0010943412780761719, -0.0009763240814208984, -0.000858306884765625, -0.0007402896881103516, -0.0006222724914550781, -0.0005042552947998047, -0.00038623809814453125, -0.0002682209014892578, -0.00015020370483398438, -3.218650817871094e-05, 8.58306884765625e-05, 0.00020384788513183594, 0.0003218650817871094, 0.0004398822784423828, 0.0005578994750976562, 0.0006759166717529297, 0.0007939338684082031, 0.0009119510650634766, 0.00102996826171875, 0.0011479854583740234, 0.0012660026550292969, 0.0013840198516845703, 0.0015020370483398438, 0.0016200542449951172, 0.0017380714416503906, 0.001856088638305664, 0.0019741058349609375, 0.002092123031616211, 0.0022101402282714844, 0.002328157424926758, 0.0024461746215820312, 0.0025641918182373047, 0.002682209014892578, 0.0028002262115478516, 0.002918243408203125, 0.0030362606048583984, 0.003154277801513672, 0.0032722949981689453, 0.0033903121948242188, 0.003508329391479492, 0.0036263465881347656, 0.003744363784790039, 0.0038623809814453125, 0.003980398178100586, 0.004098415374755859, 0.004216432571411133, 0.004334449768066406, 0.00445246696472168, 0.004570484161376953, 0.0046885013580322266, 0.0048065185546875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 14.0, 152.0, 684.0, 147.0, 9.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056860022246837616, -0.051484424620866776, -0.04610882326960564, -0.040733225643634796, -0.03535762429237366, -0.029982026666402817, -0.024606429040431976, -0.019230827689170837, -0.013855230063199997, -0.008479630574584007, -0.003104032017290592, 0.002271566540002823, 0.0076471660286188126, 0.013022765517234802, 0.018398363143205643, 0.02377396449446678, 0.029149562120437622, 0.03452515974640846, 0.0399007610976696, 0.04527635872364044, 0.05065196007490158, 0.05602755770087242, 0.06140315532684326, 0.0667787566781044, 0.07215435802936554, 0.07752995938062668, 0.08290555328130722, 0.08828115463256836, 0.0936567559838295, 0.09903235733509064, 0.10440795123577118, 0.10978355258703232, 0.11515913903713226, 0.1205347403883934, 0.12591034173965454, 0.13128593564033508, 0.13666152954101562, 0.14203713834285736, 0.1474127322435379, 0.15278834104537964, 0.15816393494606018, 0.16353952884674072, 0.16891513764858246, 0.174290731549263, 0.17966632544994354, 0.18504193425178528, 0.19041752815246582, 0.19579312205314636, 0.2011687159538269, 0.20654430985450745, 0.21191991865634918, 0.21729551255702972, 0.22267110645771027, 0.228046715259552, 0.23342230916023254, 0.23879790306091309, 0.24417351186275482, 0.24954910576343536, 0.2549247145652771, 0.26030030846595764, 0.2656759023666382, 0.2710514962673187, 0.27642709016799927, 0.2818027138710022, 0.28717830777168274]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 11.0, 12.0, 9.0, 14.0, 11.0, 24.0, 29.0, 26.0, 32.0, 40.0, 41.0, 37.0, 48.0, 60.0, 57.0, 35.0, 43.0, 46.0, 49.0, 38.0, 48.0, 45.0, 44.0, 29.0, 29.0, 30.0, 23.0, 29.0, 11.0, 12.0, 15.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.029826879501342773, -0.02901492267847061, -0.0282029639929533, -0.02739100530743599, -0.026579048484563828, -0.025767091661691666, -0.024955132976174355, -0.024143174290657043, -0.02333121746778488, -0.02251926064491272, -0.02170730195939541, -0.020895343273878098, -0.020083386451005936, -0.019271429628133774, -0.018459470942616463, -0.01764751225709915, -0.01683555543422699, -0.016023598611354828, -0.015211639925837517, -0.01439968217164278, -0.013587724417448044, -0.012775766663253307, -0.01196380890905857, -0.011151851154863834, -0.010339893400669098, -0.009527935646474361, -0.008715977892279625, -0.007904020138084888, -0.007092062383890152, -0.0062801046296954155, -0.005468146875500679, -0.0046561891213059425, -0.003844231367111206, -0.0030322736129164696, -0.002220315858721733, -0.0014083581045269966, -0.0005964003503322601, 0.00021555740386247635, 0.0010275151580572128, 0.0018394729122519493, 0.002651430666446686, 0.0034633884206414223, 0.004275346174836159, 0.005087303929030895, 0.005899261683225632, 0.006711219437420368, 0.007523177191615105, 0.008335134945809841, 0.009147092700004578, 0.009959050454199314, 0.01077100820839405, 0.011582965962588787, 0.012394923716783524, 0.01320688147097826, 0.014018839225172997, 0.014830796979367733, 0.01564275473356247, 0.01645471155643463, 0.017266670241951942, 0.018078628927469254, 0.018890585750341415, 0.019702542573213577, 0.02051450125873089, 0.0213264599442482, 0.02213841676712036]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 3.0, 2.0, 6.0, 11.0, 9.0, 10.0, 7.0, 21.0, 33.0, 51.0, 50.0, 84.0, 133.0, 258.0, 440.0, 932.0, 2285.0, 8471.0, 42048.0, 2933729.0, 1164026.0, 30898.0, 6903.0, 2213.0, 779.0, 348.0, 184.0, 110.0, 82.0, 40.0, 25.0, 21.0, 16.0, 16.0, 6.0, 10.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.01447296142578125, -0.01408088207244873, -0.013688802719116211, -0.013296723365783691, -0.012904644012451172, -0.012512564659118652, -0.012120485305786133, -0.011728405952453613, -0.011336326599121094, -0.010944247245788574, -0.010552167892456055, -0.010160088539123535, -0.009768009185791016, -0.009375929832458496, -0.008983850479125977, -0.008591771125793457, -0.008199691772460938, -0.007807612419128418, -0.0074155330657958984, -0.007023453712463379, -0.006631374359130859, -0.00623929500579834, -0.00584721565246582, -0.005455136299133301, -0.005063056945800781, -0.004670977592468262, -0.004278898239135742, -0.0038868188858032227, -0.003494739532470703, -0.0031026601791381836, -0.002710580825805664, -0.0023185014724731445, -0.001926422119140625, -0.0015343427658081055, -0.001142263412475586, -0.0007501840591430664, -0.0003581047058105469, 3.3974647521972656e-05, 0.0004260540008544922, 0.0008181333541870117, 0.0012102127075195312, 0.0016022920608520508, 0.0019943714141845703, 0.00238645076751709, 0.0027785301208496094, 0.003170609474182129, 0.0035626888275146484, 0.003954768180847168, 0.0043468475341796875, 0.004738926887512207, 0.0051310062408447266, 0.005523085594177246, 0.005915164947509766, 0.006307244300842285, 0.006699323654174805, 0.007091403007507324, 0.007483482360839844, 0.007875561714172363, 0.008267641067504883, 0.008659720420837402, 0.009051799774169922, 0.009443879127502441, 0.009835958480834961, 0.01022803783416748, 0.0106201171875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 12.0, 13.0, 25.0, 32.0, 44.0, 79.0, 88.0, 118.0, 114.0, 101.0, 97.0, 82.0, 65.0, 39.0, 39.0, 25.0, 12.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00913238525390625, -0.008862137794494629, -0.008591890335083008, -0.008321642875671387, -0.008051395416259766, -0.0077811479568481445, -0.0075109004974365234, -0.007240653038024902, -0.006970405578613281, -0.00670015811920166, -0.006429910659790039, -0.006159663200378418, -0.005889415740966797, -0.005619168281555176, -0.005348920822143555, -0.005078673362731934, -0.0048084259033203125, -0.004538178443908691, -0.00426793098449707, -0.003997683525085449, -0.003727436065673828, -0.003457188606262207, -0.003186941146850586, -0.002916693687438965, -0.0026464462280273438, -0.0023761987686157227, -0.0021059513092041016, -0.0018357038497924805, -0.0015654563903808594, -0.0012952089309692383, -0.0010249614715576172, -0.0007547140121459961, -0.000484466552734375, -0.0002142190933227539, 5.602836608886719e-05, 0.0003262758255004883, 0.0005965232849121094, 0.0008667707443237305, 0.0011370182037353516, 0.0014072656631469727, 0.0016775131225585938, 0.0019477605819702148, 0.002218008041381836, 0.002488255500793457, 0.002758502960205078, 0.0030287504196166992, 0.0032989978790283203, 0.0035692453384399414, 0.0038394927978515625, 0.004109740257263184, 0.004379987716674805, 0.004650235176086426, 0.004920482635498047, 0.005190730094909668, 0.005460977554321289, 0.00573122501373291, 0.006001472473144531, 0.006271719932556152, 0.0065419673919677734, 0.0068122148513793945, 0.007082462310791016, 0.007352709770202637, 0.007622957229614258, 0.007893204689025879, 0.0081634521484375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 18.0, 15.0, 17.0, 28.0, 40.0, 43.0, 44.0, 67.0, 118.0, 190.0, 430.0, 886.0, 2046.0, 5483.0, 16796.0, 75750.0, 2197930.0, 1798171.0, 71249.0, 16017.0, 5109.0, 2001.0, 864.0, 391.0, 201.0, 117.0, 66.0, 48.0, 42.0, 27.0, 16.0, 18.0, 8.0, 12.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007320404052734375, -0.0070587992668151855, -0.006797194480895996, -0.006535589694976807, -0.006273984909057617, -0.006012380123138428, -0.005750775337219238, -0.005489170551300049, -0.005227565765380859, -0.00496596097946167, -0.0047043561935424805, -0.004442751407623291, -0.0041811466217041016, -0.003919541835784912, -0.0036579370498657227, -0.003396332263946533, -0.0031347274780273438, -0.0028731226921081543, -0.002611517906188965, -0.0023499131202697754, -0.002088308334350586, -0.0018267035484313965, -0.001565098762512207, -0.0013034939765930176, -0.0010418891906738281, -0.0007802844047546387, -0.0005186796188354492, -0.00025707483291625977, 4.5299530029296875e-06, 0.00026613473892211914, 0.0005277395248413086, 0.000789344310760498, 0.0010509490966796875, 0.001312553882598877, 0.0015741586685180664, 0.0018357634544372559, 0.0020973682403564453, 0.0023589730262756348, 0.0026205778121948242, 0.0028821825981140137, 0.003143787384033203, 0.0034053921699523926, 0.003666996955871582, 0.0039286017417907715, 0.004190206527709961, 0.00445181131362915, 0.00471341609954834, 0.004975020885467529, 0.005236625671386719, 0.005498230457305908, 0.005759835243225098, 0.006021440029144287, 0.0062830448150634766, 0.006544649600982666, 0.0068062543869018555, 0.007067859172821045, 0.007329463958740234, 0.007591068744659424, 0.007852673530578613, 0.008114278316497803, 0.008375883102416992, 0.008637487888336182, 0.008899092674255371, 0.00916069746017456, 0.00942230224609375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 12.0, 8.0, 23.0, 22.0, 48.0, 60.0, 107.0, 317.0, 1017.0, 1497.0, 561.0, 185.0, 83.0, 35.0, 23.0, 24.0, 13.0, 10.0, 5.0, 5.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00949859619140625, -0.009283840656280518, -0.009069085121154785, -0.008854329586029053, -0.00863957405090332, -0.008424818515777588, -0.008210062980651855, -0.007995307445526123, -0.007780551910400391, -0.007565796375274658, -0.007351040840148926, -0.007136285305023193, -0.006921529769897461, -0.0067067742347717285, -0.006492018699645996, -0.006277263164520264, -0.006062507629394531, -0.005847752094268799, -0.005632996559143066, -0.005418241024017334, -0.0052034854888916016, -0.004988729953765869, -0.004773974418640137, -0.004559218883514404, -0.004344463348388672, -0.0041297078132629395, -0.003914952278137207, -0.0037001967430114746, -0.003485441207885742, -0.0032706856727600098, -0.0030559301376342773, -0.002841174602508545, -0.0026264190673828125, -0.00241166353225708, -0.0021969079971313477, -0.0019821524620056152, -0.0017673969268798828, -0.0015526413917541504, -0.001337885856628418, -0.0011231303215026855, -0.0009083747863769531, -0.0006936192512512207, -0.0004788637161254883, -0.00026410818099975586, -4.935264587402344e-05, 0.00016540288925170898, 0.0003801584243774414, 0.0005949139595031738, 0.0008096694946289062, 0.0010244250297546387, 0.001239180564880371, 0.0014539361000061035, 0.001668691635131836, 0.0018834471702575684, 0.0020982027053833008, 0.002312958240509033, 0.0025277137756347656, 0.002742469310760498, 0.0029572248458862305, 0.003171980381011963, 0.0033867359161376953, 0.0036014914512634277, 0.00381624698638916, 0.004031002521514893, 0.004245758056640625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 10.0, 9.0, 21.0, 36.0, 103.0, 217.0, 272.0, 188.0, 89.0, 41.0, 11.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.056673627346754074, -0.05557158589363098, -0.05446954071521759, -0.0533674992620945, -0.05226545408368111, -0.051163412630558014, -0.05006136745214462, -0.04895932599902153, -0.04785728082060814, -0.046755239367485046, -0.045653194189071655, -0.04455115273594856, -0.04344910755753517, -0.04234706610441208, -0.04124502092599869, -0.040142979472875595, -0.0390409380197525, -0.03793889656662941, -0.03683685138821602, -0.035734809935092926, -0.034632764756679535, -0.03353072330355644, -0.03242867812514305, -0.03132663667201996, -0.030224591493606567, -0.029122548177838326, -0.028020504862070084, -0.026918461546301842, -0.0258164182305336, -0.024714374914765358, -0.023612331598997116, -0.022510290145874023, -0.021408241242170334, -0.020306197926402092, -0.01920415461063385, -0.018102111294865608, -0.017000067979097366, -0.015898024663329124, -0.014795982278883457, -0.013693938963115215, -0.012591896578669548, -0.011489853262901306, -0.010387809947133064, -0.009285766631364822, -0.00818372331559658, -0.007081680465489626, -0.005979637615382671, -0.0048775942996144295, -0.0037755509838461876, -0.0026735076680779457, -0.0015714645851403475, -0.00046942150220274925, 0.0006326218135654926, 0.0017346651293337345, 0.002836707979440689, 0.003938751295208931, 0.005040794610977173, 0.006142837926745415, 0.007244881242513657, 0.008346924558281898, 0.00944896787405014, 0.010551011189818382, 0.01165305357426405, 0.012755096890032291, 0.013857140205800533]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 6.0, 7.0, 8.0, 7.0, 11.0, 11.0, 15.0, 22.0, 21.0, 25.0, 24.0, 29.0, 33.0, 40.0, 35.0, 38.0, 39.0, 56.0, 39.0, 52.0, 60.0, 41.0, 37.0, 28.0, 36.0, 33.0, 34.0, 28.0, 37.0, 21.0, 19.0, 20.0, 20.0, 21.0, 14.0, 10.0, 7.0, 2.0, 5.0, 6.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.010714828968048096, -0.010388280265033245, -0.010061731562018394, -0.009735182859003544, -0.009408634155988693, -0.009082085452973843, -0.008755536749958992, -0.008428988046944141, -0.00810243934392929, -0.00777589064091444, -0.0074493419378995895, -0.007122793234884739, -0.006796244531869888, -0.006469695828855038, -0.006143147125840187, -0.0058165984228253365, -0.005490049719810486, -0.005163501016795635, -0.004836952313780785, -0.004510403610765934, -0.004183854907751083, -0.0038573062047362328, -0.003530757501721382, -0.0032042087987065315, -0.002877660095691681, -0.0025511113926768303, -0.0022245626896619797, -0.001898013986647129, -0.0015714652836322784, -0.0012449165806174278, -0.0009183678776025772, -0.0005918191745877266, -0.000265270471572876, 6.127823144197464e-05, 0.00038782693445682526, 0.0007143756374716759, 0.0010409243404865265, 0.001367473043501377, 0.0016940217465162277, 0.0020205704495310783, 0.002347119152545929, 0.0026736678555607796, 0.00300021655857563, 0.003326765261590481, 0.0036533139646053314, 0.003979862667620182, 0.004306411370635033, 0.004632960073649883, 0.004959508776664734, 0.0052860574796795845, 0.005612606182694435, 0.005939154885709286, 0.006265703588724136, 0.006592252291738987, 0.006918800994753838, 0.007245349697768688, 0.007571898400783539, 0.00789844710379839, 0.00822499580681324, 0.00855154450982809, 0.008878093212842941, 0.009204641915857792, 0.009531190618872643, 0.009857739321887493, 0.010184288024902344]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 5.0, 9.0, 11.0, 10.0, 23.0, 22.0, 45.0, 80.0, 89.0, 153.0, 290.0, 627.0, 1542.0, 5149.0, 24138.0, 186253.0, 709407.0, 99652.0, 15218.0, 3516.0, 1138.0, 507.0, 247.0, 149.0, 91.0, 55.0, 44.0, 27.0, 17.0, 13.0, 5.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.019775390625, -0.019164323806762695, -0.01855325698852539, -0.017942190170288086, -0.01733112335205078, -0.016720056533813477, -0.016108989715576172, -0.015497922897338867, -0.014886856079101562, -0.014275789260864258, -0.013664722442626953, -0.013053655624389648, -0.012442588806152344, -0.011831521987915039, -0.011220455169677734, -0.01060938835144043, -0.009998321533203125, -0.00938725471496582, -0.008776187896728516, -0.008165121078491211, -0.007554054260253906, -0.0069429874420166016, -0.006331920623779297, -0.005720853805541992, -0.0051097869873046875, -0.004498720169067383, -0.003887653350830078, -0.0032765865325927734, -0.0026655197143554688, -0.002054452896118164, -0.0014433860778808594, -0.0008323192596435547, -0.00022125244140625, 0.0003898143768310547, 0.0010008811950683594, 0.001611948013305664, 0.0022230148315429688, 0.0028340816497802734, 0.003445148468017578, 0.004056215286254883, 0.0046672821044921875, 0.005278348922729492, 0.005889415740966797, 0.0065004825592041016, 0.007111549377441406, 0.007722616195678711, 0.008333683013916016, 0.00894474983215332, 0.009555816650390625, 0.01016688346862793, 0.010777950286865234, 0.011389017105102539, 0.012000083923339844, 0.012611150741577148, 0.013222217559814453, 0.013833284378051758, 0.014444351196289062, 0.015055418014526367, 0.015666484832763672, 0.016277551651000977, 0.01688861846923828, 0.017499685287475586, 0.01811075210571289, 0.018721818923950195, 0.0193328857421875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 7.0, 22.0, 27.0, 35.0, 46.0, 73.0, 106.0, 80.0, 104.0, 100.0, 82.0, 82.0, 62.0, 54.0, 38.0, 30.0, 23.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.006946563720703125, -0.006705820560455322, -0.0064650774002075195, -0.006224334239959717, -0.005983591079711914, -0.005742847919464111, -0.005502104759216309, -0.005261361598968506, -0.005020618438720703, -0.0047798752784729, -0.004539132118225098, -0.004298388957977295, -0.004057645797729492, -0.0038169026374816895, -0.0035761594772338867, -0.003335416316986084, -0.0030946731567382812, -0.0028539299964904785, -0.0026131868362426758, -0.002372443675994873, -0.0021317005157470703, -0.0018909573554992676, -0.0016502141952514648, -0.0014094710350036621, -0.0011687278747558594, -0.0009279847145080566, -0.0006872415542602539, -0.00044649839401245117, -0.00020575523376464844, 3.49879264831543e-05, 0.00027573108673095703, 0.0005164742469787598, 0.0007572174072265625, 0.0009979605674743652, 0.001238703727722168, 0.0014794468879699707, 0.0017201900482177734, 0.001960933208465576, 0.002201676368713379, 0.0024424195289611816, 0.0026831626892089844, 0.002923905849456787, 0.00316464900970459, 0.0034053921699523926, 0.0036461353302001953, 0.003886878490447998, 0.004127621650695801, 0.0043683648109436035, 0.004609107971191406, 0.004849851131439209, 0.005090594291687012, 0.0053313374519348145, 0.005572080612182617, 0.00581282377243042, 0.006053566932678223, 0.006294310092926025, 0.006535053253173828, 0.006775796413421631, 0.007016539573669434, 0.007257282733917236, 0.007498025894165039, 0.007738769054412842, 0.007979512214660645, 0.008220255374908447, 0.00846099853515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 4.0, 7.0, 12.0, 15.0, 10.0, 30.0, 39.0, 79.0, 118.0, 235.0, 570.0, 1761.0, 6028.0, 26678.0, 165005.0, 665225.0, 149662.0, 24700.0, 5650.0, 1590.0, 557.0, 230.0, 126.0, 68.0, 54.0, 22.0, 22.0, 8.0, 13.0, 6.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0165863037109375, -0.016118764877319336, -0.015651226043701172, -0.015183687210083008, -0.014716148376464844, -0.01424860954284668, -0.013781070709228516, -0.013313531875610352, -0.012845993041992188, -0.012378454208374023, -0.01191091537475586, -0.011443376541137695, -0.010975837707519531, -0.010508298873901367, -0.010040760040283203, -0.009573221206665039, -0.009105682373046875, -0.008638143539428711, -0.008170604705810547, -0.007703065872192383, -0.007235527038574219, -0.006767988204956055, -0.006300449371337891, -0.0058329105377197266, -0.0053653717041015625, -0.0048978328704833984, -0.004430294036865234, -0.00396275520324707, -0.0034952163696289062, -0.003027677536010742, -0.002560138702392578, -0.002092599868774414, -0.00162506103515625, -0.001157522201538086, -0.0006899833679199219, -0.0002224445343017578, 0.00024509429931640625, 0.0007126331329345703, 0.0011801719665527344, 0.0016477108001708984, 0.0021152496337890625, 0.0025827884674072266, 0.0030503273010253906, 0.0035178661346435547, 0.003985404968261719, 0.004452943801879883, 0.004920482635498047, 0.005388021469116211, 0.005855560302734375, 0.006323099136352539, 0.006790637969970703, 0.007258176803588867, 0.007725715637207031, 0.008193254470825195, 0.00866079330444336, 0.009128332138061523, 0.009595870971679688, 0.010063409805297852, 0.010530948638916016, 0.01099848747253418, 0.011466026306152344, 0.011933565139770508, 0.012401103973388672, 0.012868642807006836, 0.013336181640625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 6.0, 7.0, 10.0, 9.0, 11.0, 18.0, 17.0, 19.0, 25.0, 26.0, 29.0, 34.0, 29.0, 41.0, 33.0, 46.0, 40.0, 37.0, 46.0, 36.0, 35.0, 35.0, 39.0, 37.0, 39.0, 34.0, 34.0, 25.0, 23.0, 38.0, 17.0, 27.0, 13.0, 14.0, 19.0, 9.0, 11.0, 7.0, 5.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0], "bins": [-0.00788116455078125, -0.00762486457824707, -0.007368564605712891, -0.007112264633178711, -0.006855964660644531, -0.0065996646881103516, -0.006343364715576172, -0.006087064743041992, -0.0058307647705078125, -0.005574464797973633, -0.005318164825439453, -0.0050618648529052734, -0.004805564880371094, -0.004549264907836914, -0.004292964935302734, -0.004036664962768555, -0.003780364990234375, -0.0035240650177001953, -0.0032677650451660156, -0.003011465072631836, -0.0027551651000976562, -0.0024988651275634766, -0.002242565155029297, -0.001986265182495117, -0.0017299652099609375, -0.0014736652374267578, -0.0012173652648925781, -0.0009610652923583984, -0.0007047653198242188, -0.00044846534729003906, -0.00019216537475585938, 6.413459777832031e-05, 0.0003204345703125, 0.0005767345428466797, 0.0008330345153808594, 0.001089334487915039, 0.0013456344604492188, 0.0016019344329833984, 0.0018582344055175781, 0.002114534378051758, 0.0023708343505859375, 0.002627134323120117, 0.002883434295654297, 0.0031397342681884766, 0.0033960342407226562, 0.003652334213256836, 0.003908634185791016, 0.004164934158325195, 0.004421234130859375, 0.004677534103393555, 0.004933834075927734, 0.005190134048461914, 0.005446434020996094, 0.0057027339935302734, 0.005959033966064453, 0.006215333938598633, 0.0064716339111328125, 0.006727933883666992, 0.006984233856201172, 0.0072405338287353516, 0.007496833801269531, 0.007753133773803711, 0.00800943374633789, 0.00826573371887207, 0.00852203369140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 6.0, 7.0, 6.0, 16.0, 35.0, 46.0, 87.0, 141.0, 249.0, 537.0, 1035.0, 2371.0, 5500.0, 14323.0, 43481.0, 166073.0, 526021.0, 208970.0, 51525.0, 16656.0, 6400.0, 2609.0, 1223.0, 560.0, 289.0, 152.0, 97.0, 51.0, 31.0, 20.0, 9.0, 9.0, 4.0, 4.0, 0.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0023059844970703125, -0.0022392868995666504, -0.0021725893020629883, -0.002105891704559326, -0.002039194107055664, -0.001972496509552002, -0.0019057989120483398, -0.0018391013145446777, -0.0017724037170410156, -0.0017057061195373535, -0.0016390085220336914, -0.0015723109245300293, -0.0015056133270263672, -0.001438915729522705, -0.001372218132019043, -0.0013055205345153809, -0.0012388229370117188, -0.0011721253395080566, -0.0011054277420043945, -0.0010387301445007324, -0.0009720325469970703, -0.0009053349494934082, -0.0008386373519897461, -0.000771939754486084, -0.0007052421569824219, -0.0006385445594787598, -0.0005718469619750977, -0.0005051493644714355, -0.00043845176696777344, -0.00037175416946411133, -0.0003050565719604492, -0.0002383589744567871, -0.000171661376953125, -0.00010496377944946289, -3.826618194580078e-05, 2.8431415557861328e-05, 9.512901306152344e-05, 0.00016182661056518555, 0.00022852420806884766, 0.00029522180557250977, 0.0003619194030761719, 0.000428617000579834, 0.0004953145980834961, 0.0005620121955871582, 0.0006287097930908203, 0.0006954073905944824, 0.0007621049880981445, 0.0008288025856018066, 0.0008955001831054688, 0.0009621977806091309, 0.001028895378112793, 0.001095592975616455, 0.0011622905731201172, 0.0012289881706237793, 0.0012956857681274414, 0.0013623833656311035, 0.0014290809631347656, 0.0014957785606384277, 0.0015624761581420898, 0.001629173755645752, 0.001695871353149414, 0.0017625689506530762, 0.0018292665481567383, 0.0018959641456604004, 0.0019626617431640625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 0.0, 4.0, 10.0, 7.0, 0.0, 10.0, 23.0, 15.0, 0.0, 25.0, 29.0, 33.0, 0.0, 41.0, 56.0, 46.0, 0.0, 56.0, 59.0, 60.0, 0.0, 54.0, 68.0, 55.0, 0.0, 53.0, 56.0, 40.0, 0.0, 30.0, 33.0, 37.0, 0.0, 23.0, 20.0, 15.0, 0.0, 15.0, 8.0, 4.0, 0.0, 4.0, 1.0, 6.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-1.6093254089355469e-06, -1.564621925354004e-06, -1.519918441772461e-06, -1.475214958190918e-06, -1.430511474609375e-06, -1.385807991027832e-06, -1.341104507446289e-06, -1.296401023864746e-06, -1.2516975402832031e-06, -1.2069940567016602e-06, -1.1622905731201172e-06, -1.1175870895385742e-06, -1.0728836059570312e-06, -1.0281801223754883e-06, -9.834766387939453e-07, -9.387731552124023e-07, -8.940696716308594e-07, -8.493661880493164e-07, -8.046627044677734e-07, -7.599592208862305e-07, -7.152557373046875e-07, -6.705522537231445e-07, -6.258487701416016e-07, -5.811452865600586e-07, -5.364418029785156e-07, -4.917383193969727e-07, -4.470348358154297e-07, -4.023313522338867e-07, -3.5762786865234375e-07, -3.129243850708008e-07, -2.682209014892578e-07, -2.2351741790771484e-07, -1.7881393432617188e-07, -1.341104507446289e-07, -8.940696716308594e-08, -4.470348358154297e-08, 0.0, 4.470348358154297e-08, 8.940696716308594e-08, 1.341104507446289e-07, 1.7881393432617188e-07, 2.2351741790771484e-07, 2.682209014892578e-07, 3.129243850708008e-07, 3.5762786865234375e-07, 4.023313522338867e-07, 4.470348358154297e-07, 4.917383193969727e-07, 5.364418029785156e-07, 5.811452865600586e-07, 6.258487701416016e-07, 6.705522537231445e-07, 7.152557373046875e-07, 7.599592208862305e-07, 8.046627044677734e-07, 8.493661880493164e-07, 8.940696716308594e-07, 9.387731552124023e-07, 9.834766387939453e-07, 1.0281801223754883e-06, 1.0728836059570312e-06, 1.1175870895385742e-06, 1.1622905731201172e-06, 1.2069940567016602e-06, 1.2516975402832031e-06]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 3.0, 5.0, 11.0, 16.0, 26.0, 31.0, 50.0, 77.0, 179.0, 263.0, 423.0, 759.0, 1455.0, 3082.0, 7024.0, 19125.0, 66556.0, 296964.0, 484386.0, 118411.0, 30728.0, 10441.0, 4321.0, 1928.0, 977.0, 529.0, 293.0, 177.0, 112.0, 57.0, 47.0, 32.0, 20.0, 14.0, 13.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025768280029296875, -0.0025014877319335938, -0.0024261474609375, -0.0023508071899414062, -0.0022754669189453125, -0.0022001266479492188, -0.002124786376953125, -0.0020494461059570312, -0.0019741058349609375, -0.0018987655639648438, -0.00182342529296875, -0.0017480850219726562, -0.0016727447509765625, -0.0015974044799804688, -0.001522064208984375, -0.0014467239379882812, -0.0013713836669921875, -0.0012960433959960938, -0.001220703125, -0.0011453628540039062, -0.0010700225830078125, -0.0009946823120117188, -0.000919342041015625, -0.0008440017700195312, -0.0007686614990234375, -0.0006933212280273438, -0.00061798095703125, -0.0005426406860351562, -0.0004673004150390625, -0.00039196014404296875, -0.000316619873046875, -0.00024127960205078125, -0.0001659393310546875, -9.059906005859375e-05, -1.52587890625e-05, 6.008148193359375e-05, 0.0001354217529296875, 0.00021076202392578125, 0.000286102294921875, 0.00036144256591796875, 0.0004367828369140625, 0.0005121231079101562, 0.00058746337890625, 0.0006628036499023438, 0.0007381439208984375, 0.0008134841918945312, 0.000888824462890625, 0.0009641647338867188, 0.0010395050048828125, 0.0011148452758789062, 0.001190185546875, 0.0012655258178710938, 0.0013408660888671875, 0.0014162063598632812, 0.001491546630859375, 0.0015668869018554688, 0.0016422271728515625, 0.0017175674438476562, 0.00179290771484375, 0.0018682479858398438, 0.0019435882568359375, 0.0020189285278320312, 0.002094268798828125, 0.0021696090698242188, 0.0022449493408203125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 8.0, 10.0, 9.0, 12.0, 17.0, 22.0, 25.0, 37.0, 44.0, 55.0, 76.0, 82.0, 97.0, 93.0, 81.0, 66.0, 47.0, 61.0, 39.0, 25.0, 21.0, 10.0, 10.0, 11.0, 8.0, 4.0, 8.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018329620361328125, -0.00176924467086792, -0.0017055273056030273, -0.0016418099403381348, -0.0015780925750732422, -0.0015143752098083496, -0.001450657844543457, -0.0013869404792785645, -0.0013232231140136719, -0.0012595057487487793, -0.0011957883834838867, -0.0011320710182189941, -0.0010683536529541016, -0.001004636287689209, -0.0009409189224243164, -0.0008772015571594238, -0.0008134841918945312, -0.0007497668266296387, -0.0006860494613647461, -0.0006223320960998535, -0.0005586147308349609, -0.0004948973655700684, -0.0004311800003051758, -0.0003674626350402832, -0.0003037452697753906, -0.00024002790451049805, -0.00017631053924560547, -0.00011259317398071289, -4.887580871582031e-05, 1.4841556549072266e-05, 7.855892181396484e-05, 0.00014227628707885742, 0.00020599365234375, 0.0002697110176086426, 0.00033342838287353516, 0.00039714574813842773, 0.0004608631134033203, 0.0005245804786682129, 0.0005882978439331055, 0.000652015209197998, 0.0007157325744628906, 0.0007794499397277832, 0.0008431673049926758, 0.0009068846702575684, 0.0009706020355224609, 0.0010343194007873535, 0.001098036766052246, 0.0011617541313171387, 0.0012254714965820312, 0.0012891888618469238, 0.0013529062271118164, 0.001416623592376709, 0.0014803409576416016, 0.0015440583229064941, 0.0016077756881713867, 0.0016714930534362793, 0.0017352104187011719, 0.0017989277839660645, 0.001862645149230957, 0.0019263625144958496, 0.001990079879760742, 0.0020537972450256348, 0.0021175146102905273, 0.00218123197555542, 0.0022449493408203125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 9.0, 4.0, 11.0, 23.0, 14.0, 29.0, 36.0, 77.0, 103.0, 134.0, 154.0, 131.0, 107.0, 72.0, 35.0, 22.0, 19.0, 12.0, 10.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043820466846227646, -0.04282276704907417, -0.0418250635266304, -0.04082736372947693, -0.03982966020703316, -0.038831960409879684, -0.03783425688743591, -0.03683655709028244, -0.03583885729312897, -0.034841157495975494, -0.03384345397353172, -0.03284575417637825, -0.03184805065393448, -0.030850350856781006, -0.029852649196982384, -0.02885494753718376, -0.02785724587738514, -0.026859544217586517, -0.025861842557787895, -0.024864140897989273, -0.0238664411008358, -0.022868739441037178, -0.021871037781238556, -0.020873336121439934, -0.01987563446164131, -0.01887793280184269, -0.017880231142044067, -0.016882531344890594, -0.015884829685091972, -0.01488712802529335, -0.013889426365494728, -0.012891724705696106, -0.011894023045897484, -0.010896321386098862, -0.009898620657622814, -0.008900918997824192, -0.007903218269348145, -0.006905516609549522, -0.0059078149497509, -0.0049101137556135654, -0.003912412561476231, -0.002914711367338896, -0.0019170099403709173, -0.0009193085134029388, 7.839268073439598e-05, 0.0010760938748717308, 0.002073795534670353, 0.0030714967288076878, 0.004069197922945023, 0.005066899117082357, 0.006064600311219692, 0.007062301971018314, 0.008060002699494362, 0.009057704359292984, 0.010055406019091606, 0.011053107678890228, 0.012050808407366276, 0.013048510067164898, 0.014046210795640945, 0.015043912455439568, 0.01604161411523819, 0.017039313912391663, 0.018037017434835434, 0.019034717231988907, 0.02003241889178753]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 7.0, 12.0, 11.0, 13.0, 8.0, 10.0, 16.0, 14.0, 24.0, 19.0, 32.0, 27.0, 32.0, 30.0, 47.0, 31.0, 47.0, 28.0, 50.0, 36.0, 55.0, 50.0, 28.0, 37.0, 38.0, 39.0, 29.0, 28.0, 26.0, 23.0, 15.0, 20.0, 14.0, 24.0, 17.0, 16.0, 9.0, 14.0, 8.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.021915435791015625, -0.02120683714747429, -0.020498238503932953, -0.019789639860391617, -0.01908104121685028, -0.018372442573308945, -0.01766384392976761, -0.016955245286226273, -0.016246646642684937, -0.0155380479991436, -0.014829449355602264, -0.014120850712060928, -0.013412252068519592, -0.012703653424978256, -0.01199505478143692, -0.011286456137895584, -0.010577857494354248, -0.009869258850812912, -0.009160660207271576, -0.00845206156373024, -0.007743462920188904, -0.007034864276647568, -0.006326265633106232, -0.005617666989564896, -0.00490906834602356, -0.0042004697024822235, -0.0034918710589408875, -0.0027832724153995514, -0.0020746737718582153, -0.0013660751283168793, -0.0006574764847755432, 5.112215876579285e-05, 0.0007597208023071289, 0.001468319445848465, 0.002176918089389801, 0.002885516732931137, 0.003594115376472473, 0.004302714020013809, 0.005011312663555145, 0.005719911307096481, 0.006428509950637817, 0.0071371085941791534, 0.00784570723772049, 0.008554305881261826, 0.009262904524803162, 0.009971503168344498, 0.010680101811885834, 0.01138870045542717, 0.012097299098968506, 0.012805897742509842, 0.013514496386051178, 0.014223095029592514, 0.01493169367313385, 0.015640292316675186, 0.016348890960216522, 0.01705748960375786, 0.017766088247299194, 0.01847468689084053, 0.019183285534381866, 0.019891884177923203, 0.02060048282146454, 0.021309081465005875, 0.02201768010854721, 0.022726278752088547, 0.023434877395629883]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 6.0, 5.0, 5.0, 4.0, 7.0, 9.0, 8.0, 17.0, 14.0, 23.0, 39.0, 52.0, 89.0, 108.0, 192.0, 323.0, 688.0, 1355.0, 3150.0, 9720.0, 43680.0, 1983354.0, 2091783.0, 44292.0, 9522.0, 3155.0, 1278.0, 578.0, 294.0, 161.0, 103.0, 67.0, 52.0, 45.0, 21.0, 11.0, 11.0, 10.0, 13.0, 6.0, 5.0, 8.0, 3.0, 6.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.011566162109375, -0.011215686798095703, -0.010865211486816406, -0.01051473617553711, -0.010164260864257812, -0.009813785552978516, -0.009463310241699219, -0.009112834930419922, -0.008762359619140625, -0.008411884307861328, -0.008061408996582031, -0.007710933685302734, -0.0073604583740234375, -0.007009983062744141, -0.006659507751464844, -0.006309032440185547, -0.00595855712890625, -0.005608081817626953, -0.005257606506347656, -0.004907131195068359, -0.0045566558837890625, -0.004206180572509766, -0.0038557052612304688, -0.003505229949951172, -0.003154754638671875, -0.002804279327392578, -0.0024538040161132812, -0.0021033287048339844, -0.0017528533935546875, -0.0014023780822753906, -0.0010519027709960938, -0.0007014274597167969, -0.0003509521484375, -4.76837158203125e-07, 0.00034999847412109375, 0.0007004737854003906, 0.0010509490966796875, 0.0014014244079589844, 0.0017518997192382812, 0.002102375030517578, 0.002452850341796875, 0.002803325653076172, 0.0031538009643554688, 0.0035042762756347656, 0.0038547515869140625, 0.004205226898193359, 0.004555702209472656, 0.004906177520751953, 0.00525665283203125, 0.005607128143310547, 0.005957603454589844, 0.006308078765869141, 0.0066585540771484375, 0.007009029388427734, 0.007359504699707031, 0.007709980010986328, 0.008060455322265625, 0.008410930633544922, 0.008761405944824219, 0.009111881256103516, 0.009462356567382812, 0.00981283187866211, 0.010163307189941406, 0.010513782501220703, 0.0108642578125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 1.0, 10.0, 16.0, 24.0, 30.0, 37.0, 66.0, 77.0, 80.0, 107.0, 94.0, 89.0, 76.0, 88.0, 60.0, 50.0, 28.0, 29.0, 14.0, 10.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007110595703125, -0.006877720355987549, -0.006644845008850098, -0.0064119696617126465, -0.006179094314575195, -0.005946218967437744, -0.005713343620300293, -0.005480468273162842, -0.005247592926025391, -0.0050147175788879395, -0.004781842231750488, -0.004548966884613037, -0.004316091537475586, -0.004083216190338135, -0.0038503408432006836, -0.0036174654960632324, -0.0033845901489257812, -0.00315171480178833, -0.002918839454650879, -0.0026859641075134277, -0.0024530887603759766, -0.0022202134132385254, -0.0019873380661010742, -0.001754462718963623, -0.0015215873718261719, -0.0012887120246887207, -0.0010558366775512695, -0.0008229613304138184, -0.0005900859832763672, -0.000357210636138916, -0.00012433528900146484, 0.00010854005813598633, 0.0003414154052734375, 0.0005742907524108887, 0.0008071660995483398, 0.001040041446685791, 0.0012729167938232422, 0.0015057921409606934, 0.0017386674880981445, 0.0019715428352355957, 0.002204418182373047, 0.002437293529510498, 0.0026701688766479492, 0.0029030442237854004, 0.0031359195709228516, 0.0033687949180603027, 0.003601670265197754, 0.003834545612335205, 0.004067420959472656, 0.004300296306610107, 0.004533171653747559, 0.00476604700088501, 0.004998922348022461, 0.005231797695159912, 0.005464673042297363, 0.0056975483894348145, 0.005930423736572266, 0.006163299083709717, 0.006396174430847168, 0.006629049777984619, 0.00686192512512207, 0.0070948004722595215, 0.007327675819396973, 0.007560551166534424, 0.007793426513671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 12.0, 4.0, 15.0, 20.0, 22.0, 39.0, 46.0, 66.0, 95.0, 138.0, 216.0, 322.0, 574.0, 946.0, 1606.0, 3131.0, 6785.0, 16993.0, 55321.0, 367516.0, 3414900.0, 253067.0, 45307.0, 14549.0, 5923.0, 2792.0, 1437.0, 881.0, 524.0, 327.0, 202.0, 160.0, 119.0, 60.0, 45.0, 32.0, 31.0, 16.0, 15.0, 11.0, 7.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.006683349609375, -0.006489217281341553, -0.0062950849533081055, -0.006100952625274658, -0.005906820297241211, -0.005712687969207764, -0.005518555641174316, -0.005324423313140869, -0.005130290985107422, -0.004936158657073975, -0.004742026329040527, -0.00454789400100708, -0.004353761672973633, -0.0041596293449401855, -0.003965497016906738, -0.003771364688873291, -0.0035772323608398438, -0.0033831000328063965, -0.0031889677047729492, -0.002994835376739502, -0.0028007030487060547, -0.0026065707206726074, -0.00241243839263916, -0.002218306064605713, -0.0020241737365722656, -0.0018300414085388184, -0.001635909080505371, -0.0014417767524719238, -0.0012476444244384766, -0.0010535120964050293, -0.000859379768371582, -0.0006652474403381348, -0.0004711151123046875, -0.00027698278427124023, -8.285045623779297e-05, 0.0001112818717956543, 0.00030541419982910156, 0.0004995465278625488, 0.0006936788558959961, 0.0008878111839294434, 0.0010819435119628906, 0.0012760758399963379, 0.0014702081680297852, 0.0016643404960632324, 0.0018584728240966797, 0.002052605152130127, 0.0022467374801635742, 0.0024408698081970215, 0.0026350021362304688, 0.002829134464263916, 0.0030232667922973633, 0.0032173991203308105, 0.003411531448364258, 0.003605663776397705, 0.0037997961044311523, 0.0039939284324646, 0.004188060760498047, 0.004382193088531494, 0.004576325416564941, 0.004770457744598389, 0.004964590072631836, 0.005158722400665283, 0.0053528547286987305, 0.005546987056732178, 0.005741119384765625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 5.0, 4.0, 8.0, 8.0, 9.0, 16.0, 15.0, 40.0, 49.0, 102.0, 218.0, 569.0, 1637.0, 782.0, 290.0, 127.0, 70.0, 40.0, 23.0, 15.0, 12.0, 10.0, 5.0, 5.0, 5.0, 6.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005889892578125, -0.005714774131774902, -0.005539655685424805, -0.005364537239074707, -0.005189418792724609, -0.005014300346374512, -0.004839181900024414, -0.004664063453674316, -0.004488945007324219, -0.004313826560974121, -0.0041387081146240234, -0.003963589668273926, -0.003788471221923828, -0.0036133527755737305, -0.003438234329223633, -0.003263115882873535, -0.0030879974365234375, -0.00291287899017334, -0.002737760543823242, -0.0025626420974731445, -0.002387523651123047, -0.0022124052047729492, -0.0020372867584228516, -0.001862168312072754, -0.0016870498657226562, -0.0015119314193725586, -0.001336812973022461, -0.0011616945266723633, -0.0009865760803222656, -0.000811457633972168, -0.0006363391876220703, -0.00046122074127197266, -0.000286102294921875, -0.00011098384857177734, 6.413459777832031e-05, 0.00023925304412841797, 0.0004143714904785156, 0.0005894899368286133, 0.0007646083831787109, 0.0009397268295288086, 0.0011148452758789062, 0.001289963722229004, 0.0014650821685791016, 0.0016402006149291992, 0.0018153190612792969, 0.0019904375076293945, 0.002165555953979492, 0.00234067440032959, 0.0025157928466796875, 0.002690911293029785, 0.002866029739379883, 0.0030411481857299805, 0.003216266632080078, 0.0033913850784301758, 0.0035665035247802734, 0.003741621971130371, 0.003916740417480469, 0.004091858863830566, 0.004266977310180664, 0.004442095756530762, 0.004617214202880859, 0.004792332649230957, 0.004967451095581055, 0.005142569541931152, 0.00531768798828125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 12.0, 13.0, 46.0, 118.0, 270.0, 291.0, 154.0, 73.0, 14.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06371309608221054, -0.062490664422512054, -0.06126823276281357, -0.06004580110311508, -0.058823369443416595, -0.05760094150900841, -0.05637850984930992, -0.055156078189611435, -0.05393364652991295, -0.05271121487021446, -0.051488783210515976, -0.05026635155081749, -0.0490439236164093, -0.047821491956710815, -0.04659906029701233, -0.04537662863731384, -0.044154196977615356, -0.04293176531791687, -0.041709333658218384, -0.0404869019985199, -0.03926447033882141, -0.03804204240441322, -0.03681961074471474, -0.03559717908501625, -0.034374747425317764, -0.03315231576561928, -0.03192988410592079, -0.030707454308867455, -0.029485022649168968, -0.028262590989470482, -0.027040161192417145, -0.02581772953271866, -0.024595297873020172, -0.023372866213321686, -0.0221504345536232, -0.020928004756569862, -0.019705573096871376, -0.01848314143717289, -0.017260711640119553, -0.016038279980421066, -0.01481584832072258, -0.013593416661024094, -0.012370985932648182, -0.01114855520427227, -0.009926123544573784, -0.008703691884875298, -0.007481261156499386, -0.006258830428123474, -0.005036398768424988, -0.0038139675743877888, -0.0025915363803505898, -0.0013691051863133907, -0.0001466739922761917, 0.0010757572017610073, 0.0022981883957982063, 0.003520619124174118, 0.004743050783872604, 0.005965481977909803, 0.007187913171947002, 0.008410343900322914, 0.0096327755600214, 0.010855207219719887, 0.012077637948095798, 0.01330006867647171, 0.014522500336170197]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 9.0, 5.0, 10.0, 5.0, 8.0, 13.0, 13.0, 17.0, 13.0, 20.0, 16.0, 26.0, 26.0, 28.0, 37.0, 43.0, 26.0, 36.0, 49.0, 35.0, 42.0, 31.0, 33.0, 46.0, 39.0, 52.0, 30.0, 31.0, 29.0, 29.0, 27.0, 28.0, 16.0, 21.0, 16.0, 16.0, 19.0, 15.0, 5.0, 6.0, 9.0, 2.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007452547550201416, -0.007194121368229389, -0.006935695186257362, -0.0066772690042853355, -0.006418842822313309, -0.006160416640341282, -0.005901990458369255, -0.005643564276397228, -0.005385138094425201, -0.005126711912453175, -0.004868285730481148, -0.004609859548509121, -0.004351433366537094, -0.004093007184565067, -0.0038345810025930405, -0.0035761548206210136, -0.003317728638648987, -0.00305930245667696, -0.002800876274704933, -0.0025424500927329063, -0.0022840239107608795, -0.0020255977287888527, -0.0017671715468168259, -0.001508745364844799, -0.0012503191828727722, -0.0009918930009007454, -0.0007334668189287186, -0.00047504063695669174, -0.00021661445498466492, 4.181172698736191e-05, 0.00030023790895938873, 0.0005586640909314156, 0.0008170902729034424, 0.0010755164548754692, 0.001333942636847496, 0.0015923688188195229, 0.0018507950007915497, 0.0021092211827635765, 0.0023676473647356033, 0.00262607354670763, 0.002884499728679657, 0.003142925910651684, 0.0034013520926237106, 0.0036597782745957375, 0.003918204456567764, 0.004176630638539791, 0.004435056820511818, 0.004693483002483845, 0.004951909184455872, 0.005210335366427898, 0.005468761548399925, 0.005727187730371952, 0.005985613912343979, 0.006244040094316006, 0.0065024662762880325, 0.006760892458260059, 0.007019318640232086, 0.007277744822204113, 0.00753617100417614, 0.007794597186148167, 0.008053023368120193, 0.00831144955009222, 0.008569875732064247, 0.008828301914036274, 0.0090867280960083]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 9.0, 10.0, 15.0, 17.0, 23.0, 40.0, 59.0, 100.0, 149.0, 249.0, 445.0, 1014.0, 2357.0, 7251.0, 30166.0, 205809.0, 680213.0, 95311.0, 17227.0, 4678.0, 1690.0, 714.0, 426.0, 194.0, 142.0, 85.0, 42.0, 41.0, 12.0, 17.0, 17.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01548004150390625, -0.014913439750671387, -0.014346837997436523, -0.01378023624420166, -0.013213634490966797, -0.012647032737731934, -0.01208043098449707, -0.011513829231262207, -0.010947227478027344, -0.01038062572479248, -0.009814023971557617, -0.009247422218322754, -0.00868082046508789, -0.008114218711853027, -0.007547616958618164, -0.006981015205383301, -0.0064144134521484375, -0.005847811698913574, -0.005281209945678711, -0.004714608192443848, -0.004148006439208984, -0.003581404685974121, -0.003014802932739258, -0.0024482011795043945, -0.0018815994262695312, -0.001314997673034668, -0.0007483959197998047, -0.0001817941665649414, 0.0003848075866699219, 0.0009514093399047852, 0.0015180110931396484, 0.0020846128463745117, 0.002651214599609375, 0.0032178163528442383, 0.0037844181060791016, 0.004351019859313965, 0.004917621612548828, 0.005484223365783691, 0.006050825119018555, 0.006617426872253418, 0.007184028625488281, 0.0077506303787231445, 0.008317232131958008, 0.008883833885192871, 0.009450435638427734, 0.010017037391662598, 0.010583639144897461, 0.011150240898132324, 0.011716842651367188, 0.01228344440460205, 0.012850046157836914, 0.013416647911071777, 0.01398324966430664, 0.014549851417541504, 0.015116453170776367, 0.01568305492401123, 0.016249656677246094, 0.016816258430480957, 0.01738286018371582, 0.017949461936950684, 0.018516063690185547, 0.01908266544342041, 0.019649267196655273, 0.020215868949890137, 0.020782470703125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 5.0, 2.0, 7.0, 8.0, 19.0, 26.0, 37.0, 47.0, 91.0, 84.0, 110.0, 102.0, 97.0, 91.0, 77.0, 70.0, 52.0, 29.0, 21.0, 10.0, 11.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007587432861328125, -0.00734025239944458, -0.007093071937561035, -0.00684589147567749, -0.006598711013793945, -0.0063515305519104, -0.0061043500900268555, -0.0058571696281433105, -0.005609989166259766, -0.005362808704376221, -0.005115628242492676, -0.004868447780609131, -0.004621267318725586, -0.004374086856842041, -0.004126906394958496, -0.003879725933074951, -0.0036325454711914062, -0.0033853650093078613, -0.0031381845474243164, -0.0028910040855407715, -0.0026438236236572266, -0.0023966431617736816, -0.0021494626998901367, -0.0019022822380065918, -0.0016551017761230469, -0.001407921314239502, -0.001160740852355957, -0.0009135603904724121, -0.0006663799285888672, -0.00041919946670532227, -0.00017201900482177734, 7.516145706176758e-05, 0.0003223419189453125, 0.0005695223808288574, 0.0008167028427124023, 0.0010638833045959473, 0.0013110637664794922, 0.0015582442283630371, 0.001805424690246582, 0.002052605152130127, 0.002299785614013672, 0.002546966075897217, 0.0027941465377807617, 0.0030413269996643066, 0.0032885074615478516, 0.0035356879234313965, 0.0037828683853149414, 0.004030048847198486, 0.004277229309082031, 0.004524409770965576, 0.004771590232849121, 0.005018770694732666, 0.005265951156616211, 0.005513131618499756, 0.005760312080383301, 0.006007492542266846, 0.006254673004150391, 0.0065018534660339355, 0.0067490339279174805, 0.006996214389801025, 0.00724339485168457, 0.007490575313568115, 0.00773775577545166, 0.007984936237335205, 0.00823211669921875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 9.0, 6.0, 15.0, 14.0, 7.0, 21.0, 42.0, 42.0, 59.0, 101.0, 145.0, 314.0, 567.0, 1352.0, 3368.0, 9094.0, 27584.0, 103239.0, 456883.0, 337955.0, 74639.0, 21066.0, 7100.0, 2656.0, 1063.0, 498.0, 270.0, 150.0, 91.0, 56.0, 34.0, 26.0, 19.0, 14.0, 13.0, 6.0, 6.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.01042938232421875, -0.010121583938598633, -0.009813785552978516, -0.009505987167358398, -0.009198188781738281, -0.008890390396118164, -0.008582592010498047, -0.00827479362487793, -0.007966995239257812, -0.007659196853637695, -0.007351398468017578, -0.007043600082397461, -0.006735801696777344, -0.0064280033111572266, -0.006120204925537109, -0.005812406539916992, -0.005504608154296875, -0.005196809768676758, -0.004889011383056641, -0.0045812129974365234, -0.004273414611816406, -0.003965616226196289, -0.003657817840576172, -0.0033500194549560547, -0.0030422210693359375, -0.0027344226837158203, -0.002426624298095703, -0.002118825912475586, -0.0018110275268554688, -0.0015032291412353516, -0.0011954307556152344, -0.0008876323699951172, -0.000579833984375, -0.0002720355987548828, 3.5762786865234375e-05, 0.00034356117248535156, 0.0006513595581054688, 0.0009591579437255859, 0.0012669563293457031, 0.0015747547149658203, 0.0018825531005859375, 0.0021903514862060547, 0.002498149871826172, 0.002805948257446289, 0.0031137466430664062, 0.0034215450286865234, 0.0037293434143066406, 0.004037141799926758, 0.004344940185546875, 0.004652738571166992, 0.004960536956787109, 0.0052683353424072266, 0.005576133728027344, 0.005883932113647461, 0.006191730499267578, 0.006499528884887695, 0.0068073272705078125, 0.00711512565612793, 0.007422924041748047, 0.007730722427368164, 0.008038520812988281, 0.008346319198608398, 0.008654117584228516, 0.008961915969848633, 0.00926971435546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 2.0, 3.0, 5.0, 9.0, 8.0, 11.0, 8.0, 17.0, 15.0, 21.0, 18.0, 36.0, 36.0, 28.0, 31.0, 37.0, 45.0, 61.0, 52.0, 47.0, 46.0, 52.0, 38.0, 52.0, 43.0, 34.0, 32.0, 40.0, 26.0, 33.0, 21.0, 22.0, 14.0, 13.0, 12.0, 10.0, 10.0, 5.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0078125, -0.007526516914367676, -0.0072405338287353516, -0.006954550743103027, -0.006668567657470703, -0.006382584571838379, -0.006096601486206055, -0.0058106184005737305, -0.005524635314941406, -0.005238652229309082, -0.004952669143676758, -0.004666686058044434, -0.004380702972412109, -0.004094719886779785, -0.003808736801147461, -0.0035227537155151367, -0.0032367706298828125, -0.0029507875442504883, -0.002664804458618164, -0.00237882137298584, -0.0020928382873535156, -0.0018068552017211914, -0.0015208721160888672, -0.001234889030456543, -0.0009489059448242188, -0.0006629228591918945, -0.0003769397735595703, -9.09566879272461e-05, 0.00019502639770507812, 0.00048100948333740234, 0.0007669925689697266, 0.0010529756546020508, 0.001338958740234375, 0.0016249418258666992, 0.0019109249114990234, 0.0021969079971313477, 0.002482891082763672, 0.002768874168395996, 0.0030548572540283203, 0.0033408403396606445, 0.0036268234252929688, 0.003912806510925293, 0.004198789596557617, 0.004484772682189941, 0.004770755767822266, 0.00505673885345459, 0.005342721939086914, 0.005628705024719238, 0.0059146881103515625, 0.006200671195983887, 0.006486654281616211, 0.006772637367248535, 0.007058620452880859, 0.007344603538513184, 0.007630586624145508, 0.007916569709777832, 0.008202552795410156, 0.00848853588104248, 0.008774518966674805, 0.009060502052307129, 0.009346485137939453, 0.009632468223571777, 0.009918451309204102, 0.010204434394836426, 0.01049041748046875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 8.0, 13.0, 17.0, 31.0, 43.0, 45.0, 93.0, 152.0, 236.0, 413.0, 716.0, 1383.0, 3135.0, 8137.0, 24687.0, 99395.0, 579790.0, 259720.0, 47162.0, 14086.0, 4922.0, 2040.0, 1012.0, 524.0, 297.0, 177.0, 115.0, 73.0, 48.0, 33.0, 19.0, 12.0, 7.0, 2.0, 7.0, 1.0, 3.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030231475830078125, -0.0029180049896240234, -0.0028128623962402344, -0.0027077198028564453, -0.0026025772094726562, -0.002497434616088867, -0.002392292022705078, -0.002287149429321289, -0.0021820068359375, -0.002076864242553711, -0.001971721649169922, -0.0018665790557861328, -0.0017614364624023438, -0.0016562938690185547, -0.0015511512756347656, -0.0014460086822509766, -0.0013408660888671875, -0.0012357234954833984, -0.0011305809020996094, -0.0010254383087158203, -0.0009202957153320312, -0.0008151531219482422, -0.0007100105285644531, -0.0006048679351806641, -0.000499725341796875, -0.00039458274841308594, -0.0002894401550292969, -0.0001842975616455078, -7.915496826171875e-05, 2.5987625122070312e-05, 0.00013113021850585938, 0.00023627281188964844, 0.0003414154052734375, 0.00044655799865722656, 0.0005517005920410156, 0.0006568431854248047, 0.0007619857788085938, 0.0008671283721923828, 0.0009722709655761719, 0.001077413558959961, 0.00118255615234375, 0.001287698745727539, 0.0013928413391113281, 0.0014979839324951172, 0.0016031265258789062, 0.0017082691192626953, 0.0018134117126464844, 0.0019185543060302734, 0.0020236968994140625, 0.0021288394927978516, 0.0022339820861816406, 0.0023391246795654297, 0.0024442672729492188, 0.002549409866333008, 0.002654552459716797, 0.002759695053100586, 0.002864837646484375, 0.002969980239868164, 0.003075122833251953, 0.003180265426635742, 0.0032854080200195312, 0.0033905506134033203, 0.0034956932067871094, 0.0036008358001708984, 0.0037059783935546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 5.0, 8.0, 12.0, 11.0, 18.0, 25.0, 23.0, 34.0, 52.0, 41.0, 53.0, 54.0, 66.0, 58.0, 70.0, 56.0, 52.0, 50.0, 49.0, 44.0, 30.0, 42.0, 29.0, 34.0, 20.0, 10.0, 12.0, 9.0, 10.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.1457672119140625e-06, -2.086162567138672e-06, -2.0265579223632812e-06, -1.9669532775878906e-06, -1.9073486328125e-06, -1.8477439880371094e-06, -1.7881393432617188e-06, -1.7285346984863281e-06, -1.6689300537109375e-06, -1.6093254089355469e-06, -1.5497207641601562e-06, -1.4901161193847656e-06, -1.430511474609375e-06, -1.3709068298339844e-06, -1.3113021850585938e-06, -1.2516975402832031e-06, -1.1920928955078125e-06, -1.1324882507324219e-06, -1.0728836059570312e-06, -1.0132789611816406e-06, -9.5367431640625e-07, -8.940696716308594e-07, -8.344650268554688e-07, -7.748603820800781e-07, -7.152557373046875e-07, -6.556510925292969e-07, -5.960464477539062e-07, -5.364418029785156e-07, -4.76837158203125e-07, -4.172325134277344e-07, -3.5762786865234375e-07, -2.980232238769531e-07, -2.384185791015625e-07, -1.7881393432617188e-07, -1.1920928955078125e-07, -5.960464477539063e-08, 0.0, 5.960464477539063e-08, 1.1920928955078125e-07, 1.7881393432617188e-07, 2.384185791015625e-07, 2.980232238769531e-07, 3.5762786865234375e-07, 4.172325134277344e-07, 4.76837158203125e-07, 5.364418029785156e-07, 5.960464477539062e-07, 6.556510925292969e-07, 7.152557373046875e-07, 7.748603820800781e-07, 8.344650268554688e-07, 8.940696716308594e-07, 9.5367431640625e-07, 1.0132789611816406e-06, 1.0728836059570312e-06, 1.1324882507324219e-06, 1.1920928955078125e-06, 1.2516975402832031e-06, 1.3113021850585938e-06, 1.3709068298339844e-06, 1.430511474609375e-06, 1.4901161193847656e-06, 1.5497207641601562e-06, 1.6093254089355469e-06, 1.6689300537109375e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 13.0, 20.0, 25.0, 39.0, 88.0, 159.0, 266.0, 720.0, 2483.0, 15213.0, 328514.0, 672634.0, 23366.0, 3399.0, 897.0, 359.0, 170.0, 85.0, 40.0, 28.0, 16.0, 5.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00650787353515625, -0.006267666816711426, -0.0060274600982666016, -0.005787253379821777, -0.005547046661376953, -0.005306839942932129, -0.005066633224487305, -0.0048264265060424805, -0.004586219787597656, -0.004346013069152832, -0.004105806350708008, -0.0038655996322631836, -0.0036253929138183594, -0.003385186195373535, -0.003144979476928711, -0.0029047727584838867, -0.0026645660400390625, -0.0024243593215942383, -0.002184152603149414, -0.0019439458847045898, -0.0017037391662597656, -0.0014635324478149414, -0.0012233257293701172, -0.000983119010925293, -0.0007429122924804688, -0.0005027055740356445, -0.0002624988555908203, -2.2292137145996094e-05, 0.00021791458129882812, 0.00045812129974365234, 0.0006983280181884766, 0.0009385347366333008, 0.001178741455078125, 0.0014189481735229492, 0.0016591548919677734, 0.0018993616104125977, 0.002139568328857422, 0.002379775047302246, 0.0026199817657470703, 0.0028601884841918945, 0.0031003952026367188, 0.003340601921081543, 0.003580808639526367, 0.0038210153579711914, 0.004061222076416016, 0.00430142879486084, 0.004541635513305664, 0.004781842231750488, 0.0050220489501953125, 0.005262255668640137, 0.005502462387084961, 0.005742669105529785, 0.005982875823974609, 0.006223082542419434, 0.006463289260864258, 0.006703495979309082, 0.006943702697753906, 0.0071839094161987305, 0.007424116134643555, 0.007664322853088379, 0.007904529571533203, 0.008144736289978027, 0.008384943008422852, 0.008625149726867676, 0.0088653564453125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 14.0, 12.0, 21.0, 25.0, 42.0, 72.0, 142.0, 232.0, 174.0, 111.0, 40.0, 30.0, 30.0, 17.0, 15.0, 12.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.007625579833984375, -0.00746607780456543, -0.007306575775146484, -0.007147073745727539, -0.006987571716308594, -0.0068280696868896484, -0.006668567657470703, -0.006509065628051758, -0.0063495635986328125, -0.006190061569213867, -0.006030559539794922, -0.0058710575103759766, -0.005711555480957031, -0.005552053451538086, -0.005392551422119141, -0.005233049392700195, -0.00507354736328125, -0.004914045333862305, -0.004754543304443359, -0.004595041275024414, -0.004435539245605469, -0.0042760372161865234, -0.004116535186767578, -0.003957033157348633, -0.0037975311279296875, -0.003638029098510742, -0.003478527069091797, -0.0033190250396728516, -0.0031595230102539062, -0.003000020980834961, -0.0028405189514160156, -0.0026810169219970703, -0.002521514892578125, -0.0023620128631591797, -0.0022025108337402344, -0.002043008804321289, -0.0018835067749023438, -0.0017240047454833984, -0.0015645027160644531, -0.0014050006866455078, -0.0012454986572265625, -0.0010859966278076172, -0.0009264945983886719, -0.0007669925689697266, -0.0006074905395507812, -0.00044798851013183594, -0.0002884864807128906, -0.0001289844512939453, 3.0517578125e-05, 0.0001900196075439453, 0.0003495216369628906, 0.0005090236663818359, 0.0006685256958007812, 0.0008280277252197266, 0.0009875297546386719, 0.0011470317840576172, 0.0013065338134765625, 0.0014660358428955078, 0.0016255378723144531, 0.0017850399017333984, 0.0019445419311523438, 0.002104043960571289, 0.0022635459899902344, 0.0024230480194091797, 0.002582550048828125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 3.0, 7.0, 6.0, 10.0, 24.0, 18.0, 38.0, 54.0, 96.0, 127.0, 167.0, 158.0, 114.0, 73.0, 44.0, 21.0, 15.0, 13.0, 8.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032931096851825714, -0.03180396929383278, -0.030676843598484993, -0.029549717903137207, -0.028422590345144272, -0.027295464649796486, -0.0261683389544487, -0.025041211396455765, -0.02391408570110798, -0.022786960005760193, -0.021659832447767258, -0.020532706752419472, -0.019405581057071686, -0.01827845349907875, -0.017151327803730965, -0.01602420210838318, -0.014897074550390244, -0.013769947923719883, -0.012642821297049522, -0.011515695601701736, -0.010388568975031376, -0.009261442348361015, -0.00813431665301323, -0.007007190026342869, -0.005880063399672508, -0.004752936773002148, -0.0036258106119930744, -0.0024986842181533575, -0.0013715578243136406, -0.00024443119764328003, 0.0008826949633657932, 0.0020098211243748665, 0.0031369440257549286, 0.004264070652425289, 0.005391196813434362, 0.006518322974443436, 0.007645449601113796, 0.008772576227784157, 0.009899701923131943, 0.011026828549802303, 0.012153955176472664, 0.013281081803143024, 0.014408208429813385, 0.015535334125161171, 0.016662459820508957, 0.017789587378501892, 0.018916713073849678, 0.020043838769197464, 0.0211709663271904, 0.022298092022538185, 0.02342521958053112, 0.024552345275878906, 0.02567947283387184, 0.026806598529219627, 0.027933724224567413, 0.02906085178256035, 0.030187977477908134, 0.03131510317325592, 0.032442230731248856, 0.03356935828924179, 0.03469648212194443, 0.03582360967993736, 0.0369507372379303, 0.038077861070632935, 0.03920498862862587]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 0.0, 6.0, 2.0, 6.0, 5.0, 7.0, 13.0, 9.0, 10.0, 8.0, 18.0, 19.0, 28.0, 23.0, 20.0, 31.0, 23.0, 20.0, 37.0, 37.0, 40.0, 42.0, 30.0, 20.0, 34.0, 53.0, 45.0, 37.0, 32.0, 28.0, 32.0, 34.0, 33.0, 21.0, 19.0, 27.0, 23.0, 16.0, 19.0, 20.0, 15.0, 10.0, 9.0, 8.0, 6.0, 10.0, 4.0, 7.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.020731806755065918, -0.020082686096429825, -0.01943356543779373, -0.01878444477915764, -0.018135324120521545, -0.017486203461885452, -0.01683708280324936, -0.016187962144613266, -0.015538841485977173, -0.01488972082734108, -0.014240600168704987, -0.013591479510068893, -0.0129423588514328, -0.012293238192796707, -0.011644117534160614, -0.010994996875524521, -0.010345876216888428, -0.009696755558252335, -0.009047634899616241, -0.008398514240980148, -0.007749393582344055, -0.007100272923707962, -0.006451152265071869, -0.005802031606435776, -0.005152910947799683, -0.0045037902891635895, -0.0038546696305274963, -0.003205548971891403, -0.00255642831325531, -0.001907307654619217, -0.0012581869959831238, -0.0006090663373470306, 4.00543212890625e-05, 0.0006891749799251556, 0.0013382956385612488, 0.001987416297197342, 0.002636536955833435, 0.003285657614469528, 0.003934778273105621, 0.0045838989317417145, 0.005233019590377808, 0.005882140249013901, 0.006531260907649994, 0.007180381566286087, 0.00782950222492218, 0.008478622883558273, 0.009127743542194366, 0.00977686420083046, 0.010425984859466553, 0.011075105518102646, 0.011724226176738739, 0.012373346835374832, 0.013022467494010925, 0.013671588152647018, 0.014320708811283112, 0.014969829469919205, 0.015618950128555298, 0.01626807078719139, 0.016917191445827484, 0.017566312104463577, 0.01821543276309967, 0.018864553421735764, 0.019513674080371857, 0.02016279473900795, 0.020811915397644043]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 6.0, 7.0, 16.0, 21.0, 37.0, 55.0, 69.0, 148.0, 235.0, 402.0, 840.0, 2231.0, 11168.0, 324928.0, 3818715.0, 28961.0, 3988.0, 1153.0, 561.0, 311.0, 163.0, 94.0, 60.0, 46.0, 17.0, 12.0, 6.0, 10.0, 4.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.021392822265625, -0.020767688751220703, -0.020142555236816406, -0.01951742172241211, -0.018892288208007812, -0.018267154693603516, -0.01764202117919922, -0.017016887664794922, -0.016391754150390625, -0.015766620635986328, -0.015141487121582031, -0.014516353607177734, -0.013891220092773438, -0.01326608657836914, -0.012640953063964844, -0.012015819549560547, -0.01139068603515625, -0.010765552520751953, -0.010140419006347656, -0.00951528549194336, -0.008890151977539062, -0.008265018463134766, -0.007639884948730469, -0.007014751434326172, -0.006389617919921875, -0.005764484405517578, -0.005139350891113281, -0.004514217376708984, -0.0038890838623046875, -0.0032639503479003906, -0.0026388168334960938, -0.002013683319091797, -0.0013885498046875, -0.0007634162902832031, -0.00013828277587890625, 0.0004868507385253906, 0.0011119842529296875, 0.0017371177673339844, 0.0023622512817382812, 0.002987384796142578, 0.003612518310546875, 0.004237651824951172, 0.004862785339355469, 0.005487918853759766, 0.0061130523681640625, 0.006738185882568359, 0.007363319396972656, 0.007988452911376953, 0.00861358642578125, 0.009238719940185547, 0.009863853454589844, 0.01048898696899414, 0.011114120483398438, 0.011739253997802734, 0.012364387512207031, 0.012989521026611328, 0.013614654541015625, 0.014239788055419922, 0.014864921569824219, 0.015490055084228516, 0.016115188598632812, 0.01674032211303711, 0.017365455627441406, 0.017990589141845703, 0.01861572265625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 8.0, 18.0, 20.0, 31.0, 32.0, 72.0, 84.0, 102.0, 105.0, 105.0, 103.0, 81.0, 77.0, 55.0, 35.0, 28.0, 21.0, 7.0, 5.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007480621337890625, -0.007232725620269775, -0.006984829902648926, -0.006736934185028076, -0.0064890384674072266, -0.006241142749786377, -0.005993247032165527, -0.005745351314544678, -0.005497455596923828, -0.0052495598793029785, -0.005001664161682129, -0.004753768444061279, -0.00450587272644043, -0.00425797700881958, -0.0040100812911987305, -0.003762185573577881, -0.0035142898559570312, -0.0032663941383361816, -0.003018498420715332, -0.0027706027030944824, -0.002522706985473633, -0.002274811267852783, -0.0020269155502319336, -0.001779019832611084, -0.0015311241149902344, -0.0012832283973693848, -0.0010353326797485352, -0.0007874369621276855, -0.0005395412445068359, -0.00029164552688598633, -4.374980926513672e-05, 0.0002041459083557129, 0.0004520416259765625, 0.0006999373435974121, 0.0009478330612182617, 0.0011957287788391113, 0.001443624496459961, 0.0016915202140808105, 0.0019394159317016602, 0.0021873116493225098, 0.0024352073669433594, 0.002683103084564209, 0.0029309988021850586, 0.003178894519805908, 0.003426790237426758, 0.0036746859550476074, 0.003922581672668457, 0.004170477390289307, 0.004418373107910156, 0.004666268825531006, 0.0049141645431518555, 0.005162060260772705, 0.005409955978393555, 0.005657851696014404, 0.005905747413635254, 0.0061536431312561035, 0.006401538848876953, 0.006649434566497803, 0.006897330284118652, 0.007145226001739502, 0.0073931217193603516, 0.007641017436981201, 0.00788891315460205, 0.0081368088722229, 0.00838470458984375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 6.0, 3.0, 6.0, 13.0, 14.0, 24.0, 33.0, 50.0, 57.0, 119.0, 154.0, 263.0, 418.0, 780.0, 1291.0, 2632.0, 5221.0, 12077.0, 34224.0, 161464.0, 3160778.0, 705092.0, 72632.0, 20477.0, 8030.0, 3854.0, 1972.0, 1014.0, 590.0, 369.0, 207.0, 132.0, 85.0, 65.0, 39.0, 18.0, 22.0, 13.0, 16.0, 11.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005725860595703125, -0.005519688129425049, -0.005313515663146973, -0.0051073431968688965, -0.00490117073059082, -0.004694998264312744, -0.004488825798034668, -0.004282653331756592, -0.004076480865478516, -0.0038703083992004395, -0.0036641359329223633, -0.003457963466644287, -0.003251791000366211, -0.0030456185340881348, -0.0028394460678100586, -0.0026332736015319824, -0.0024271011352539062, -0.00222092866897583, -0.002014756202697754, -0.0018085837364196777, -0.0016024112701416016, -0.0013962388038635254, -0.0011900663375854492, -0.000983893871307373, -0.0007777214050292969, -0.0005715489387512207, -0.00036537647247314453, -0.00015920400619506836, 4.696846008300781e-05, 0.000253140926361084, 0.00045931339263916016, 0.0006654858589172363, 0.0008716583251953125, 0.0010778307914733887, 0.0012840032577514648, 0.001490175724029541, 0.0016963481903076172, 0.0019025206565856934, 0.0021086931228637695, 0.0023148655891418457, 0.002521038055419922, 0.002727210521697998, 0.0029333829879760742, 0.0031395554542541504, 0.0033457279205322266, 0.0035519003868103027, 0.003758072853088379, 0.003964245319366455, 0.004170417785644531, 0.004376590251922607, 0.004582762718200684, 0.00478893518447876, 0.004995107650756836, 0.005201280117034912, 0.005407452583312988, 0.0056136250495910645, 0.005819797515869141, 0.006025969982147217, 0.006232142448425293, 0.006438314914703369, 0.006644487380981445, 0.0068506598472595215, 0.007056832313537598, 0.007263004779815674, 0.00746917724609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 8.0, 7.0, 8.0, 8.0, 15.0, 14.0, 42.0, 49.0, 134.0, 320.0, 1050.0, 1484.0, 532.0, 182.0, 77.0, 44.0, 23.0, 11.0, 20.0, 13.0, 8.0, 7.0, 9.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00550079345703125, -0.005252838134765625, -0.0050048828125, -0.004756927490234375, -0.00450897216796875, -0.004261016845703125, -0.0040130615234375, -0.003765106201171875, -0.00351715087890625, -0.003269195556640625, -0.003021240234375, -0.002773284912109375, -0.00252532958984375, -0.002277374267578125, -0.0020294189453125, -0.001781463623046875, -0.00153350830078125, -0.001285552978515625, -0.00103759765625, -0.000789642333984375, -0.00054168701171875, -0.000293731689453125, -4.57763671875e-05, 0.000202178955078125, 0.00045013427734375, 0.000698089599609375, 0.000946044921875, 0.001194000244140625, 0.00144195556640625, 0.001689910888671875, 0.0019378662109375, 0.002185821533203125, 0.00243377685546875, 0.002681732177734375, 0.0029296875, 0.003177642822265625, 0.00342559814453125, 0.003673553466796875, 0.0039215087890625, 0.004169464111328125, 0.00441741943359375, 0.004665374755859375, 0.004913330078125, 0.005161285400390625, 0.00540924072265625, 0.005657196044921875, 0.0059051513671875, 0.006153106689453125, 0.00640106201171875, 0.006649017333984375, 0.00689697265625, 0.007144927978515625, 0.00739288330078125, 0.007640838623046875, 0.0078887939453125, 0.008136749267578125, 0.00838470458984375, 0.008632659912109375, 0.008880615234375, 0.009128570556640625, 0.00937652587890625, 0.009624481201171875, 0.0098724365234375, 0.010120391845703125, 0.01036834716796875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 8.0, 15.0, 25.0, 62.0, 108.0, 160.0, 169.0, 172.0, 118.0, 65.0, 33.0, 22.0, 14.0, 8.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03788778930902481, -0.03697298839688301, -0.03605818375945091, -0.03514338284730911, -0.03422858193516731, -0.033313777297735214, -0.032398976385593414, -0.031484171748161316, -0.030569370836019516, -0.029654568061232567, -0.028739767149090767, -0.027824964374303818, -0.02691016159951687, -0.02599535882472992, -0.02508055791258812, -0.02416575513780117, -0.02325095236301422, -0.022336149588227272, -0.021421348676085472, -0.020506545901298523, -0.019591743126511574, -0.018676940351724625, -0.017762139439582825, -0.016847336664795876, -0.015932535752654076, -0.015017733909189701, -0.014102931134402752, -0.013188129290938377, -0.012273326516151428, -0.011358524672687054, -0.01044372282922268, -0.00952892005443573, -0.00861411727964878, -0.007699314970523119, -0.006784512661397457, -0.005869710817933083, -0.004954908043146133, -0.004040106199681759, -0.003125303890556097, -0.002210501581430435, -0.0012956992723047733, -0.0003808970213867724, 0.0005339052295312285, 0.0014487074222415686, 0.0023635097313672304, 0.0032783118076622486, 0.0041931141167879105, 0.005107916425913572, 0.006022718735039234, 0.006937521044164896, 0.007852323353290558, 0.008767125196754932, 0.009681927971541882, 0.010596729815006256, 0.011511532589793205, 0.01242633443325758, 0.013341136276721954, 0.014255938120186329, 0.015170740894973278, 0.016085542738437653, 0.017000345513224602, 0.01791514828801155, 0.01882994920015335, 0.0197447519749403, 0.02065955474972725]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 8.0, 14.0, 11.0, 12.0, 19.0, 26.0, 19.0, 40.0, 43.0, 39.0, 43.0, 33.0, 51.0, 47.0, 49.0, 48.0, 57.0, 51.0, 40.0, 40.0, 41.0, 35.0, 38.0, 33.0, 25.0, 21.0, 20.0, 14.0, 9.0, 15.0, 17.0, 7.0, 5.0, 5.0, 9.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.016137659549713135, -0.015669625252485275, -0.015201590955257416, -0.014733556658029556, -0.014265522360801697, -0.013797488063573837, -0.013329453766345978, -0.012861419469118118, -0.012393385171890259, -0.0119253508746624, -0.01145731657743454, -0.01098928228020668, -0.01052124798297882, -0.010053213685750961, -0.009585179388523102, -0.009117145091295242, -0.008649110794067383, -0.008181076496839523, -0.007713042199611664, -0.007245007902383804, -0.006776973605155945, -0.006308939307928085, -0.005840905010700226, -0.005372870713472366, -0.004904836416244507, -0.004436802119016647, -0.003968767821788788, -0.0035007335245609283, -0.003032699227333069, -0.0025646649301052094, -0.00209663063287735, -0.0016285963356494904, -0.0011605620384216309, -0.0006925277411937714, -0.00022449344396591187, 0.00024354085326194763, 0.0007115751504898071, 0.0011796094477176666, 0.0016476437449455261, 0.0021156780421733856, 0.002583712339401245, 0.0030517466366291046, 0.003519780933856964, 0.003987815231084824, 0.004455849528312683, 0.004923883825540543, 0.005391918122768402, 0.005859952419996262, 0.006327986717224121, 0.006796021014451981, 0.00726405531167984, 0.0077320896089077, 0.008200123906135559, 0.008668158203363419, 0.009136192500591278, 0.009604226797819138, 0.010072261095046997, 0.010540295392274857, 0.011008329689502716, 0.011476363986730576, 0.011944398283958435, 0.012412432581186295, 0.012880466878414154, 0.013348501175642014, 0.013816535472869873]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 11.0, 34.0, 42.0, 61.0, 146.0, 251.0, 590.0, 1751.0, 8216.0, 92397.0, 847948.0, 86555.0, 7722.0, 1713.0, 589.0, 243.0, 112.0, 74.0, 34.0, 24.0, 12.0, 13.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030426025390625, -0.029489517211914062, -0.028553009033203125, -0.027616500854492188, -0.02667999267578125, -0.025743484497070312, -0.024806976318359375, -0.023870468139648438, -0.0229339599609375, -0.021997451782226562, -0.021060943603515625, -0.020124435424804688, -0.01918792724609375, -0.018251419067382812, -0.017314910888671875, -0.016378402709960938, -0.01544189453125, -0.014505386352539062, -0.013568878173828125, -0.012632369995117188, -0.01169586181640625, -0.010759353637695312, -0.009822845458984375, -0.008886337280273438, -0.0079498291015625, -0.0070133209228515625, -0.006076812744140625, -0.0051403045654296875, -0.00420379638671875, -0.0032672882080078125, -0.002330780029296875, -0.0013942718505859375, -0.000457763671875, 0.0004787445068359375, 0.001415252685546875, 0.0023517608642578125, 0.00328826904296875, 0.0042247772216796875, 0.005161285400390625, 0.0060977935791015625, 0.0070343017578125, 0.007970809936523438, 0.008907318115234375, 0.009843826293945312, 0.01078033447265625, 0.011716842651367188, 0.012653350830078125, 0.013589859008789062, 0.0145263671875, 0.015462875366210938, 0.016399383544921875, 0.017335891723632812, 0.01827239990234375, 0.019208908081054688, 0.020145416259765625, 0.021081924438476562, 0.0220184326171875, 0.022954940795898438, 0.023891448974609375, 0.024827957153320312, 0.02576446533203125, 0.026700973510742188, 0.027637481689453125, 0.028573989868164062, 0.029510498046875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 6.0, 13.0, 18.0, 31.0, 35.0, 57.0, 82.0, 86.0, 120.0, 128.0, 100.0, 97.0, 81.0, 56.0, 37.0, 17.0, 23.0, 6.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0079803466796875, -0.007725358009338379, -0.007470369338989258, -0.007215380668640137, -0.006960391998291016, -0.0067054033279418945, -0.0064504146575927734, -0.006195425987243652, -0.005940437316894531, -0.00568544864654541, -0.005430459976196289, -0.005175471305847168, -0.004920482635498047, -0.004665493965148926, -0.004410505294799805, -0.004155516624450684, -0.0039005279541015625, -0.0036455392837524414, -0.0033905506134033203, -0.0031355619430541992, -0.002880573272705078, -0.002625584602355957, -0.002370595932006836, -0.002115607261657715, -0.0018606185913085938, -0.0016056299209594727, -0.0013506412506103516, -0.0010956525802612305, -0.0008406639099121094, -0.0005856752395629883, -0.0003306865692138672, -7.56978988647461e-05, 0.000179290771484375, 0.0004342794418334961, 0.0006892681121826172, 0.0009442567825317383, 0.0011992454528808594, 0.0014542341232299805, 0.0017092227935791016, 0.0019642114639282227, 0.0022192001342773438, 0.002474188804626465, 0.002729177474975586, 0.002984166145324707, 0.003239154815673828, 0.0034941434860229492, 0.0037491321563720703, 0.004004120826721191, 0.0042591094970703125, 0.004514098167419434, 0.004769086837768555, 0.005024075508117676, 0.005279064178466797, 0.005534052848815918, 0.005789041519165039, 0.00604403018951416, 0.006299018859863281, 0.006554007530212402, 0.0068089962005615234, 0.0070639848709106445, 0.007318973541259766, 0.007573962211608887, 0.007828950881958008, 0.008083939552307129, 0.00833892822265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 10.0, 16.0, 22.0, 40.0, 57.0, 80.0, 120.0, 195.0, 302.0, 558.0, 1020.0, 2352.0, 5519.0, 15477.0, 51900.0, 233642.0, 531456.0, 150094.0, 35939.0, 11536.0, 4204.0, 1871.0, 906.0, 488.0, 272.0, 164.0, 102.0, 53.0, 49.0, 28.0, 14.0, 11.0, 17.0, 8.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01067352294921875, -0.01033318042755127, -0.009992837905883789, -0.009652495384216309, -0.009312152862548828, -0.008971810340881348, -0.008631467819213867, -0.008291125297546387, -0.007950782775878906, -0.007610440254211426, -0.007270097732543945, -0.006929755210876465, -0.006589412689208984, -0.006249070167541504, -0.0059087276458740234, -0.005568385124206543, -0.0052280426025390625, -0.004887700080871582, -0.0045473575592041016, -0.004207015037536621, -0.0038666725158691406, -0.00352632999420166, -0.0031859874725341797, -0.0028456449508666992, -0.0025053024291992188, -0.0021649599075317383, -0.0018246173858642578, -0.0014842748641967773, -0.0011439323425292969, -0.0008035898208618164, -0.00046324729919433594, -0.00012290477752685547, 0.000217437744140625, 0.0005577802658081055, 0.0008981227874755859, 0.0012384653091430664, 0.0015788078308105469, 0.0019191503524780273, 0.002259492874145508, 0.0025998353958129883, 0.0029401779174804688, 0.0032805204391479492, 0.0036208629608154297, 0.00396120548248291, 0.004301548004150391, 0.004641890525817871, 0.0049822330474853516, 0.005322575569152832, 0.0056629180908203125, 0.006003260612487793, 0.0063436031341552734, 0.006683945655822754, 0.007024288177490234, 0.007364630699157715, 0.007704973220825195, 0.008045315742492676, 0.008385658264160156, 0.008726000785827637, 0.009066343307495117, 0.009406685829162598, 0.009747028350830078, 0.010087370872497559, 0.010427713394165039, 0.01076805591583252, 0.0111083984375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 1.0, 7.0, 3.0, 6.0, 6.0, 18.0, 13.0, 21.0, 18.0, 31.0, 23.0, 38.0, 37.0, 33.0, 37.0, 43.0, 45.0, 49.0, 48.0, 42.0, 43.0, 40.0, 36.0, 46.0, 33.0, 32.0, 39.0, 27.0, 35.0, 24.0, 16.0, 28.0, 8.0, 7.0, 12.0, 10.0, 8.0, 4.0, 3.0, 3.0, 7.0, 2.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.009368896484375, -0.00907433032989502, -0.008779764175415039, -0.008485198020935059, -0.008190631866455078, -0.007896065711975098, -0.007601499557495117, -0.007306933403015137, -0.007012367248535156, -0.006717801094055176, -0.006423234939575195, -0.006128668785095215, -0.005834102630615234, -0.005539536476135254, -0.0052449703216552734, -0.004950404167175293, -0.0046558380126953125, -0.004361271858215332, -0.0040667057037353516, -0.003772139549255371, -0.0034775733947753906, -0.00318300724029541, -0.0028884410858154297, -0.0025938749313354492, -0.0022993087768554688, -0.0020047426223754883, -0.0017101764678955078, -0.0014156103134155273, -0.0011210441589355469, -0.0008264780044555664, -0.0005319118499755859, -0.00023734569549560547, 5.7220458984375e-05, 0.00035178661346435547, 0.0006463527679443359, 0.0009409189224243164, 0.0012354850769042969, 0.0015300512313842773, 0.0018246173858642578, 0.0021191835403442383, 0.0024137496948242188, 0.0027083158493041992, 0.0030028820037841797, 0.00329744815826416, 0.0035920143127441406, 0.003886580467224121, 0.0041811466217041016, 0.004475712776184082, 0.0047702789306640625, 0.005064845085144043, 0.0053594112396240234, 0.005653977394104004, 0.005948543548583984, 0.006243109703063965, 0.006537675857543945, 0.006832242012023926, 0.007126808166503906, 0.007421374320983887, 0.007715940475463867, 0.008010506629943848, 0.008305072784423828, 0.008599638938903809, 0.008894205093383789, 0.00918877124786377, 0.00948333740234375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 5.0, 4.0, 2.0, 6.0, 10.0, 15.0, 18.0, 21.0, 41.0, 44.0, 67.0, 97.0, 121.0, 210.0, 306.0, 456.0, 853.0, 1436.0, 2687.0, 5477.0, 12867.0, 36577.0, 140166.0, 529620.0, 231238.0, 53715.0, 17783.0, 6925.0, 3340.0, 1759.0, 963.0, 567.0, 400.0, 220.0, 163.0, 116.0, 73.0, 53.0, 30.0, 28.0, 18.0, 12.0, 9.0, 11.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.00339508056640625, -0.0032971203327178955, -0.003199160099029541, -0.0031011998653411865, -0.003003239631652832, -0.0029052793979644775, -0.002807319164276123, -0.0027093589305877686, -0.002611398696899414, -0.0025134384632110596, -0.002415478229522705, -0.0023175179958343506, -0.002219557762145996, -0.0021215975284576416, -0.002023637294769287, -0.0019256770610809326, -0.0018277168273925781, -0.0017297565937042236, -0.0016317963600158691, -0.0015338361263275146, -0.0014358758926391602, -0.0013379156589508057, -0.0012399554252624512, -0.0011419951915740967, -0.0010440349578857422, -0.0009460747241973877, -0.0008481144905090332, -0.0007501542568206787, -0.0006521940231323242, -0.0005542337894439697, -0.00045627355575561523, -0.00035831332206726074, -0.00026035308837890625, -0.00016239285469055176, -6.443262100219727e-05, 3.3527612686157227e-05, 0.00013148784637451172, 0.0002294480800628662, 0.0003274083137512207, 0.0004253685474395752, 0.0005233287811279297, 0.0006212890148162842, 0.0007192492485046387, 0.0008172094821929932, 0.0009151697158813477, 0.0010131299495697021, 0.0011110901832580566, 0.0012090504169464111, 0.0013070106506347656, 0.0014049708843231201, 0.0015029311180114746, 0.001600891351699829, 0.0016988515853881836, 0.001796811819076538, 0.0018947720527648926, 0.001992732286453247, 0.0020906925201416016, 0.002188652753829956, 0.0022866129875183105, 0.002384573221206665, 0.0024825334548950195, 0.002580493688583374, 0.0026784539222717285, 0.002776414155960083, 0.0028743743896484375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 18.0, 11.0, 10.0, 29.0, 23.0, 24.0, 34.0, 38.0, 78.0, 36.0, 50.0, 62.0, 55.0, 63.0, 57.0, 51.0, 105.0, 38.0, 40.0, 32.0, 29.0, 28.0, 22.0, 7.0, 19.0, 9.0, 6.0, 3.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9669532775878906e-06, -1.8998980522155762e-06, -1.8328428268432617e-06, -1.7657876014709473e-06, -1.6987323760986328e-06, -1.6316771507263184e-06, -1.564621925354004e-06, -1.4975666999816895e-06, -1.430511474609375e-06, -1.3634562492370605e-06, -1.296401023864746e-06, -1.2293457984924316e-06, -1.1622905731201172e-06, -1.0952353477478027e-06, -1.0281801223754883e-06, -9.611248970031738e-07, -8.940696716308594e-07, -8.270144462585449e-07, -7.599592208862305e-07, -6.92903995513916e-07, -6.258487701416016e-07, -5.587935447692871e-07, -4.917383193969727e-07, -4.246830940246582e-07, -3.5762786865234375e-07, -2.905726432800293e-07, -2.2351741790771484e-07, -1.564621925354004e-07, -8.940696716308594e-08, -2.2351741790771484e-08, 4.470348358154297e-08, 1.1175870895385742e-07, 1.7881393432617188e-07, 2.4586915969848633e-07, 3.129243850708008e-07, 3.7997961044311523e-07, 4.470348358154297e-07, 5.140900611877441e-07, 5.811452865600586e-07, 6.48200511932373e-07, 7.152557373046875e-07, 7.82310962677002e-07, 8.493661880493164e-07, 9.164214134216309e-07, 9.834766387939453e-07, 1.0505318641662598e-06, 1.1175870895385742e-06, 1.1846423149108887e-06, 1.2516975402832031e-06, 1.3187527656555176e-06, 1.385807991027832e-06, 1.4528632164001465e-06, 1.519918441772461e-06, 1.5869736671447754e-06, 1.6540288925170898e-06, 1.7210841178894043e-06, 1.7881393432617188e-06, 1.8551945686340332e-06, 1.9222497940063477e-06, 1.989305019378662e-06, 2.0563602447509766e-06, 2.123415470123291e-06, 2.1904706954956055e-06, 2.25752592086792e-06, 2.3245811462402344e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 6.0, 5.0, 8.0, 21.0, 27.0, 31.0, 58.0, 86.0, 146.0, 273.0, 559.0, 1166.0, 2616.0, 7054.0, 22383.0, 123429.0, 700315.0, 151751.0, 25379.0, 7650.0, 2917.0, 1323.0, 595.0, 326.0, 171.0, 104.0, 57.0, 28.0, 18.0, 14.0, 11.0, 7.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005336761474609375, -0.005172789096832275, -0.005008816719055176, -0.004844844341278076, -0.0046808719635009766, -0.004516899585723877, -0.004352927207946777, -0.004188954830169678, -0.004024982452392578, -0.0038610100746154785, -0.003697037696838379, -0.0035330653190612793, -0.0033690929412841797, -0.00320512056350708, -0.0030411481857299805, -0.002877175807952881, -0.0027132034301757812, -0.0025492310523986816, -0.002385258674621582, -0.0022212862968444824, -0.002057313919067383, -0.0018933415412902832, -0.0017293691635131836, -0.001565396785736084, -0.0014014244079589844, -0.0012374520301818848, -0.0010734796524047852, -0.0009095072746276855, -0.0007455348968505859, -0.0005815625190734863, -0.0004175901412963867, -0.0002536177635192871, -8.96453857421875e-05, 7.432699203491211e-05, 0.00023829936981201172, 0.00040227174758911133, 0.0005662441253662109, 0.0007302165031433105, 0.0008941888809204102, 0.0010581612586975098, 0.0012221336364746094, 0.001386106014251709, 0.0015500783920288086, 0.0017140507698059082, 0.0018780231475830078, 0.0020419955253601074, 0.002205967903137207, 0.0023699402809143066, 0.0025339126586914062, 0.002697885036468506, 0.0028618574142456055, 0.003025829792022705, 0.0031898021697998047, 0.0033537745475769043, 0.003517746925354004, 0.0036817193031311035, 0.003845691680908203, 0.004009664058685303, 0.004173636436462402, 0.004337608814239502, 0.0045015811920166016, 0.004665553569793701, 0.004829525947570801, 0.0049934983253479, 0.005157470703125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 8.0, 7.0, 11.0, 9.0, 9.0, 15.0, 8.0, 19.0, 41.0, 44.0, 70.0, 95.0, 108.0, 119.0, 111.0, 78.0, 61.0, 50.0, 21.0, 19.0, 14.0, 17.0, 14.0, 5.0, 6.0, 6.0, 6.0, 7.0, 3.0, 3.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.004093170166015625, -0.003966212272644043, -0.003839254379272461, -0.003712296485900879, -0.003585338592529297, -0.003458380699157715, -0.003331422805786133, -0.0032044649124145508, -0.0030775070190429688, -0.0029505491256713867, -0.0028235912322998047, -0.0026966333389282227, -0.0025696754455566406, -0.0024427175521850586, -0.0023157596588134766, -0.0021888017654418945, -0.0020618438720703125, -0.0019348859786987305, -0.0018079280853271484, -0.0016809701919555664, -0.0015540122985839844, -0.0014270544052124023, -0.0013000965118408203, -0.0011731386184692383, -0.0010461807250976562, -0.0009192228317260742, -0.0007922649383544922, -0.0006653070449829102, -0.0005383491516113281, -0.0004113912582397461, -0.00028443336486816406, -0.00015747547149658203, -3.0517578125e-05, 9.644031524658203e-05, 0.00022339820861816406, 0.0003503561019897461, 0.0004773139953613281, 0.0006042718887329102, 0.0007312297821044922, 0.0008581876754760742, 0.0009851455688476562, 0.0011121034622192383, 0.0012390613555908203, 0.0013660192489624023, 0.0014929771423339844, 0.0016199350357055664, 0.0017468929290771484, 0.0018738508224487305, 0.0020008087158203125, 0.0021277666091918945, 0.0022547245025634766, 0.0023816823959350586, 0.0025086402893066406, 0.0026355981826782227, 0.0027625560760498047, 0.0028895139694213867, 0.0030164718627929688, 0.0031434297561645508, 0.003270387649536133, 0.003397345542907715, 0.003524303436279297, 0.003651261329650879, 0.003778219223022461, 0.003905177116394043, 0.004032135009765625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 6.0, 10.0, 32.0, 64.0, 125.0, 251.0, 253.0, 149.0, 63.0, 31.0, 11.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04601298272609711, -0.04351157322525978, -0.041010159999132156, -0.03850875049829483, -0.036007340997457504, -0.03350593149662018, -0.031004518270492554, -0.028503108769655228, -0.026001697406172752, -0.023500286042690277, -0.02099887654185295, -0.018497465178370476, -0.015996053814888, -0.013494644314050674, -0.0109932329505682, -0.008491823449730873, -0.005990412086248398, -0.0034890014212578535, -0.0009875907562673092, 0.0015138201415538788, 0.0040152305737137794, 0.00651664100587368, 0.009018052369356155, 0.011519461870193481, 0.014020873233675957, 0.016522284597158432, 0.019023694097995758, 0.021525105461478233, 0.02402651682496071, 0.026527926325798035, 0.02902933768928051, 0.03153074532747269, 0.03403215855360031, 0.03653356805443764, 0.03903498128056526, 0.04153639078140259, 0.044037800282239914, 0.04653920978307724, 0.049040623009204865, 0.05154203251004219, 0.05404344201087952, 0.05654485151171684, 0.05904626473784447, 0.06154767423868179, 0.06404908746480942, 0.06655049324035645, 0.06905190646648407, 0.0715533196926117, 0.07405473291873932, 0.07655614614486694, 0.07905755192041397, 0.0815589651465416, 0.08406037837266922, 0.08656178414821625, 0.08906319737434387, 0.0915646106004715, 0.09406601637601852, 0.09656742960214615, 0.09906883537769318, 0.1015702486038208, 0.10407166182994843, 0.10657306760549545, 0.10907448083162308, 0.1115758866071701, 0.11407729983329773]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 5.0, 8.0, 9.0, 5.0, 9.0, 12.0, 13.0, 15.0, 13.0, 25.0, 21.0, 28.0, 29.0, 32.0, 22.0, 34.0, 37.0, 26.0, 41.0, 27.0, 45.0, 47.0, 48.0, 32.0, 32.0, 47.0, 33.0, 39.0, 29.0, 29.0, 23.0, 23.0, 25.0, 16.0, 19.0, 15.0, 15.0, 7.0, 14.0, 9.0, 6.0, 7.0, 8.0, 3.0, 4.0, 5.0, 5.0, 1.0, 0.0, 0.0, 4.0, 4.0], "bins": [-0.028748035430908203, -0.02790858782827854, -0.02706914022564888, -0.02622969262301922, -0.025390245020389557, -0.024550797417759895, -0.023711349815130234, -0.022871902212500572, -0.02203245460987091, -0.02119300700724125, -0.020353559404611588, -0.019514111801981926, -0.018674664199352264, -0.017835216596722603, -0.01699576899409294, -0.01615632139146328, -0.015316873788833618, -0.014477426186203957, -0.013637978583574295, -0.012798530980944633, -0.011959083378314972, -0.01111963577568531, -0.010280188173055649, -0.009440740570425987, -0.008601292967796326, -0.007761845365166664, -0.0069223977625370026, -0.006082950159907341, -0.0052435025572776794, -0.004404054954648018, -0.0035646073520183563, -0.0027251597493886948, -0.0018857121467590332, -0.0010462645441293716, -0.00020681694149971008, 0.0006326306611299515, 0.001472078263759613, 0.0023115258663892746, 0.003150973469018936, 0.003990421071648598, 0.004829868674278259, 0.005669316276907921, 0.006508763879537582, 0.007348211482167244, 0.008187659084796906, 0.009027106687426567, 0.009866554290056229, 0.01070600189268589, 0.011545449495315552, 0.012384897097945213, 0.013224344700574875, 0.014063792303204536, 0.014903239905834198, 0.01574268750846386, 0.01658213511109352, 0.017421582713723183, 0.018261030316352844, 0.019100477918982506, 0.019939925521612167, 0.02077937312424183, 0.02161882072687149, 0.022458268329501152, 0.023297715932130814, 0.024137163534760475, 0.024976611137390137]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 8.0, 11.0, 12.0, 20.0, 26.0, 46.0, 74.0, 83.0, 164.0, 346.0, 784.0, 1808.0, 6458.0, 34289.0, 2136289.0, 1971862.0, 33016.0, 5849.0, 1740.0, 630.0, 303.0, 146.0, 94.0, 64.0, 36.0, 25.0, 22.0, 16.0, 14.0, 12.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01605224609375, -0.015565752983093262, -0.015079259872436523, -0.014592766761779785, -0.014106273651123047, -0.013619780540466309, -0.01313328742980957, -0.012646794319152832, -0.012160301208496094, -0.011673808097839355, -0.011187314987182617, -0.010700821876525879, -0.01021432876586914, -0.009727835655212402, -0.009241342544555664, -0.008754849433898926, -0.008268356323242188, -0.007781863212585449, -0.007295370101928711, -0.006808876991271973, -0.006322383880615234, -0.005835890769958496, -0.005349397659301758, -0.0048629045486450195, -0.004376411437988281, -0.003889918327331543, -0.0034034252166748047, -0.0029169321060180664, -0.002430438995361328, -0.0019439458847045898, -0.0014574527740478516, -0.0009709596633911133, -0.000484466552734375, 2.0265579223632812e-06, 0.0004885196685791016, 0.0009750127792358398, 0.0014615058898925781, 0.0019479990005493164, 0.0024344921112060547, 0.002920985221862793, 0.0034074783325195312, 0.0038939714431762695, 0.004380464553833008, 0.004866957664489746, 0.005353450775146484, 0.005839943885803223, 0.006326436996459961, 0.006812930107116699, 0.0072994232177734375, 0.007785916328430176, 0.008272409439086914, 0.008758902549743652, 0.00924539566040039, 0.009731888771057129, 0.010218381881713867, 0.010704874992370605, 0.011191368103027344, 0.011677861213684082, 0.01216435432434082, 0.012650847434997559, 0.013137340545654297, 0.013623833656311035, 0.014110326766967773, 0.014596819877624512, 0.01508331298828125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 2.0, 3.0, 5.0, 7.0, 5.0, 11.0, 15.0, 28.0, 44.0, 51.0, 64.0, 89.0, 89.0, 112.0, 94.0, 94.0, 71.0, 75.0, 46.0, 39.0, 25.0, 17.0, 7.0, 9.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.006725311279296875, -0.006491720676422119, -0.006258130073547363, -0.006024539470672607, -0.0057909488677978516, -0.005557358264923096, -0.00532376766204834, -0.005090177059173584, -0.004856586456298828, -0.004622995853424072, -0.004389405250549316, -0.0041558146476745605, -0.003922224044799805, -0.003688633441925049, -0.003455042839050293, -0.003221452236175537, -0.0029878616333007812, -0.0027542710304260254, -0.0025206804275512695, -0.0022870898246765137, -0.002053499221801758, -0.001819908618927002, -0.001586318016052246, -0.0013527274131774902, -0.0011191368103027344, -0.0008855462074279785, -0.0006519556045532227, -0.0004183650016784668, -0.00018477439880371094, 4.881620407104492e-05, 0.0002824068069458008, 0.0005159974098205566, 0.0007495880126953125, 0.0009831786155700684, 0.0012167692184448242, 0.00145035982131958, 0.001683950424194336, 0.0019175410270690918, 0.0021511316299438477, 0.0023847222328186035, 0.0026183128356933594, 0.0028519034385681152, 0.003085494041442871, 0.003319084644317627, 0.003552675247192383, 0.0037862658500671387, 0.0040198564529418945, 0.00425344705581665, 0.004487037658691406, 0.004720628261566162, 0.004954218864440918, 0.005187809467315674, 0.00542140007019043, 0.0056549906730651855, 0.005888581275939941, 0.006122171878814697, 0.006355762481689453, 0.006589353084564209, 0.006822943687438965, 0.007056534290313721, 0.0072901248931884766, 0.007523715496063232, 0.007757306098937988, 0.007990896701812744, 0.0082244873046875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 1.0, 9.0, 10.0, 13.0, 21.0, 24.0, 35.0, 43.0, 46.0, 100.0, 147.0, 221.0, 325.0, 485.0, 765.0, 1366.0, 2303.0, 4980.0, 12277.0, 38523.0, 199886.0, 3286346.0, 549097.0, 65806.0, 17745.0, 6474.0, 3073.0, 1510.0, 865.0, 566.0, 343.0, 253.0, 164.0, 120.0, 108.0, 63.0, 46.0, 30.0, 23.0, 16.0, 16.0, 11.0, 14.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0080413818359375, -0.007779359817504883, -0.007517337799072266, -0.0072553157806396484, -0.006993293762207031, -0.006731271743774414, -0.006469249725341797, -0.00620722770690918, -0.0059452056884765625, -0.005683183670043945, -0.005421161651611328, -0.005159139633178711, -0.004897117614746094, -0.0046350955963134766, -0.004373073577880859, -0.004111051559448242, -0.003849029541015625, -0.003587007522583008, -0.0033249855041503906, -0.0030629634857177734, -0.0028009414672851562, -0.002538919448852539, -0.002276897430419922, -0.0020148754119873047, -0.0017528533935546875, -0.0014908313751220703, -0.0012288093566894531, -0.0009667873382568359, -0.0007047653198242188, -0.00044274330139160156, -0.00018072128295898438, 8.130073547363281e-05, 0.00034332275390625, 0.0006053447723388672, 0.0008673667907714844, 0.0011293888092041016, 0.0013914108276367188, 0.001653432846069336, 0.0019154548645019531, 0.0021774768829345703, 0.0024394989013671875, 0.0027015209197998047, 0.002963542938232422, 0.003225564956665039, 0.0034875869750976562, 0.0037496089935302734, 0.004011631011962891, 0.004273653030395508, 0.004535675048828125, 0.004797697067260742, 0.005059719085693359, 0.0053217411041259766, 0.005583763122558594, 0.005845785140991211, 0.006107807159423828, 0.006369829177856445, 0.0066318511962890625, 0.00689387321472168, 0.007155895233154297, 0.007417917251586914, 0.007679939270019531, 0.007941961288452148, 0.008203983306884766, 0.008466005325317383, 0.00872802734375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 5.0, 5.0, 10.0, 16.0, 23.0, 52.0, 45.0, 97.0, 215.0, 666.0, 1607.0, 834.0, 267.0, 94.0, 64.0, 22.0, 19.0, 16.0, 8.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00814056396484375, -0.0078095197677612305, -0.007478475570678711, -0.007147431373596191, -0.006816387176513672, -0.006485342979431152, -0.006154298782348633, -0.005823254585266113, -0.005492210388183594, -0.005161166191101074, -0.004830121994018555, -0.004499077796936035, -0.004168033599853516, -0.003836989402770996, -0.0035059452056884766, -0.003174901008605957, -0.0028438568115234375, -0.002512812614440918, -0.0021817684173583984, -0.001850724220275879, -0.0015196800231933594, -0.0011886358261108398, -0.0008575916290283203, -0.0005265474319458008, -0.00019550323486328125, 0.00013554096221923828, 0.0004665851593017578, 0.0007976293563842773, 0.0011286735534667969, 0.0014597177505493164, 0.001790761947631836, 0.0021218061447143555, 0.002452850341796875, 0.0027838945388793945, 0.003114938735961914, 0.0034459829330444336, 0.003777027130126953, 0.004108071327209473, 0.004439115524291992, 0.004770159721374512, 0.005101203918457031, 0.005432248115539551, 0.00576329231262207, 0.00609433650970459, 0.006425380706787109, 0.006756424903869629, 0.0070874691009521484, 0.007418513298034668, 0.0077495574951171875, 0.008080601692199707, 0.008411645889282227, 0.008742690086364746, 0.009073734283447266, 0.009404778480529785, 0.009735822677612305, 0.010066866874694824, 0.010397911071777344, 0.010728955268859863, 0.011059999465942383, 0.011391043663024902, 0.011722087860107422, 0.012053132057189941, 0.012384176254272461, 0.01271522045135498, 0.0130462646484375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 7.0, 3.0, 2.0, 3.0, 5.0, 6.0, 17.0, 20.0, 32.0, 36.0, 53.0, 60.0, 88.0, 113.0, 133.0, 108.0, 104.0, 66.0, 42.0, 34.0, 23.0, 14.0, 16.0, 6.0, 2.0, 4.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02303050272166729, -0.022199442610144615, -0.02136838249862194, -0.020537322387099266, -0.01970626413822174, -0.018875204026699066, -0.01804414391517639, -0.017213083803653717, -0.016382023692131042, -0.015550963580608368, -0.014719903469085693, -0.013888844288885593, -0.013057784177362919, -0.012226724065840244, -0.011395664885640144, -0.01056460477411747, -0.009733544662594795, -0.00890248455107212, -0.008071424439549446, -0.007240365259349346, -0.006409305147826672, -0.005578245036303997, -0.00474718539044261, -0.0039161257445812225, -0.003085065633058548, -0.002254005754366517, -0.0014229458756744862, -0.0005918859969824553, 0.00023917388170957565, 0.0010702339932322502, 0.0019012936390936375, 0.0027323532849550247, 0.00356341153383255, 0.004394471645355225, 0.005225531291216612, 0.006056590937077999, 0.006887651048600674, 0.007718711160123348, 0.008549770340323448, 0.009380830451846123, 0.010211890563368797, 0.011042950674891472, 0.011874010786414146, 0.012705069966614246, 0.013536130078136921, 0.014367190189659595, 0.015198249369859695, 0.01602930948138237, 0.016860369592905045, 0.01769142970442772, 0.018522489815950394, 0.019353549927473068, 0.020184610038995743, 0.021015670150518417, 0.021846728399395943, 0.022677788510918617, 0.023508848622441292, 0.024339908733963966, 0.02517096884548664, 0.026002028957009315, 0.02683308720588684, 0.027664147317409515, 0.02849520742893219, 0.029326267540454865, 0.03015732765197754]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 4.0, 10.0, 5.0, 12.0, 11.0, 16.0, 14.0, 29.0, 31.0, 30.0, 42.0, 36.0, 45.0, 47.0, 56.0, 52.0, 43.0, 45.0, 53.0, 42.0, 41.0, 52.0, 43.0, 50.0, 28.0, 29.0, 20.0, 21.0, 20.0, 10.0, 16.0, 8.0, 8.0, 8.0, 2.0, 4.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.02463662624359131, -0.023985883221030235, -0.023335140198469162, -0.02268439717590809, -0.022033654153347015, -0.021382911130785942, -0.02073216810822487, -0.020081425085663795, -0.019430682063102722, -0.01877993904054165, -0.018129196017980576, -0.017478452995419502, -0.01682770997285843, -0.016176966950297356, -0.015526223927736282, -0.014875480905175209, -0.014224737882614136, -0.013573994860053062, -0.01292325183749199, -0.012272508814930916, -0.011621765792369843, -0.01097102276980877, -0.010320279747247696, -0.009669536724686623, -0.00901879370212555, -0.008368050679564476, -0.007717307657003403, -0.007066564634442329, -0.006415821611881256, -0.005765078589320183, -0.0051143355667591095, -0.004463592544198036, -0.003812849521636963, -0.0031621064990758896, -0.0025113634765148163, -0.001860620453953743, -0.0012098774313926697, -0.0005591344088315964, 9.160861372947693e-05, 0.0007423516362905502, 0.0013930946588516235, 0.002043837681412697, 0.00269458070397377, 0.0033453237265348434, 0.003996066749095917, 0.00464680977165699, 0.005297552794218063, 0.005948295816779137, 0.00659903883934021, 0.007249781861901283, 0.007900524884462357, 0.00855126790702343, 0.009202010929584503, 0.009852753952145576, 0.01050349697470665, 0.011154239997267723, 0.011804983019828796, 0.01245572604238987, 0.013106469064950943, 0.013757212087512016, 0.01440795511007309, 0.015058698132634163, 0.015709441155195236, 0.01636018417775631, 0.017010927200317383]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 4.0, 16.0, 15.0, 23.0, 20.0, 24.0, 54.0, 65.0, 110.0, 165.0, 271.0, 499.0, 899.0, 2372.0, 9081.0, 50408.0, 457287.0, 462370.0, 51178.0, 9055.0, 2458.0, 937.0, 467.0, 273.0, 171.0, 94.0, 71.0, 37.0, 33.0, 28.0, 14.0, 8.0, 9.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0220947265625, -0.021481037139892578, -0.020867347717285156, -0.020253658294677734, -0.019639968872070312, -0.01902627944946289, -0.01841259002685547, -0.017798900604248047, -0.017185211181640625, -0.016571521759033203, -0.01595783233642578, -0.01534414291381836, -0.014730453491210938, -0.014116764068603516, -0.013503074645996094, -0.012889385223388672, -0.01227569580078125, -0.011662006378173828, -0.011048316955566406, -0.010434627532958984, -0.009820938110351562, -0.00920724868774414, -0.008593559265136719, -0.007979869842529297, -0.007366180419921875, -0.006752490997314453, -0.006138801574707031, -0.005525112152099609, -0.0049114227294921875, -0.004297733306884766, -0.0036840438842773438, -0.003070354461669922, -0.0024566650390625, -0.0018429756164550781, -0.0012292861938476562, -0.0006155967712402344, -1.9073486328125e-06, 0.0006117820739746094, 0.0012254714965820312, 0.0018391609191894531, 0.002452850341796875, 0.003066539764404297, 0.0036802291870117188, 0.004293918609619141, 0.0049076080322265625, 0.005521297454833984, 0.006134986877441406, 0.006748676300048828, 0.00736236572265625, 0.007976055145263672, 0.008589744567871094, 0.009203433990478516, 0.009817123413085938, 0.01043081283569336, 0.011044502258300781, 0.011658191680908203, 0.012271881103515625, 0.012885570526123047, 0.013499259948730469, 0.01411294937133789, 0.014726638793945312, 0.015340328216552734, 0.015954017639160156, 0.016567707061767578, 0.017181396484375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 14.0, 19.0, 23.0, 31.0, 54.0, 72.0, 93.0, 98.0, 110.0, 114.0, 95.0, 82.0, 73.0, 45.0, 24.0, 26.0, 13.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0081024169921875, -0.007846474647521973, -0.007590532302856445, -0.007334589958190918, -0.007078647613525391, -0.006822705268859863, -0.006566762924194336, -0.006310820579528809, -0.006054878234863281, -0.005798935890197754, -0.0055429935455322266, -0.005287051200866699, -0.005031108856201172, -0.0047751665115356445, -0.004519224166870117, -0.00426328182220459, -0.0040073394775390625, -0.003751397132873535, -0.003495454788208008, -0.0032395124435424805, -0.002983570098876953, -0.0027276277542114258, -0.0024716854095458984, -0.002215743064880371, -0.0019598007202148438, -0.0017038583755493164, -0.001447916030883789, -0.0011919736862182617, -0.0009360313415527344, -0.000680088996887207, -0.0004241466522216797, -0.00016820430755615234, 8.7738037109375e-05, 0.00034368038177490234, 0.0005996227264404297, 0.000855565071105957, 0.0011115074157714844, 0.0013674497604370117, 0.001623392105102539, 0.0018793344497680664, 0.0021352767944335938, 0.002391219139099121, 0.0026471614837646484, 0.0029031038284301758, 0.003159046173095703, 0.0034149885177612305, 0.003670930862426758, 0.003926873207092285, 0.0041828155517578125, 0.00443875789642334, 0.004694700241088867, 0.0049506425857543945, 0.005206584930419922, 0.005462527275085449, 0.0057184696197509766, 0.005974411964416504, 0.006230354309082031, 0.006486296653747559, 0.006742238998413086, 0.006998181343078613, 0.007254123687744141, 0.007510066032409668, 0.007766008377075195, 0.008021950721740723, 0.00827789306640625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 12.0, 9.0, 15.0, 18.0, 18.0, 34.0, 55.0, 76.0, 109.0, 178.0, 324.0, 580.0, 1044.0, 2352.0, 5322.0, 13365.0, 37211.0, 119891.0, 418905.0, 317114.0, 85279.0, 27950.0, 10489.0, 4202.0, 1832.0, 936.0, 476.0, 282.0, 170.0, 101.0, 61.0, 51.0, 26.0, 16.0, 24.0, 8.0, 11.0, 4.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00962066650390625, -0.009336590766906738, -0.009052515029907227, -0.008768439292907715, -0.008484363555908203, -0.008200287818908691, -0.00791621208190918, -0.007632136344909668, -0.007348060607910156, -0.0070639848709106445, -0.006779909133911133, -0.006495833396911621, -0.006211757659912109, -0.005927681922912598, -0.005643606185913086, -0.005359530448913574, -0.0050754547119140625, -0.004791378974914551, -0.004507303237915039, -0.004223227500915527, -0.003939151763916016, -0.003655076026916504, -0.003371000289916992, -0.0030869245529174805, -0.0028028488159179688, -0.002518773078918457, -0.0022346973419189453, -0.0019506216049194336, -0.0016665458679199219, -0.0013824701309204102, -0.0010983943939208984, -0.0008143186569213867, -0.000530242919921875, -0.0002461671829223633, 3.790855407714844e-05, 0.00032198429107666016, 0.0006060600280761719, 0.0008901357650756836, 0.0011742115020751953, 0.001458287239074707, 0.0017423629760742188, 0.0020264387130737305, 0.002310514450073242, 0.002594590187072754, 0.0028786659240722656, 0.0031627416610717773, 0.003446817398071289, 0.0037308931350708008, 0.0040149688720703125, 0.004299044609069824, 0.004583120346069336, 0.004867196083068848, 0.005151271820068359, 0.005435347557067871, 0.005719423294067383, 0.0060034990310668945, 0.006287574768066406, 0.006571650505065918, 0.00685572624206543, 0.007139801979064941, 0.007423877716064453, 0.007707953453063965, 0.007992029190063477, 0.008276104927062988, 0.0085601806640625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 5.0, 8.0, 11.0, 7.0, 16.0, 13.0, 21.0, 24.0, 25.0, 22.0, 24.0, 38.0, 22.0, 35.0, 40.0, 54.0, 55.0, 45.0, 46.0, 34.0, 62.0, 37.0, 44.0, 36.0, 35.0, 23.0, 29.0, 36.0, 31.0, 21.0, 20.0, 20.0, 11.0, 10.0, 8.0, 7.0, 5.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0096893310546875, -0.009404540061950684, -0.009119749069213867, -0.00883495807647705, -0.008550167083740234, -0.008265376091003418, -0.007980585098266602, -0.007695794105529785, -0.007411003112792969, -0.007126212120056152, -0.006841421127319336, -0.0065566301345825195, -0.006271839141845703, -0.005987048149108887, -0.00570225715637207, -0.005417466163635254, -0.0051326751708984375, -0.004847884178161621, -0.004563093185424805, -0.004278302192687988, -0.003993511199951172, -0.0037087202072143555, -0.003423929214477539, -0.0031391382217407227, -0.0028543472290039062, -0.00256955623626709, -0.0022847652435302734, -0.001999974250793457, -0.0017151832580566406, -0.0014303922653198242, -0.0011456012725830078, -0.0008608102798461914, -0.000576019287109375, -0.0002912282943725586, -6.4373016357421875e-06, 0.0002783536911010742, 0.0005631446838378906, 0.000847935676574707, 0.0011327266693115234, 0.0014175176620483398, 0.0017023086547851562, 0.0019870996475219727, 0.002271890640258789, 0.0025566816329956055, 0.002841472625732422, 0.0031262636184692383, 0.0034110546112060547, 0.003695845603942871, 0.0039806365966796875, 0.004265427589416504, 0.00455021858215332, 0.004835009574890137, 0.005119800567626953, 0.0054045915603637695, 0.005689382553100586, 0.005974173545837402, 0.006258964538574219, 0.006543755531311035, 0.0068285465240478516, 0.007113337516784668, 0.007398128509521484, 0.007682919502258301, 0.007967710494995117, 0.008252501487731934, 0.00853729248046875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 8.0, 9.0, 23.0, 34.0, 38.0, 74.0, 123.0, 186.0, 330.0, 567.0, 1065.0, 2151.0, 4557.0, 11293.0, 31332.0, 103907.0, 407089.0, 351785.0, 88396.0, 27315.0, 9981.0, 4093.0, 1889.0, 958.0, 562.0, 291.0, 167.0, 123.0, 65.0, 50.0, 30.0, 19.0, 10.0, 10.0, 3.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.003448486328125, -0.003352522850036621, -0.003256559371948242, -0.0031605958938598633, -0.0030646324157714844, -0.0029686689376831055, -0.0028727054595947266, -0.0027767419815063477, -0.0026807785034179688, -0.00258481502532959, -0.002488851547241211, -0.002392888069152832, -0.002296924591064453, -0.0022009611129760742, -0.0021049976348876953, -0.0020090341567993164, -0.0019130706787109375, -0.0018171072006225586, -0.0017211437225341797, -0.0016251802444458008, -0.0015292167663574219, -0.001433253288269043, -0.001337289810180664, -0.0012413263320922852, -0.0011453628540039062, -0.0010493993759155273, -0.0009534358978271484, -0.0008574724197387695, -0.0007615089416503906, -0.0006655454635620117, -0.0005695819854736328, -0.0004736185073852539, -0.000377655029296875, -0.0002816915512084961, -0.0001857280731201172, -8.976459503173828e-05, 6.198883056640625e-06, 0.00010216236114501953, 0.00019812583923339844, 0.00029408931732177734, 0.00039005279541015625, 0.00048601627349853516, 0.0005819797515869141, 0.000677943229675293, 0.0007739067077636719, 0.0008698701858520508, 0.0009658336639404297, 0.0010617971420288086, 0.0011577606201171875, 0.0012537240982055664, 0.0013496875762939453, 0.0014456510543823242, 0.0015416145324707031, 0.001637578010559082, 0.001733541488647461, 0.0018295049667358398, 0.0019254684448242188, 0.0020214319229125977, 0.0021173954010009766, 0.0022133588790893555, 0.0023093223571777344, 0.0024052858352661133, 0.002501249313354492, 0.002597212791442871, 0.00269317626953125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 6.0, 4.0, 7.0, 0.0, 13.0, 6.0, 9.0, 10.0, 0.0, 28.0, 32.0, 32.0, 0.0, 21.0, 36.0, 41.0, 42.0, 0.0, 48.0, 58.0, 47.0, 0.0, 59.0, 76.0, 58.0, 44.0, 0.0, 63.0, 55.0, 37.0, 33.0, 0.0, 31.0, 24.0, 21.0, 0.0, 21.0, 15.0, 11.0, 4.0, 0.0, 3.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4901161193847656e-06, -1.4435499906539917e-06, -1.3969838619232178e-06, -1.3504177331924438e-06, -1.30385160446167e-06, -1.257285475730896e-06, -1.210719347000122e-06, -1.1641532182693481e-06, -1.1175870895385742e-06, -1.0710209608078003e-06, -1.0244548320770264e-06, -9.778887033462524e-07, -9.313225746154785e-07, -8.847564458847046e-07, -8.381903171539307e-07, -7.916241884231567e-07, -7.450580596923828e-07, -6.984919309616089e-07, -6.51925802230835e-07, -6.05359673500061e-07, -5.587935447692871e-07, -5.122274160385132e-07, -4.6566128730773926e-07, -4.1909515857696533e-07, -3.725290298461914e-07, -3.259629011154175e-07, -2.7939677238464355e-07, -2.3283064365386963e-07, -1.862645149230957e-07, -1.3969838619232178e-07, -9.313225746154785e-08, -4.6566128730773926e-08, 0.0, 4.6566128730773926e-08, 9.313225746154785e-08, 1.3969838619232178e-07, 1.862645149230957e-07, 2.3283064365386963e-07, 2.7939677238464355e-07, 3.259629011154175e-07, 3.725290298461914e-07, 4.1909515857696533e-07, 4.6566128730773926e-07, 5.122274160385132e-07, 5.587935447692871e-07, 6.05359673500061e-07, 6.51925802230835e-07, 6.984919309616089e-07, 7.450580596923828e-07, 7.916241884231567e-07, 8.381903171539307e-07, 8.847564458847046e-07, 9.313225746154785e-07, 9.778887033462524e-07, 1.0244548320770264e-06, 1.0710209608078003e-06, 1.1175870895385742e-06, 1.1641532182693481e-06, 1.210719347000122e-06, 1.257285475730896e-06, 1.30385160446167e-06, 1.3504177331924438e-06, 1.3969838619232178e-06, 1.4435499906539917e-06, 1.4901161193847656e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 7.0, 8.0, 11.0, 29.0, 27.0, 50.0, 80.0, 139.0, 202.0, 374.0, 716.0, 1392.0, 3094.0, 7744.0, 22820.0, 91706.0, 506056.0, 329274.0, 58148.0, 16041.0, 5756.0, 2319.0, 1105.0, 616.0, 315.0, 206.0, 115.0, 75.0, 44.0, 25.0, 14.0, 15.0, 11.0, 2.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00418853759765625, -0.0040610432624816895, -0.003933548927307129, -0.0038060545921325684, -0.003678560256958008, -0.0035510659217834473, -0.0034235715866088867, -0.003296077251434326, -0.0031685829162597656, -0.003041088581085205, -0.0029135942459106445, -0.002786099910736084, -0.0026586055755615234, -0.002531111240386963, -0.0024036169052124023, -0.002276122570037842, -0.0021486282348632812, -0.0020211338996887207, -0.0018936395645141602, -0.0017661452293395996, -0.001638650894165039, -0.0015111565589904785, -0.001383662223815918, -0.0012561678886413574, -0.0011286735534667969, -0.0010011792182922363, -0.0008736848831176758, -0.0007461905479431152, -0.0006186962127685547, -0.0004912018775939941, -0.0003637075424194336, -0.00023621320724487305, -0.0001087188720703125, 1.8775463104248047e-05, 0.0001462697982788086, 0.00027376413345336914, 0.0004012584686279297, 0.0005287528038024902, 0.0006562471389770508, 0.0007837414741516113, 0.0009112358093261719, 0.0010387301445007324, 0.001166224479675293, 0.0012937188148498535, 0.001421213150024414, 0.0015487074851989746, 0.0016762018203735352, 0.0018036961555480957, 0.0019311904907226562, 0.002058684825897217, 0.0021861791610717773, 0.002313673496246338, 0.0024411678314208984, 0.002568662166595459, 0.0026961565017700195, 0.00282365083694458, 0.0029511451721191406, 0.003078639507293701, 0.0032061338424682617, 0.0033336281776428223, 0.003461122512817383, 0.0035886168479919434, 0.003716111183166504, 0.0038436055183410645, 0.003971099853515625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 4.0, 8.0, 12.0, 13.0, 16.0, 15.0, 38.0, 42.0, 66.0, 79.0, 111.0, 131.0, 125.0, 91.0, 80.0, 54.0, 30.0, 19.0, 14.0, 10.0, 11.0, 7.0, 0.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0036945343017578125, -0.0035754144191741943, -0.003456294536590576, -0.003337174654006958, -0.00321805477142334, -0.0030989348888397217, -0.0029798150062561035, -0.0028606951236724854, -0.002741575241088867, -0.002622455358505249, -0.002503335475921631, -0.0023842155933380127, -0.0022650957107543945, -0.0021459758281707764, -0.002026855945587158, -0.00190773606300354, -0.0017886161804199219, -0.0016694962978363037, -0.0015503764152526855, -0.0014312565326690674, -0.0013121366500854492, -0.001193016767501831, -0.0010738968849182129, -0.0009547770023345947, -0.0008356571197509766, -0.0007165372371673584, -0.0005974173545837402, -0.00047829747200012207, -0.0003591775894165039, -0.00024005770683288574, -0.00012093782424926758, -1.817941665649414e-06, 0.00011730194091796875, 0.00023642182350158691, 0.0003555417060852051, 0.00047466158866882324, 0.0005937814712524414, 0.0007129013538360596, 0.0008320212364196777, 0.0009511411190032959, 0.001070261001586914, 0.0011893808841705322, 0.0013085007667541504, 0.0014276206493377686, 0.0015467405319213867, 0.0016658604145050049, 0.001784980297088623, 0.0019041001796722412, 0.0020232200622558594, 0.0021423399448394775, 0.0022614598274230957, 0.002380579710006714, 0.002499699592590332, 0.00261881947517395, 0.0027379393577575684, 0.0028570592403411865, 0.0029761791229248047, 0.003095299005508423, 0.003214418888092041, 0.003333538770675659, 0.0034526586532592773, 0.0035717785358428955, 0.0036908984184265137, 0.003810018301010132, 0.00392913818359375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 10.0, 18.0, 19.0, 39.0, 80.0, 121.0, 145.0, 188.0, 170.0, 104.0, 40.0, 26.0, 21.0, 8.0, 5.0, 4.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0295428317040205, -0.028162427246570587, -0.026782024651765823, -0.02540162019431591, -0.024021215736865997, -0.022640813142061234, -0.02126040868461132, -0.019880004227161407, -0.018499601632356644, -0.01711919717490673, -0.015738794580101967, -0.014358390122652054, -0.01297798566520214, -0.011597582139074802, -0.010217178612947464, -0.008836774155497551, -0.007456369698047638, -0.006075965706259012, -0.0046955617144703865, -0.003315158188343048, -0.0019347541965544224, -0.0005543502047657967, 0.0008260533213615417, 0.0022064577788114548, 0.003586861304938793, 0.004967265296727419, 0.006347669288516045, 0.007728072814643383, 0.009108476340770721, 0.010488880798220634, 0.011869284324347973, 0.013249688781797886, 0.014630090445280075, 0.016010494902729988, 0.017390897497534752, 0.018771301954984665, 0.020151706412434578, 0.02153211086988449, 0.022912513464689255, 0.024292917922139168, 0.02567332237958908, 0.027053726837038994, 0.028434129431843758, 0.02981453388929367, 0.031194938346743584, 0.0325753428041935, 0.03395574539899826, 0.03533615171909332, 0.03671655058860779, 0.03809695318341255, 0.039477359503507614, 0.04085776209831238, 0.04223816469311714, 0.043618571013212204, 0.04499897360801697, 0.04637937992811203, 0.047759782522916794, 0.04914018511772156, 0.05052059143781662, 0.051900994032621384, 0.05328139662742615, 0.05466180294752121, 0.056042205542325974, 0.05742260813713074, 0.0588030144572258]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 4.0, 6.0, 13.0, 8.0, 10.0, 19.0, 19.0, 28.0, 16.0, 27.0, 24.0, 36.0, 27.0, 28.0, 40.0, 46.0, 33.0, 47.0, 44.0, 38.0, 30.0, 40.0, 33.0, 37.0, 38.0, 37.0, 32.0, 22.0, 35.0, 23.0, 19.0, 26.0, 14.0, 16.0, 15.0, 8.0, 8.0, 8.0, 12.0, 5.0, 4.0, 3.0, 6.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.021200120449066162, -0.020542558282613754, -0.019884994253516197, -0.01922743022441864, -0.018569868057966232, -0.017912305891513824, -0.017254741862416267, -0.01659717783331871, -0.015939615666866302, -0.01528205256909132, -0.014624489471316338, -0.013966926373541355, -0.013309363275766373, -0.01265180017799139, -0.011994237080216408, -0.011336673982441425, -0.010679110884666443, -0.01002154778689146, -0.009363984689116478, -0.008706421591341496, -0.008048858493566513, -0.007391295395791531, -0.006733732298016548, -0.006076169200241566, -0.005418606102466583, -0.004761043004691601, -0.004103479906916618, -0.003445916809141636, -0.0027883537113666534, -0.002130790613591671, -0.0014732275158166885, -0.0008156644180417061, -0.00015810132026672363, 0.0004994617775082588, 0.0011570248752832413, 0.0018145879730582237, 0.002472151070833206, 0.0031297141686081886, 0.003787277266383171, 0.0044448403641581535, 0.005102403461933136, 0.0057599665597081184, 0.006417529657483101, 0.007075092755258083, 0.007732655853033066, 0.008390218950808048, 0.00904778204858303, 0.009705345146358013, 0.010362908244132996, 0.011020471341907978, 0.01167803443968296, 0.012335597537457943, 0.012993160635232925, 0.013650723733007908, 0.01430828683078289, 0.014965849928557873, 0.015623413026332855, 0.016280975192785263, 0.01693853922188282, 0.017596103250980377, 0.018253665417432785, 0.018911227583885193, 0.01956879161298275, 0.020226355642080307, 0.020883917808532715]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 9.0, 14.0, 13.0, 18.0, 29.0, 47.0, 61.0, 86.0, 188.0, 395.0, 1046.0, 3447.0, 18899.0, 464180.0, 3653713.0, 43428.0, 6189.0, 1467.0, 491.0, 220.0, 106.0, 68.0, 48.0, 34.0, 28.0, 10.0, 13.0, 5.0, 6.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018035888671875, -0.01745772361755371, -0.016879558563232422, -0.016301393508911133, -0.015723228454589844, -0.015145063400268555, -0.014566898345947266, -0.013988733291625977, -0.013410568237304688, -0.012832403182983398, -0.01225423812866211, -0.01167607307434082, -0.011097908020019531, -0.010519742965698242, -0.009941577911376953, -0.009363412857055664, -0.008785247802734375, -0.008207082748413086, -0.007628917694091797, -0.007050752639770508, -0.006472587585449219, -0.00589442253112793, -0.005316257476806641, -0.0047380924224853516, -0.0041599273681640625, -0.0035817623138427734, -0.0030035972595214844, -0.0024254322052001953, -0.0018472671508789062, -0.0012691020965576172, -0.0006909370422363281, -0.00011277198791503906, 0.00046539306640625, 0.001043558120727539, 0.0016217231750488281, 0.002199888229370117, 0.0027780532836914062, 0.0033562183380126953, 0.003934383392333984, 0.0045125484466552734, 0.0050907135009765625, 0.0056688785552978516, 0.006247043609619141, 0.00682520866394043, 0.007403373718261719, 0.007981538772583008, 0.008559703826904297, 0.009137868881225586, 0.009716033935546875, 0.010294198989868164, 0.010872364044189453, 0.011450529098510742, 0.012028694152832031, 0.01260685920715332, 0.01318502426147461, 0.013763189315795898, 0.014341354370117188, 0.014919519424438477, 0.015497684478759766, 0.016075849533081055, 0.016654014587402344, 0.017232179641723633, 0.017810344696044922, 0.01838850975036621, 0.0189666748046875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 11.0, 14.0, 15.0, 27.0, 34.0, 51.0, 68.0, 84.0, 101.0, 95.0, 114.0, 97.0, 96.0, 64.0, 54.0, 27.0, 19.0, 14.0, 11.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00698089599609375, -0.0067386627197265625, -0.006496429443359375, -0.0062541961669921875, -0.006011962890625, -0.0057697296142578125, -0.005527496337890625, -0.0052852630615234375, -0.00504302978515625, -0.0048007965087890625, -0.004558563232421875, -0.0043163299560546875, -0.0040740966796875, -0.0038318634033203125, -0.003589630126953125, -0.0033473968505859375, -0.00310516357421875, -0.0028629302978515625, -0.002620697021484375, -0.0023784637451171875, -0.00213623046875, -0.0018939971923828125, -0.001651763916015625, -0.0014095306396484375, -0.00116729736328125, -0.0009250640869140625, -0.000682830810546875, -0.0004405975341796875, -0.0001983642578125, 4.38690185546875e-05, 0.000286102294921875, 0.0005283355712890625, 0.00077056884765625, 0.0010128021240234375, 0.001255035400390625, 0.0014972686767578125, 0.001739501953125, 0.0019817352294921875, 0.002223968505859375, 0.0024662017822265625, 0.00270843505859375, 0.0029506683349609375, 0.003192901611328125, 0.0034351348876953125, 0.0036773681640625, 0.0039196014404296875, 0.004161834716796875, 0.0044040679931640625, 0.00464630126953125, 0.0048885345458984375, 0.005130767822265625, 0.0053730010986328125, 0.005615234375, 0.0058574676513671875, 0.006099700927734375, 0.0063419342041015625, 0.00658416748046875, 0.0068264007568359375, 0.007068634033203125, 0.0073108673095703125, 0.0075531005859375, 0.0077953338623046875, 0.008037567138671875, 0.008279800415039062, 0.00852203369140625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 4.0, 17.0, 22.0, 35.0, 32.0, 43.0, 65.0, 81.0, 128.0, 182.0, 306.0, 504.0, 950.0, 1904.0, 4121.0, 9715.0, 27113.0, 94330.0, 956961.0, 2879756.0, 156149.0, 38347.0, 13085.0, 5121.0, 2413.0, 1148.0, 590.0, 357.0, 219.0, 162.0, 118.0, 74.0, 69.0, 41.0, 26.0, 28.0, 16.0, 14.0, 11.0, 10.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.006832122802734375, -0.00658947229385376, -0.0063468217849731445, -0.006104171276092529, -0.005861520767211914, -0.005618870258331299, -0.005376219749450684, -0.005133569240570068, -0.004890918731689453, -0.004648268222808838, -0.004405617713928223, -0.004162967205047607, -0.003920316696166992, -0.003677666187286377, -0.0034350156784057617, -0.0031923651695251465, -0.0029497146606445312, -0.002707064151763916, -0.0024644136428833008, -0.0022217631340026855, -0.0019791126251220703, -0.001736462116241455, -0.0014938116073608398, -0.0012511610984802246, -0.0010085105895996094, -0.0007658600807189941, -0.0005232095718383789, -0.00028055906295776367, -3.790855407714844e-05, 0.0002047419548034668, 0.00044739246368408203, 0.0006900429725646973, 0.0009326934814453125, 0.0011753439903259277, 0.001417994499206543, 0.0016606450080871582, 0.0019032955169677734, 0.0021459460258483887, 0.002388596534729004, 0.002631247043609619, 0.0028738975524902344, 0.0031165480613708496, 0.003359198570251465, 0.00360184907913208, 0.0038444995880126953, 0.0040871500968933105, 0.004329800605773926, 0.004572451114654541, 0.004815101623535156, 0.0050577521324157715, 0.005300402641296387, 0.005543053150177002, 0.005785703659057617, 0.006028354167938232, 0.006271004676818848, 0.006513655185699463, 0.006756305694580078, 0.006998956203460693, 0.007241606712341309, 0.007484257221221924, 0.007726907730102539, 0.007969558238983154, 0.00821220874786377, 0.008454859256744385, 0.008697509765625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 13.0, 15.0, 16.0, 31.0, 41.0, 57.0, 93.0, 195.0, 597.0, 1556.0, 857.0, 289.0, 125.0, 54.0, 50.0, 21.0, 18.0, 8.0, 12.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00839996337890625, -0.00811624526977539, -0.007832527160644531, -0.007548809051513672, -0.0072650909423828125, -0.006981372833251953, -0.006697654724121094, -0.006413936614990234, -0.006130218505859375, -0.005846500396728516, -0.005562782287597656, -0.005279064178466797, -0.0049953460693359375, -0.004711627960205078, -0.004427909851074219, -0.004144191741943359, -0.0038604736328125, -0.0035767555236816406, -0.0032930374145507812, -0.003009319305419922, -0.0027256011962890625, -0.002441883087158203, -0.0021581649780273438, -0.0018744468688964844, -0.001590728759765625, -0.0013070106506347656, -0.0010232925415039062, -0.0007395744323730469, -0.0004558563232421875, -0.00017213821411132812, 0.00011157989501953125, 0.0003952980041503906, 0.00067901611328125, 0.0009627342224121094, 0.0012464523315429688, 0.0015301704406738281, 0.0018138885498046875, 0.002097606658935547, 0.0023813247680664062, 0.0026650428771972656, 0.002948760986328125, 0.0032324790954589844, 0.0035161972045898438, 0.003799915313720703, 0.0040836334228515625, 0.004367351531982422, 0.004651069641113281, 0.004934787750244141, 0.005218505859375, 0.005502223968505859, 0.005785942077636719, 0.006069660186767578, 0.0063533782958984375, 0.006637096405029297, 0.006920814514160156, 0.007204532623291016, 0.007488250732421875, 0.007771968841552734, 0.008055686950683594, 0.008339405059814453, 0.008623123168945312, 0.008906841278076172, 0.009190559387207031, 0.00947427749633789, 0.00975799560546875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 8.0, 20.0, 57.0, 98.0, 152.0, 196.0, 193.0, 125.0, 72.0, 36.0, 21.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06291228532791138, -0.06144343689084053, -0.05997459217905998, -0.058505743741989136, -0.05703689903020859, -0.05556805059313774, -0.05409920588135719, -0.052630357444286346, -0.0511615127325058, -0.04969266429543495, -0.048223819583654404, -0.04675497114658356, -0.04528612643480301, -0.04381727799773216, -0.042348433285951614, -0.04087958484888077, -0.03941074013710022, -0.03794189170002937, -0.036473046988248825, -0.03500419855117798, -0.03353535383939743, -0.032066505402326584, -0.030597660690546036, -0.02912881225347519, -0.027659963816404343, -0.026191117241978645, -0.024722270667552948, -0.02325342409312725, -0.021784577518701553, -0.020315730944275856, -0.01884688436985016, -0.017378035932779312, -0.015909191220998764, -0.014440344646573067, -0.01297149807214737, -0.011502651497721672, -0.010033804923295975, -0.008564958348870277, -0.0070961108431220055, -0.005627264268696308, -0.004158417694270611, -0.0026895711198449135, -0.0012207243125885725, 0.0002481224946677685, 0.0017169690690934658, 0.003185815643519163, 0.004654662683606148, 0.006123509258031845, 0.007592355832457542, 0.00906120240688324, 0.010530048981308937, 0.011998895555734634, 0.013467742130160332, 0.014936588704586029, 0.016405437141656876, 0.017874281853437424, 0.01934313029050827, 0.020811976864933968, 0.022280823439359665, 0.023749670013785362, 0.02521851658821106, 0.026687363162636757, 0.028156209737062454, 0.0296250581741333, 0.03109390288591385]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 9.0, 8.0, 8.0, 24.0, 18.0, 22.0, 18.0, 19.0, 22.0, 25.0, 40.0, 31.0, 25.0, 38.0, 46.0, 34.0, 39.0, 46.0, 52.0, 45.0, 40.0, 34.0, 38.0, 38.0, 33.0, 30.0, 37.0, 20.0, 29.0, 26.0, 20.0, 14.0, 17.0, 9.0, 8.0, 7.0, 6.0, 6.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01609623432159424, -0.015633855015039444, -0.015171477571129799, -0.01470909919589758, -0.01424672082066536, -0.01378434244543314, -0.01332196407020092, -0.0128595856949687, -0.01239720731973648, -0.011934828944504261, -0.011472450569272041, -0.011010072194039822, -0.010547693818807602, -0.010085315443575382, -0.009622937068343163, -0.009160558693110943, -0.008698180317878723, -0.008235801942646503, -0.007773423567414284, -0.007311045192182064, -0.006848666816949844, -0.006386288441717625, -0.005923910066485405, -0.005461531691253185, -0.004999153316020966, -0.004536774940788746, -0.004074396565556526, -0.0036120181903243065, -0.003149639815092087, -0.002687261439859867, -0.0022248830646276474, -0.0017625046893954277, -0.001300126314163208, -0.0008377479389309883, -0.0003753695636987686, 8.700881153345108e-05, 0.0005493871867656708, 0.0010117655619978905, 0.0014741439372301102, 0.0019365223124623299, 0.0023989006876945496, 0.0028612790629267693, 0.003323657438158989, 0.0037860358133912086, 0.004248414188623428, 0.004710792563855648, 0.005173170939087868, 0.005635549314320087, 0.006097927689552307, 0.006560306064784527, 0.0070226844400167465, 0.007485062815248966, 0.007947441190481186, 0.008409819565713406, 0.008872197940945625, 0.009334576316177845, 0.009796954691410065, 0.010259333066642284, 0.010721711441874504, 0.011184089817106724, 0.011646468192338943, 0.012108846567571163, 0.012571224942803383, 0.013033603318035603, 0.013495981693267822]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 10.0, 9.0, 13.0, 33.0, 35.0, 56.0, 62.0, 112.0, 177.0, 239.0, 477.0, 1016.0, 2946.0, 12064.0, 70795.0, 552609.0, 353069.0, 42486.0, 8122.0, 2325.0, 790.0, 405.0, 222.0, 163.0, 84.0, 71.0, 37.0, 42.0, 17.0, 22.0, 9.0, 9.0, 5.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0170135498046875, -0.016443967819213867, -0.015874385833740234, -0.015304803848266602, -0.014735221862792969, -0.014165639877319336, -0.013596057891845703, -0.01302647590637207, -0.012456893920898438, -0.011887311935424805, -0.011317729949951172, -0.010748147964477539, -0.010178565979003906, -0.009608983993530273, -0.00903940200805664, -0.008469820022583008, -0.007900238037109375, -0.007330656051635742, -0.006761074066162109, -0.0061914920806884766, -0.005621910095214844, -0.005052328109741211, -0.004482746124267578, -0.003913164138793945, -0.0033435821533203125, -0.0027740001678466797, -0.002204418182373047, -0.001634836196899414, -0.0010652542114257812, -0.0004956722259521484, 7.390975952148438e-05, 0.0006434917449951172, 0.00121307373046875, 0.0017826557159423828, 0.0023522377014160156, 0.0029218196868896484, 0.0034914016723632812, 0.004060983657836914, 0.004630565643310547, 0.00520014762878418, 0.0057697296142578125, 0.006339311599731445, 0.006908893585205078, 0.007478475570678711, 0.008048057556152344, 0.008617639541625977, 0.00918722152709961, 0.009756803512573242, 0.010326385498046875, 0.010895967483520508, 0.01146554946899414, 0.012035131454467773, 0.012604713439941406, 0.013174295425415039, 0.013743877410888672, 0.014313459396362305, 0.014883041381835938, 0.01545262336730957, 0.016022205352783203, 0.016591787338256836, 0.01716136932373047, 0.0177309513092041, 0.018300533294677734, 0.018870115280151367, 0.019439697265625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 12.0, 18.0, 18.0, 45.0, 48.0, 86.0, 81.0, 103.0, 115.0, 98.0, 111.0, 90.0, 57.0, 47.0, 20.0, 26.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0076751708984375, -0.007424712181091309, -0.007174253463745117, -0.006923794746398926, -0.006673336029052734, -0.006422877311706543, -0.0061724185943603516, -0.00592195987701416, -0.005671501159667969, -0.005421042442321777, -0.005170583724975586, -0.0049201250076293945, -0.004669666290283203, -0.004419207572937012, -0.00416874885559082, -0.003918290138244629, -0.0036678314208984375, -0.003417372703552246, -0.0031669139862060547, -0.0029164552688598633, -0.002665996551513672, -0.0024155378341674805, -0.002165079116821289, -0.0019146203994750977, -0.0016641616821289062, -0.0014137029647827148, -0.0011632442474365234, -0.000912785530090332, -0.0006623268127441406, -0.0004118680953979492, -0.0001614093780517578, 8.90493392944336e-05, 0.000339508056640625, 0.0005899667739868164, 0.0008404254913330078, 0.0010908842086791992, 0.0013413429260253906, 0.001591801643371582, 0.0018422603607177734, 0.002092719078063965, 0.0023431777954101562, 0.0025936365127563477, 0.002844095230102539, 0.0030945539474487305, 0.003345012664794922, 0.0035954713821411133, 0.0038459300994873047, 0.004096388816833496, 0.0043468475341796875, 0.004597306251525879, 0.00484776496887207, 0.005098223686218262, 0.005348682403564453, 0.0055991411209106445, 0.005849599838256836, 0.006100058555603027, 0.006350517272949219, 0.00660097599029541, 0.0068514347076416016, 0.007101893424987793, 0.007352352142333984, 0.007602810859680176, 0.007853269577026367, 0.008103728294372559, 0.00835418701171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 5.0, 18.0, 14.0, 21.0, 23.0, 48.0, 71.0, 97.0, 143.0, 219.0, 466.0, 841.0, 1663.0, 3379.0, 7217.0, 17249.0, 42308.0, 112328.0, 301035.0, 339732.0, 134996.0, 50467.0, 19887.0, 8350.0, 3891.0, 1843.0, 966.0, 513.0, 292.0, 155.0, 108.0, 64.0, 43.0, 20.0, 20.0, 14.0, 13.0, 12.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007537841796875, -0.007295370101928711, -0.007052898406982422, -0.006810426712036133, -0.006567955017089844, -0.006325483322143555, -0.006083011627197266, -0.0058405399322509766, -0.0055980682373046875, -0.0053555965423583984, -0.005113124847412109, -0.00487065315246582, -0.004628181457519531, -0.004385709762573242, -0.004143238067626953, -0.003900766372680664, -0.003658294677734375, -0.003415822982788086, -0.003173351287841797, -0.002930879592895508, -0.0026884078979492188, -0.0024459362030029297, -0.0022034645080566406, -0.0019609928131103516, -0.0017185211181640625, -0.0014760494232177734, -0.0012335777282714844, -0.0009911060333251953, -0.0007486343383789062, -0.0005061626434326172, -0.0002636909484863281, -2.1219253540039062e-05, 0.00022125244140625, 0.00046372413635253906, 0.0007061958312988281, 0.0009486675262451172, 0.0011911392211914062, 0.0014336109161376953, 0.0016760826110839844, 0.0019185543060302734, 0.0021610260009765625, 0.0024034976959228516, 0.0026459693908691406, 0.0028884410858154297, 0.0031309127807617188, 0.003373384475708008, 0.003615856170654297, 0.003858327865600586, 0.004100799560546875, 0.004343271255493164, 0.004585742950439453, 0.004828214645385742, 0.005070686340332031, 0.00531315803527832, 0.005555629730224609, 0.0057981014251708984, 0.0060405731201171875, 0.0062830448150634766, 0.006525516510009766, 0.006767988204956055, 0.007010459899902344, 0.007252931594848633, 0.007495403289794922, 0.007737874984741211, 0.0079803466796875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 1.0, 4.0, 5.0, 10.0, 4.0, 15.0, 16.0, 16.0, 29.0, 29.0, 29.0, 28.0, 38.0, 40.0, 63.0, 43.0, 60.0, 58.0, 51.0, 71.0, 50.0, 58.0, 51.0, 42.0, 35.0, 23.0, 25.0, 30.0, 15.0, 11.0, 11.0, 8.0, 11.0, 7.0, 4.0, 3.0, 6.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0119476318359375, -0.011586308479309082, -0.011224985122680664, -0.010863661766052246, -0.010502338409423828, -0.01014101505279541, -0.009779691696166992, -0.009418368339538574, -0.009057044982910156, -0.008695721626281738, -0.00833439826965332, -0.007973074913024902, -0.007611751556396484, -0.007250428199768066, -0.0068891048431396484, -0.0065277814865112305, -0.0061664581298828125, -0.0058051347732543945, -0.0054438114166259766, -0.005082488059997559, -0.004721164703369141, -0.004359841346740723, -0.003998517990112305, -0.0036371946334838867, -0.0032758712768554688, -0.0029145479202270508, -0.002553224563598633, -0.002191901206970215, -0.0018305778503417969, -0.001469254493713379, -0.001107931137084961, -0.000746607780456543, -0.000385284423828125, -2.396106719970703e-05, 0.00033736228942871094, 0.0006986856460571289, 0.0010600090026855469, 0.0014213323593139648, 0.0017826557159423828, 0.0021439790725708008, 0.0025053024291992188, 0.0028666257858276367, 0.0032279491424560547, 0.0035892724990844727, 0.003950595855712891, 0.004311919212341309, 0.0046732425689697266, 0.0050345659255981445, 0.0053958892822265625, 0.0057572126388549805, 0.0061185359954833984, 0.006479859352111816, 0.006841182708740234, 0.007202506065368652, 0.00756382942199707, 0.007925152778625488, 0.008286476135253906, 0.008647799491882324, 0.009009122848510742, 0.00937044620513916, 0.009731769561767578, 0.010093092918395996, 0.010454416275024414, 0.010815739631652832, 0.01117706298828125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 12.0, 15.0, 25.0, 38.0, 71.0, 86.0, 169.0, 285.0, 491.0, 903.0, 1828.0, 3814.0, 9190.0, 26473.0, 97397.0, 477576.0, 330794.0, 66139.0, 19703.0, 7274.0, 3122.0, 1433.0, 746.0, 384.0, 228.0, 131.0, 72.0, 57.0, 38.0, 23.0, 11.0, 9.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003406524658203125, -0.003284275531768799, -0.0031620264053344727, -0.0030397772789001465, -0.0029175281524658203, -0.002795279026031494, -0.002673029899597168, -0.002550780773162842, -0.0024285316467285156, -0.0023062825202941895, -0.0021840333938598633, -0.002061784267425537, -0.001939535140991211, -0.0018172860145568848, -0.0016950368881225586, -0.0015727877616882324, -0.0014505386352539062, -0.00132828950881958, -0.001206040382385254, -0.0010837912559509277, -0.0009615421295166016, -0.0008392930030822754, -0.0007170438766479492, -0.000594794750213623, -0.0004725456237792969, -0.0003502964973449707, -0.00022804737091064453, -0.00010579824447631836, 1.6450881958007812e-05, 0.00013870000839233398, 0.00026094913482666016, 0.00038319826126098633, 0.0005054473876953125, 0.0006276965141296387, 0.0007499456405639648, 0.000872194766998291, 0.0009944438934326172, 0.0011166930198669434, 0.0012389421463012695, 0.0013611912727355957, 0.0014834403991699219, 0.001605689525604248, 0.0017279386520385742, 0.0018501877784729004, 0.0019724369049072266, 0.0020946860313415527, 0.002216935157775879, 0.002339184284210205, 0.0024614334106445312, 0.0025836825370788574, 0.0027059316635131836, 0.0028281807899475098, 0.002950429916381836, 0.003072679042816162, 0.0031949281692504883, 0.0033171772956848145, 0.0034394264221191406, 0.003561675548553467, 0.003683924674987793, 0.003806173801422119, 0.003928422927856445, 0.0040506720542907715, 0.004172921180725098, 0.004295170307159424, 0.00441741943359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 9.0, 5.0, 0.0, 9.0, 16.0, 0.0, 22.0, 15.0, 23.0, 0.0, 38.0, 47.0, 38.0, 0.0, 54.0, 55.0, 61.0, 0.0, 67.0, 63.0, 0.0, 59.0, 65.0, 65.0, 0.0, 55.0, 38.0, 51.0, 0.0, 31.0, 24.0, 28.0, 0.0, 13.0, 13.0, 0.0, 11.0, 8.0, 7.0, 0.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.430511474609375e-06, -1.3867393136024475e-06, -1.34296715259552e-06, -1.2991949915885925e-06, -1.255422830581665e-06, -1.2116506695747375e-06, -1.16787850856781e-06, -1.1241063475608826e-06, -1.080334186553955e-06, -1.0365620255470276e-06, -9.927898645401e-07, -9.490177035331726e-07, -9.052455425262451e-07, -8.614733815193176e-07, -8.177012205123901e-07, -7.739290595054626e-07, -7.301568984985352e-07, -6.863847374916077e-07, -6.426125764846802e-07, -5.988404154777527e-07, -5.550682544708252e-07, -5.112960934638977e-07, -4.675239324569702e-07, -4.237517714500427e-07, -3.7997961044311523e-07, -3.3620744943618774e-07, -2.9243528842926025e-07, -2.4866312742233276e-07, -2.0489096641540527e-07, -1.6111880540847778e-07, -1.1734664440155029e-07, -7.35744833946228e-08, -2.9802322387695312e-08, 1.3969838619232178e-08, 5.774199962615967e-08, 1.0151416063308716e-07, 1.4528632164001465e-07, 1.8905848264694214e-07, 2.3283064365386963e-07, 2.766028046607971e-07, 3.203749656677246e-07, 3.641471266746521e-07, 4.079192876815796e-07, 4.516914486885071e-07, 4.954636096954346e-07, 5.392357707023621e-07, 5.830079317092896e-07, 6.26780092716217e-07, 6.705522537231445e-07, 7.14324414730072e-07, 7.580965757369995e-07, 8.01868736743927e-07, 8.456408977508545e-07, 8.89413058757782e-07, 9.331852197647095e-07, 9.76957380771637e-07, 1.0207295417785645e-06, 1.064501702785492e-06, 1.1082738637924194e-06, 1.152046024799347e-06, 1.1958181858062744e-06, 1.239590346813202e-06, 1.2833625078201294e-06, 1.3271346688270569e-06, 1.3709068298339844e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 17.0, 22.0, 30.0, 39.0, 81.0, 130.0, 318.0, 689.0, 1874.0, 5989.0, 23190.0, 159599.0, 731120.0, 100664.0, 17392.0, 4722.0, 1575.0, 535.0, 239.0, 127.0, 62.0, 38.0, 29.0, 22.0, 20.0, 7.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006053924560546875, -0.005824625492095947, -0.0055953264236450195, -0.005366027355194092, -0.005136728286743164, -0.004907429218292236, -0.004678130149841309, -0.004448831081390381, -0.004219532012939453, -0.003990232944488525, -0.0037609338760375977, -0.00353163480758667, -0.003302335739135742, -0.0030730366706848145, -0.0028437376022338867, -0.002614438533782959, -0.0023851394653320312, -0.0021558403968811035, -0.0019265413284301758, -0.001697242259979248, -0.0014679431915283203, -0.0012386441230773926, -0.0010093450546264648, -0.0007800459861755371, -0.0005507469177246094, -0.00032144784927368164, -9.21487808227539e-05, 0.00013715028762817383, 0.00036644935607910156, 0.0005957484245300293, 0.000825047492980957, 0.0010543465614318848, 0.0012836456298828125, 0.0015129446983337402, 0.001742243766784668, 0.0019715428352355957, 0.0022008419036865234, 0.002430140972137451, 0.002659440040588379, 0.0028887391090393066, 0.0031180381774902344, 0.003347337245941162, 0.00357663631439209, 0.0038059353828430176, 0.004035234451293945, 0.004264533519744873, 0.004493832588195801, 0.0047231316566467285, 0.004952430725097656, 0.005181729793548584, 0.005411028861999512, 0.0056403279304504395, 0.005869626998901367, 0.006098926067352295, 0.006328225135803223, 0.00655752420425415, 0.006786823272705078, 0.007016122341156006, 0.007245421409606934, 0.007474720478057861, 0.007704019546508789, 0.007933318614959717, 0.008162617683410645, 0.008391916751861572, 0.0086212158203125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 11.0, 10.0, 18.0, 20.0, 35.0, 52.0, 68.0, 138.0, 193.0, 165.0, 106.0, 53.0, 36.0, 14.0, 11.0, 17.0, 10.0, 8.0, 6.0, 4.0, 7.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004421234130859375, -0.00422590970993042, -0.004030585289001465, -0.0038352608680725098, -0.0036399364471435547, -0.0034446120262145996, -0.0032492876052856445, -0.0030539631843566895, -0.0028586387634277344, -0.0026633143424987793, -0.0024679899215698242, -0.002272665500640869, -0.002077341079711914, -0.001882016658782959, -0.001686692237854004, -0.0014913678169250488, -0.0012960433959960938, -0.0011007189750671387, -0.0009053945541381836, -0.0007100701332092285, -0.0005147457122802734, -0.00031942129135131836, -0.00012409687042236328, 7.12275505065918e-05, 0.0002665519714355469, 0.00046187639236450195, 0.000657200813293457, 0.0008525252342224121, 0.0010478496551513672, 0.0012431740760803223, 0.0014384984970092773, 0.0016338229179382324, 0.0018291473388671875, 0.0020244717597961426, 0.0022197961807250977, 0.0024151206016540527, 0.002610445022583008, 0.002805769443511963, 0.003001093864440918, 0.003196418285369873, 0.003391742706298828, 0.003587067127227783, 0.0037823915481567383, 0.003977715969085693, 0.0041730403900146484, 0.0043683648109436035, 0.004563689231872559, 0.004759013652801514, 0.004954338073730469, 0.005149662494659424, 0.005344986915588379, 0.005540311336517334, 0.005735635757446289, 0.005930960178375244, 0.006126284599304199, 0.006321609020233154, 0.006516933441162109, 0.0067122578620910645, 0.0069075822830200195, 0.007102906703948975, 0.00729823112487793, 0.007493555545806885, 0.00768887996673584, 0.007884204387664795, 0.00807952880859375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 10.0, 24.0, 66.0, 118.0, 183.0, 221.0, 178.0, 93.0, 50.0, 23.0, 17.0, 10.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033246103674173355, -0.03134322538971901, -0.029440347105264664, -0.027537468820810318, -0.025634590536355972, -0.023731712251901627, -0.02182883210480213, -0.019925953820347786, -0.01802307553589344, -0.016120197251439095, -0.014217318966984749, -0.012314439751207829, -0.010411561466753483, -0.008508683182299137, -0.006605803966522217, -0.004702925682067871, -0.0028000473976135254, -0.000897168880328536, 0.0010057096369564533, 0.0029085883870720863, 0.004811466671526432, 0.006714344955980778, 0.008617224171757698, 0.010520102456212044, 0.01242298074066639, 0.014325859025120735, 0.01622873730957508, 0.018131617456674576, 0.02003449574112892, 0.021937374025583267, 0.023840252310037613, 0.02574313059449196, 0.027646005153656006, 0.02954888343811035, 0.0314517617225647, 0.03335464000701904, 0.03525751829147339, 0.037160396575927734, 0.03906327486038208, 0.040966153144836426, 0.04286903142929077, 0.04477190971374512, 0.04667478799819946, 0.04857766628265381, 0.050480544567108154, 0.0523834228515625, 0.054286301136016846, 0.05618917942047119, 0.058092061430215836, 0.05999493971467018, 0.06189781799912453, 0.06380070000886917, 0.06570357829332352, 0.06760645657777786, 0.06950933486223221, 0.07141221314668655, 0.0733150914311409, 0.07521796971559525, 0.07712084800004959, 0.07902372628450394, 0.08092660456895828, 0.08282948285341263, 0.08473236113786697, 0.08663523942232132, 0.08853811770677567]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 3.0, 4.0, 6.0, 9.0, 11.0, 12.0, 15.0, 17.0, 16.0, 21.0, 30.0, 20.0, 31.0, 27.0, 34.0, 33.0, 30.0, 46.0, 40.0, 41.0, 40.0, 40.0, 32.0, 42.0, 39.0, 36.0, 25.0, 34.0, 29.0, 28.0, 24.0, 21.0, 21.0, 24.0, 20.0, 10.0, 11.0, 18.0, 9.0, 12.0, 9.0, 7.0, 4.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.021313011646270752, -0.02061578445136547, -0.01991855725646019, -0.01922133006155491, -0.018524102866649628, -0.017826875671744347, -0.017129648476839066, -0.016432421281933784, -0.015735194087028503, -0.015037966892123222, -0.014340739697217941, -0.01364351250231266, -0.01294628530740738, -0.012249058112502098, -0.011551830917596817, -0.010854603722691536, -0.010157376527786255, -0.009460149332880974, -0.008762922137975693, -0.008065694943070412, -0.007368467748165131, -0.0066712405532598495, -0.0059740133583545685, -0.005276786163449287, -0.004579558968544006, -0.0038823317736387253, -0.003185104578733444, -0.002487877383828163, -0.001790650188922882, -0.001093422994017601, -0.00039619579911231995, 0.0003010313957929611, 0.0009982585906982422, 0.0016954857856035233, 0.0023927129805088043, 0.0030899401754140854, 0.0037871673703193665, 0.0044843945652246475, 0.005181621760129929, 0.00587884895503521, 0.006576076149940491, 0.007273303344845772, 0.007970530539751053, 0.008667757734656334, 0.009364984929561615, 0.010062212124466896, 0.010759439319372177, 0.011456666514277458, 0.01215389370918274, 0.01285112090408802, 0.013548348098993301, 0.014245575293898582, 0.014942802488803864, 0.015640029683709145, 0.016337256878614426, 0.017034484073519707, 0.017731711268424988, 0.01842893846333027, 0.01912616565823555, 0.01982339285314083, 0.020520620048046112, 0.021217847242951393, 0.021915074437856674, 0.022612301632761955, 0.023309528827667236]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 22.0, 26.0, 38.0, 74.0, 141.0, 247.0, 530.0, 1504.0, 7062.0, 98539.0, 4002469.0, 74769.0, 6338.0, 1473.0, 471.0, 255.0, 131.0, 62.0, 39.0, 20.0, 25.0, 11.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.02642822265625, -0.025722742080688477, -0.025017261505126953, -0.02431178092956543, -0.023606300354003906, -0.022900819778442383, -0.02219533920288086, -0.021489858627319336, -0.020784378051757812, -0.02007889747619629, -0.019373416900634766, -0.018667936325073242, -0.01796245574951172, -0.017256975173950195, -0.016551494598388672, -0.01584601402282715, -0.015140533447265625, -0.014435052871704102, -0.013729572296142578, -0.013024091720581055, -0.012318611145019531, -0.011613130569458008, -0.010907649993896484, -0.010202169418334961, -0.009496688842773438, -0.008791208267211914, -0.00808572769165039, -0.007380247116088867, -0.006674766540527344, -0.00596928596496582, -0.005263805389404297, -0.0045583248138427734, -0.00385284423828125, -0.0031473636627197266, -0.002441883087158203, -0.0017364025115966797, -0.0010309219360351562, -0.0003254413604736328, 0.0003800392150878906, 0.001085519790649414, 0.0017910003662109375, 0.002496480941772461, 0.0032019615173339844, 0.003907442092895508, 0.004612922668457031, 0.005318403244018555, 0.006023883819580078, 0.0067293643951416016, 0.007434844970703125, 0.008140325546264648, 0.008845806121826172, 0.009551286697387695, 0.010256767272949219, 0.010962247848510742, 0.011667728424072266, 0.012373208999633789, 0.013078689575195312, 0.013784170150756836, 0.01448965072631836, 0.015195131301879883, 0.015900611877441406, 0.01660609245300293, 0.017311573028564453, 0.018017053604125977, 0.0187225341796875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 9.0, 22.0, 33.0, 33.0, 70.0, 73.0, 95.0, 103.0, 131.0, 97.0, 87.0, 83.0, 58.0, 39.0, 30.0, 17.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007740020751953125, -0.007475912570953369, -0.007211804389953613, -0.006947696208953857, -0.0066835880279541016, -0.006419479846954346, -0.00615537166595459, -0.005891263484954834, -0.005627155303955078, -0.005363047122955322, -0.005098938941955566, -0.0048348307609558105, -0.004570722579956055, -0.004306614398956299, -0.004042506217956543, -0.003778398036956787, -0.0035142898559570312, -0.0032501816749572754, -0.0029860734939575195, -0.0027219653129577637, -0.002457857131958008, -0.002193748950958252, -0.001929640769958496, -0.0016655325889587402, -0.0014014244079589844, -0.0011373162269592285, -0.0008732080459594727, -0.0006090998649597168, -0.00034499168395996094, -8.088350296020508e-05, 0.00018322467803955078, 0.00044733285903930664, 0.0007114410400390625, 0.0009755492210388184, 0.0012396574020385742, 0.00150376558303833, 0.001767873764038086, 0.002031981945037842, 0.0022960901260375977, 0.0025601983070373535, 0.0028243064880371094, 0.0030884146690368652, 0.003352522850036621, 0.003616631031036377, 0.003880739212036133, 0.004144847393035889, 0.0044089555740356445, 0.0046730637550354, 0.004937171936035156, 0.005201280117034912, 0.005465388298034668, 0.005729496479034424, 0.00599360466003418, 0.0062577128410339355, 0.006521821022033691, 0.006785929203033447, 0.007050037384033203, 0.007314145565032959, 0.007578253746032715, 0.00784236192703247, 0.008106470108032227, 0.008370578289031982, 0.008634686470031738, 0.008898794651031494, 0.00916290283203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 9.0, 5.0, 7.0, 11.0, 14.0, 17.0, 23.0, 31.0, 41.0, 47.0, 64.0, 98.0, 169.0, 200.0, 324.0, 621.0, 1085.0, 2217.0, 5175.0, 13303.0, 46338.0, 267264.0, 3390664.0, 381384.0, 58011.0, 15991.0, 5776.0, 2446.0, 1170.0, 611.0, 382.0, 207.0, 132.0, 120.0, 68.0, 52.0, 49.0, 44.0, 25.0, 23.0, 17.0, 16.0, 10.0, 7.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00830841064453125, -0.008027434349060059, -0.007746458053588867, -0.007465481758117676, -0.007184505462646484, -0.006903529167175293, -0.0066225528717041016, -0.00634157657623291, -0.006060600280761719, -0.005779623985290527, -0.005498647689819336, -0.0052176713943481445, -0.004936695098876953, -0.004655718803405762, -0.00437474250793457, -0.004093766212463379, -0.0038127899169921875, -0.003531813621520996, -0.0032508373260498047, -0.0029698610305786133, -0.002688884735107422, -0.0024079084396362305, -0.002126932144165039, -0.0018459558486938477, -0.0015649795532226562, -0.0012840032577514648, -0.0010030269622802734, -0.000722050666809082, -0.0004410743713378906, -0.00016009807586669922, 0.00012087821960449219, 0.0004018545150756836, 0.000682830810546875, 0.0009638071060180664, 0.0012447834014892578, 0.0015257596969604492, 0.0018067359924316406, 0.002087712287902832, 0.0023686885833740234, 0.002649664878845215, 0.0029306411743164062, 0.0032116174697875977, 0.003492593765258789, 0.0037735700607299805, 0.004054546356201172, 0.004335522651672363, 0.004616498947143555, 0.004897475242614746, 0.0051784515380859375, 0.005459427833557129, 0.00574040412902832, 0.006021380424499512, 0.006302356719970703, 0.0065833330154418945, 0.006864309310913086, 0.007145285606384277, 0.007426261901855469, 0.00770723819732666, 0.007988214492797852, 0.008269190788269043, 0.008550167083740234, 0.008831143379211426, 0.009112119674682617, 0.009393095970153809, 0.009674072265625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 2.0, 6.0, 8.0, 9.0, 5.0, 16.0, 28.0, 31.0, 66.0, 84.0, 162.0, 407.0, 1103.0, 1150.0, 469.0, 201.0, 109.0, 68.0, 45.0, 34.0, 22.0, 15.0, 8.0, 7.0, 5.0, 5.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007537841796875, -0.0072362422943115234, -0.006934642791748047, -0.00663304328918457, -0.006331443786621094, -0.006029844284057617, -0.005728244781494141, -0.005426645278930664, -0.0051250457763671875, -0.004823446273803711, -0.004521846771240234, -0.004220247268676758, -0.003918647766113281, -0.0036170482635498047, -0.003315448760986328, -0.0030138492584228516, -0.002712249755859375, -0.0024106502532958984, -0.002109050750732422, -0.0018074512481689453, -0.0015058517456054688, -0.0012042522430419922, -0.0009026527404785156, -0.0006010532379150391, -0.0002994537353515625, 2.1457672119140625e-06, 0.0003037452697753906, 0.0006053447723388672, 0.0009069442749023438, 0.0012085437774658203, 0.0015101432800292969, 0.0018117427825927734, 0.00211334228515625, 0.0024149417877197266, 0.002716541290283203, 0.0030181407928466797, 0.0033197402954101562, 0.003621339797973633, 0.003922939300537109, 0.004224538803100586, 0.0045261383056640625, 0.004827737808227539, 0.005129337310791016, 0.005430936813354492, 0.005732536315917969, 0.006034135818481445, 0.006335735321044922, 0.0066373348236083984, 0.006938934326171875, 0.0072405338287353516, 0.007542133331298828, 0.007843732833862305, 0.008145332336425781, 0.008446931838989258, 0.008748531341552734, 0.009050130844116211, 0.009351730346679688, 0.009653329849243164, 0.00995492935180664, 0.010256528854370117, 0.010558128356933594, 0.01085972785949707, 0.011161327362060547, 0.011462926864624023, 0.0117645263671875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 18.0, 47.0, 103.0, 210.0, 279.0, 185.0, 81.0, 44.0, 19.0, 3.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.079001285135746, -0.07655414938926697, -0.07410700619220734, -0.0716598704457283, -0.06921273469924927, -0.06676559150218964, -0.0643184557557106, -0.06187132000923157, -0.059424180537462234, -0.0569770410656929, -0.05452990531921387, -0.052082765847444534, -0.0496356263756752, -0.04718849062919617, -0.044741351157426834, -0.0422942116856575, -0.03984707593917847, -0.037399936467409134, -0.0349528007209301, -0.03250566124916077, -0.030058523640036583, -0.0276113860309124, -0.025164246559143066, -0.022717108950018883, -0.0202699713408947, -0.017822833731770515, -0.015375695191323757, -0.012928556650876999, -0.010481419041752815, -0.008034281432628632, -0.005587142892181873, -0.003140004351735115, -0.0006928592920303345, 0.0017542787827551365, 0.0042014168575406075, 0.006648554932326078, 0.00909569300711155, 0.011542830616235733, 0.013989969156682491, 0.01643710769712925, 0.018884245306253433, 0.021331382915377617, 0.0237785205245018, 0.026225659996271133, 0.028672797605395317, 0.0311199352145195, 0.033567074686288834, 0.036014214158058167, 0.0384613499045372, 0.040908489376306534, 0.04335562512278557, 0.0458027645945549, 0.048249900341033936, 0.05069703981280327, 0.0531441792845726, 0.055591315031051636, 0.05803845450282097, 0.0604855939745903, 0.06293272972106934, 0.06537986546754837, 0.067827008664608, 0.07027414441108704, 0.07272128015756607, 0.0751684233546257, 0.07761555910110474]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 7.0, 9.0, 9.0, 7.0, 9.0, 10.0, 10.0, 17.0, 24.0, 17.0, 30.0, 26.0, 24.0, 25.0, 31.0, 35.0, 35.0, 45.0, 41.0, 35.0, 37.0, 33.0, 37.0, 37.0, 33.0, 32.0, 30.0, 31.0, 29.0, 26.0, 28.0, 29.0, 20.0, 23.0, 20.0, 14.0, 12.0, 13.0, 10.0, 11.0, 5.0, 9.0, 4.0, 7.0, 5.0, 1.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.017048776149749756, -0.01651330664753914, -0.015977835282683372, -0.01544236484915018, -0.01490689441561699, -0.014371423982083797, -0.013835953548550606, -0.013300483115017414, -0.012765012681484222, -0.01222954224795103, -0.011694071814417839, -0.011158601380884647, -0.010623130947351456, -0.010087660513818264, -0.009552190080285072, -0.00901671964675188, -0.008481249213218689, -0.007945778779685497, -0.007410308346152306, -0.006874837912619114, -0.006339367479085922, -0.0058038970455527306, -0.005268426612019539, -0.004732956178486347, -0.0041974857449531555, -0.003662015311419964, -0.003126544877886772, -0.0025910744443535805, -0.002055604010820389, -0.0015201335772871971, -0.0009846631437540054, -0.00044919271022081375, 8.627772331237793e-05, 0.0006217481568455696, 0.0011572185903787613, 0.001692689023911953, 0.0022281594574451447, 0.0027636298909783363, 0.003299100324511528, 0.0038345707580447197, 0.004370041191577911, 0.004905511625111103, 0.005440982058644295, 0.005976452492177486, 0.006511922925710678, 0.00704739335924387, 0.0075828637927770615, 0.008118334226310253, 0.008653804659843445, 0.009189275093376637, 0.009724745526909828, 0.01026021596044302, 0.010795686393976212, 0.011331156827509403, 0.011866627261042595, 0.012402097694575787, 0.012937568128108978, 0.01347303856164217, 0.014008508995175362, 0.014543979428708553, 0.015079449862241745, 0.015614920295774937, 0.01615039072930813, 0.016685862094163895, 0.01722133159637451]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 7.0, 10.0, 14.0, 17.0, 23.0, 32.0, 66.0, 91.0, 152.0, 332.0, 583.0, 1499.0, 5937.0, 33113.0, 320963.0, 611470.0, 60846.0, 9549.0, 2265.0, 744.0, 340.0, 167.0, 105.0, 68.0, 45.0, 35.0, 19.0, 20.0, 10.0, 9.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.025146484375, -0.02433919906616211, -0.02353191375732422, -0.022724628448486328, -0.021917343139648438, -0.021110057830810547, -0.020302772521972656, -0.019495487213134766, -0.018688201904296875, -0.017880916595458984, -0.017073631286621094, -0.016266345977783203, -0.015459060668945312, -0.014651775360107422, -0.013844490051269531, -0.01303720474243164, -0.01222991943359375, -0.01142263412475586, -0.010615348815917969, -0.009808063507080078, -0.009000778198242188, -0.008193492889404297, -0.007386207580566406, -0.006578922271728516, -0.005771636962890625, -0.004964351654052734, -0.004157066345214844, -0.003349781036376953, -0.0025424957275390625, -0.0017352104187011719, -0.0009279251098632812, -0.00012063980102539062, 0.0006866455078125, 0.0014939308166503906, 0.0023012161254882812, 0.003108501434326172, 0.0039157867431640625, 0.004723072052001953, 0.005530357360839844, 0.006337642669677734, 0.007144927978515625, 0.007952213287353516, 0.008759498596191406, 0.009566783905029297, 0.010374069213867188, 0.011181354522705078, 0.011988639831542969, 0.01279592514038086, 0.01360321044921875, 0.01441049575805664, 0.015217781066894531, 0.016025066375732422, 0.016832351684570312, 0.017639636993408203, 0.018446922302246094, 0.019254207611083984, 0.020061492919921875, 0.020868778228759766, 0.021676063537597656, 0.022483348846435547, 0.023290634155273438, 0.024097919464111328, 0.02490520477294922, 0.02571249008178711, 0.026519775390625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 7.0, 25.0, 24.0, 39.0, 62.0, 72.0, 86.0, 96.0, 113.0, 111.0, 100.0, 90.0, 58.0, 40.0, 30.0, 21.0, 11.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007740020751953125, -0.007470071315765381, -0.007200121879577637, -0.006930172443389893, -0.0066602230072021484, -0.006390273571014404, -0.00612032413482666, -0.005850374698638916, -0.005580425262451172, -0.005310475826263428, -0.005040526390075684, -0.0047705769538879395, -0.004500627517700195, -0.004230678081512451, -0.003960728645324707, -0.003690779209136963, -0.0034208297729492188, -0.0031508803367614746, -0.0028809309005737305, -0.0026109814643859863, -0.002341032028198242, -0.002071082592010498, -0.001801133155822754, -0.0015311837196350098, -0.0012612342834472656, -0.0009912848472595215, -0.0007213354110717773, -0.0004513859748840332, -0.00018143653869628906, 8.851289749145508e-05, 0.0003584623336791992, 0.0006284117698669434, 0.0008983612060546875, 0.0011683106422424316, 0.0014382600784301758, 0.00170820951461792, 0.001978158950805664, 0.002248108386993408, 0.0025180578231811523, 0.0027880072593688965, 0.0030579566955566406, 0.0033279061317443848, 0.003597855567932129, 0.003867805004119873, 0.004137754440307617, 0.004407703876495361, 0.0046776533126831055, 0.00494760274887085, 0.005217552185058594, 0.005487501621246338, 0.005757451057434082, 0.006027400493621826, 0.00629734992980957, 0.0065672993659973145, 0.006837248802185059, 0.007107198238372803, 0.007377147674560547, 0.007647097110748291, 0.007917046546936035, 0.00818699598312378, 0.008456945419311523, 0.008726894855499268, 0.008996844291687012, 0.009266793727874756, 0.0095367431640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 5.0, 3.0, 10.0, 7.0, 11.0, 12.0, 22.0, 35.0, 48.0, 57.0, 92.0, 153.0, 274.0, 545.0, 1081.0, 2402.0, 5658.0, 15414.0, 45940.0, 156322.0, 475130.0, 242160.0, 67691.0, 21600.0, 7785.0, 3086.0, 1468.0, 660.0, 356.0, 170.0, 102.0, 77.0, 45.0, 22.0, 33.0, 23.0, 18.0, 8.0, 8.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0105133056640625, -0.01013326644897461, -0.009753227233886719, -0.009373188018798828, -0.008993148803710938, -0.008613109588623047, -0.008233070373535156, -0.007853031158447266, -0.007472991943359375, -0.007092952728271484, -0.006712913513183594, -0.006332874298095703, -0.0059528350830078125, -0.005572795867919922, -0.005192756652832031, -0.004812717437744141, -0.00443267822265625, -0.004052639007568359, -0.0036725997924804688, -0.003292560577392578, -0.0029125213623046875, -0.002532482147216797, -0.0021524429321289062, -0.0017724037170410156, -0.001392364501953125, -0.0010123252868652344, -0.0006322860717773438, -0.0002522468566894531, 0.0001277923583984375, 0.0005078315734863281, 0.0008878707885742188, 0.0012679100036621094, 0.00164794921875, 0.0020279884338378906, 0.0024080276489257812, 0.002788066864013672, 0.0031681060791015625, 0.003548145294189453, 0.003928184509277344, 0.004308223724365234, 0.004688262939453125, 0.005068302154541016, 0.005448341369628906, 0.005828380584716797, 0.0062084197998046875, 0.006588459014892578, 0.006968498229980469, 0.007348537445068359, 0.00772857666015625, 0.00810861587524414, 0.008488655090332031, 0.008868694305419922, 0.009248733520507812, 0.009628772735595703, 0.010008811950683594, 0.010388851165771484, 0.010768890380859375, 0.011148929595947266, 0.011528968811035156, 0.011909008026123047, 0.012289047241210938, 0.012669086456298828, 0.013049125671386719, 0.01342916488647461, 0.0138092041015625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 5.0, 8.0, 3.0, 2.0, 5.0, 10.0, 10.0, 19.0, 22.0, 23.0, 22.0, 24.0, 34.0, 31.0, 51.0, 25.0, 60.0, 47.0, 52.0, 48.0, 40.0, 61.0, 56.0, 45.0, 38.0, 49.0, 26.0, 38.0, 21.0, 20.0, 18.0, 19.0, 17.0, 16.0, 7.0, 6.0, 6.0, 3.0, 4.0, 1.0, 0.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.01090240478515625, -0.010561466217041016, -0.010220527648925781, -0.009879589080810547, -0.009538650512695312, -0.009197711944580078, -0.008856773376464844, -0.00851583480834961, -0.008174896240234375, -0.00783395767211914, -0.007493019104003906, -0.007152080535888672, -0.0068111419677734375, -0.006470203399658203, -0.006129264831542969, -0.005788326263427734, -0.0054473876953125, -0.005106449127197266, -0.004765510559082031, -0.004424571990966797, -0.0040836334228515625, -0.003742694854736328, -0.0034017562866210938, -0.0030608177185058594, -0.002719879150390625, -0.0023789405822753906, -0.0020380020141601562, -0.0016970634460449219, -0.0013561248779296875, -0.0010151863098144531, -0.0006742477416992188, -0.0003333091735839844, 7.62939453125e-06, 0.0003485679626464844, 0.0006895065307617188, 0.0010304450988769531, 0.0013713836669921875, 0.0017123222351074219, 0.0020532608032226562, 0.0023941993713378906, 0.002735137939453125, 0.0030760765075683594, 0.0034170150756835938, 0.003757953643798828, 0.0040988922119140625, 0.004439830780029297, 0.004780769348144531, 0.005121707916259766, 0.005462646484375, 0.005803585052490234, 0.006144523620605469, 0.006485462188720703, 0.0068264007568359375, 0.007167339324951172, 0.007508277893066406, 0.00784921646118164, 0.008190155029296875, 0.00853109359741211, 0.008872032165527344, 0.009212970733642578, 0.009553909301757812, 0.009894847869873047, 0.010235786437988281, 0.010576725006103516, 0.01091766357421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 5.0, 27.0, 40.0, 60.0, 104.0, 175.0, 312.0, 696.0, 1435.0, 3862.0, 14631.0, 118190.0, 789434.0, 99956.0, 13324.0, 3550.0, 1381.0, 663.0, 316.0, 154.0, 103.0, 49.0, 21.0, 15.0, 17.0, 6.0, 6.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0091705322265625, -0.008919060230255127, -0.008667588233947754, -0.00841611623764038, -0.008164644241333008, -0.007913172245025635, -0.007661700248718262, -0.007410228252410889, -0.007158756256103516, -0.006907284259796143, -0.0066558122634887695, -0.0064043402671813965, -0.0061528682708740234, -0.00590139627456665, -0.005649924278259277, -0.005398452281951904, -0.005146980285644531, -0.004895508289337158, -0.004644036293029785, -0.004392564296722412, -0.004141092300415039, -0.003889620304107666, -0.003638148307800293, -0.00338667631149292, -0.003135204315185547, -0.002883732318878174, -0.0026322603225708008, -0.0023807883262634277, -0.0021293163299560547, -0.0018778443336486816, -0.0016263723373413086, -0.0013749003410339355, -0.0011234283447265625, -0.0008719563484191895, -0.0006204843521118164, -0.00036901235580444336, -0.00011754035949707031, 0.00013393163681030273, 0.0003854036331176758, 0.0006368756294250488, 0.0008883476257324219, 0.001139819622039795, 0.001391291618347168, 0.001642763614654541, 0.001894235610961914, 0.002145707607269287, 0.00239717960357666, 0.002648651599884033, 0.0029001235961914062, 0.0031515955924987793, 0.0034030675888061523, 0.0036545395851135254, 0.0039060115814208984, 0.0041574835777282715, 0.0044089555740356445, 0.004660427570343018, 0.004911899566650391, 0.005163371562957764, 0.005414843559265137, 0.00566631555557251, 0.005917787551879883, 0.006169259548187256, 0.006420731544494629, 0.006672203540802002, 0.006923675537109375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 0.0, 4.0, 0.0, 5.0, 8.0, 0.0, 6.0, 13.0, 17.0, 0.0, 21.0, 20.0, 25.0, 0.0, 33.0, 41.0, 54.0, 0.0, 54.0, 47.0, 50.0, 65.0, 0.0, 56.0, 54.0, 61.0, 0.0, 82.0, 37.0, 52.0, 0.0, 45.0, 27.0, 26.0, 0.0, 20.0, 16.0, 13.0, 16.0, 0.0, 11.0, 8.0, 4.0, 0.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.6093254089355469e-06, -1.5636906027793884e-06, -1.51805579662323e-06, -1.4724209904670715e-06, -1.426786184310913e-06, -1.3811513781547546e-06, -1.3355165719985962e-06, -1.2898817658424377e-06, -1.2442469596862793e-06, -1.1986121535301208e-06, -1.1529773473739624e-06, -1.107342541217804e-06, -1.0617077350616455e-06, -1.016072928905487e-06, -9.704381227493286e-07, -9.248033165931702e-07, -8.791685104370117e-07, -8.335337042808533e-07, -7.878988981246948e-07, -7.422640919685364e-07, -6.966292858123779e-07, -6.509944796562195e-07, -6.05359673500061e-07, -5.597248673439026e-07, -5.140900611877441e-07, -4.684552550315857e-07, -4.2282044887542725e-07, -3.771856427192688e-07, -3.3155083656311035e-07, -2.859160304069519e-07, -2.4028122425079346e-07, -1.94646418094635e-07, -1.4901161193847656e-07, -1.0337680578231812e-07, -5.774199962615967e-08, -1.210719347000122e-08, 3.3527612686157227e-08, 7.916241884231567e-08, 1.2479722499847412e-07, 1.7043203115463257e-07, 2.1606683731079102e-07, 2.6170164346694946e-07, 3.073364496231079e-07, 3.5297125577926636e-07, 3.986060619354248e-07, 4.4424086809158325e-07, 4.898756742477417e-07, 5.355104804039001e-07, 5.811452865600586e-07, 6.26780092716217e-07, 6.724148988723755e-07, 7.180497050285339e-07, 7.636845111846924e-07, 8.093193173408508e-07, 8.549541234970093e-07, 9.005889296531677e-07, 9.462237358093262e-07, 9.918585419654846e-07, 1.037493348121643e-06, 1.0831281542778015e-06, 1.12876296043396e-06, 1.1743977665901184e-06, 1.2200325727462769e-06, 1.2656673789024353e-06, 1.3113021850585938e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 14.0, 11.0, 22.0, 39.0, 56.0, 107.0, 158.0, 331.0, 514.0, 880.0, 1551.0, 3294.0, 8458.0, 36597.0, 357579.0, 566903.0, 53196.0, 10834.0, 3873.0, 1804.0, 942.0, 490.0, 278.0, 212.0, 134.0, 70.0, 63.0, 40.0, 30.0, 19.0, 10.0, 6.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0081329345703125, -0.00788724422454834, -0.00764155387878418, -0.0073958635330200195, -0.007150173187255859, -0.006904482841491699, -0.006658792495727539, -0.006413102149963379, -0.006167411804199219, -0.005921721458435059, -0.0056760311126708984, -0.005430340766906738, -0.005184650421142578, -0.004938960075378418, -0.004693269729614258, -0.004447579383850098, -0.0042018890380859375, -0.003956198692321777, -0.003710508346557617, -0.003464818000793457, -0.003219127655029297, -0.0029734373092651367, -0.0027277469635009766, -0.0024820566177368164, -0.0022363662719726562, -0.001990675926208496, -0.001744985580444336, -0.0014992952346801758, -0.0012536048889160156, -0.0010079145431518555, -0.0007622241973876953, -0.0005165338516235352, -0.000270843505859375, -2.5153160095214844e-05, 0.0002205371856689453, 0.00046622753143310547, 0.0007119178771972656, 0.0009576082229614258, 0.001203298568725586, 0.001448988914489746, 0.0016946792602539062, 0.0019403696060180664, 0.0021860599517822266, 0.0024317502975463867, 0.002677440643310547, 0.002923130989074707, 0.003168821334838867, 0.0034145116806030273, 0.0036602020263671875, 0.0039058923721313477, 0.004151582717895508, 0.004397273063659668, 0.004642963409423828, 0.004888653755187988, 0.0051343441009521484, 0.005380034446716309, 0.005625724792480469, 0.005871415138244629, 0.006117105484008789, 0.006362795829772949, 0.006608486175537109, 0.0068541765213012695, 0.00709986686706543, 0.00734555721282959, 0.00759124755859375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 3.0, 7.0, 7.0, 13.0, 27.0, 41.0, 50.0, 87.0, 156.0, 187.0, 148.0, 91.0, 52.0, 37.0, 25.0, 19.0, 11.0, 5.0, 5.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006938934326171875, -0.006732940673828125, -0.006526947021484375, -0.006320953369140625, -0.006114959716796875, -0.005908966064453125, -0.005702972412109375, -0.005496978759765625, -0.005290985107421875, -0.005084991455078125, -0.004878997802734375, -0.004673004150390625, -0.004467010498046875, -0.004261016845703125, -0.004055023193359375, -0.003849029541015625, -0.003643035888671875, -0.003437042236328125, -0.003231048583984375, -0.003025054931640625, -0.002819061279296875, -0.002613067626953125, -0.002407073974609375, -0.002201080322265625, -0.001995086669921875, -0.001789093017578125, -0.001583099365234375, -0.001377105712890625, -0.001171112060546875, -0.000965118408203125, -0.000759124755859375, -0.000553131103515625, -0.000347137451171875, -0.000141143798828125, 6.4849853515625e-05, 0.000270843505859375, 0.000476837158203125, 0.000682830810546875, 0.000888824462890625, 0.001094818115234375, 0.001300811767578125, 0.001506805419921875, 0.001712799072265625, 0.001918792724609375, 0.002124786376953125, 0.002330780029296875, 0.002536773681640625, 0.002742767333984375, 0.002948760986328125, 0.003154754638671875, 0.003360748291015625, 0.003566741943359375, 0.003772735595703125, 0.003978729248046875, 0.004184722900390625, 0.004390716552734375, 0.004596710205078125, 0.004802703857421875, 0.005008697509765625, 0.005214691162109375, 0.005420684814453125, 0.005626678466796875, 0.005832672119140625, 0.006038665771484375, 0.006244659423828125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 14.0, 27.0, 54.0, 117.0, 188.0, 259.0, 192.0, 76.0, 41.0, 13.0, 11.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049316197633743286, -0.04650735855102539, -0.043698519468307495, -0.0408896803855896, -0.038080841302871704, -0.03527200222015381, -0.03246316313743591, -0.02965432219207287, -0.026845483109354973, -0.024036644026637077, -0.021227804943919182, -0.018418963998556137, -0.015610125847160816, -0.01280128676444292, -0.00999244675040245, -0.007183607667684555, -0.0043747685849666595, -0.0015659292694181204, 0.0012429100461304188, 0.004051749594509602, 0.006860588677227497, 0.009669427759945393, 0.012478267773985863, 0.015287106856703758, 0.018095945939421654, 0.02090478502213955, 0.023713624104857445, 0.02652246505022049, 0.029331304132938385, 0.03214014321565628, 0.034948982298374176, 0.03775782138109207, 0.04056666046380997, 0.04337549954652786, 0.04618433862924576, 0.048993177711963654, 0.05180201679468155, 0.054610855877399445, 0.05741969496011734, 0.060228534042835236, 0.06303737312555313, 0.06584621220827103, 0.06865505129098892, 0.07146389037370682, 0.07427272945642471, 0.07708156853914261, 0.0798904076218605, 0.0826992467045784, 0.08550809323787689, 0.08831693232059479, 0.09112577140331268, 0.09393461048603058, 0.09674344956874847, 0.09955228865146637, 0.10236112773418427, 0.10516996681690216, 0.10797880589962006, 0.11078764498233795, 0.11359648406505585, 0.11640532314777374, 0.11921416223049164, 0.12202300131320953, 0.12483184039592743, 0.12764067947864532, 0.13044951856136322]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 5.0, 3.0, 11.0, 12.0, 7.0, 9.0, 14.0, 21.0, 20.0, 20.0, 23.0, 27.0, 34.0, 26.0, 38.0, 36.0, 35.0, 37.0, 44.0, 42.0, 39.0, 41.0, 33.0, 39.0, 50.0, 35.0, 40.0, 34.0, 28.0, 27.0, 23.0, 17.0, 18.0, 17.0, 13.0, 16.0, 14.0, 8.0, 8.0, 10.0, 4.0, 7.0, 4.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.02602165937423706, -0.025179946795105934, -0.024338234215974808, -0.02349652163684368, -0.022654809057712555, -0.02181309647858143, -0.020971383899450302, -0.020129671320319176, -0.01928795874118805, -0.018446246162056923, -0.017604533582925797, -0.01676282100379467, -0.015921108424663544, -0.015079395845532417, -0.014237683266401291, -0.013395970687270164, -0.012554258108139038, -0.011712545529007912, -0.010870832949876785, -0.010029120370745659, -0.009187407791614532, -0.008345695212483406, -0.00750398263335228, -0.006662270054221153, -0.005820557475090027, -0.0049788448959589005, -0.004137132316827774, -0.0032954197376966476, -0.0024537071585655212, -0.0016119945794343948, -0.0007702820003032684, 7.143057882785797e-05, 0.0009131431579589844, 0.0017548557370901108, 0.002596568316221237, 0.0034382808953523636, 0.00427999347448349, 0.005121706053614616, 0.005963418632745743, 0.006805131211876869, 0.007646843791007996, 0.008488556370139122, 0.009330268949270248, 0.010171981528401375, 0.011013694107532501, 0.011855406686663628, 0.012697119265794754, 0.01353883184492588, 0.014380544424057007, 0.015222257003188133, 0.01606396958231926, 0.016905682161450386, 0.017747394740581512, 0.01858910731971264, 0.019430819898843765, 0.02027253247797489, 0.021114245057106018, 0.021955957636237144, 0.02279767021536827, 0.023639382794499397, 0.024481095373630524, 0.02532280795276165, 0.026164520531892776, 0.027006233111023903, 0.02784794569015503]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 6.0, 6.0, 10.0, 9.0, 8.0, 12.0, 19.0, 28.0, 35.0, 56.0, 81.0, 111.0, 181.0, 289.0, 498.0, 895.0, 1995.0, 5624.0, 19709.0, 96967.0, 2104508.0, 1842942.0, 92637.0, 17791.0, 5590.0, 2044.0, 933.0, 458.0, 292.0, 143.0, 119.0, 73.0, 58.0, 31.0, 28.0, 16.0, 18.0, 15.0, 8.0, 9.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.012115478515625, -0.011758923530578613, -0.011402368545532227, -0.01104581356048584, -0.010689258575439453, -0.010332703590393066, -0.00997614860534668, -0.009619593620300293, -0.009263038635253906, -0.00890648365020752, -0.008549928665161133, -0.008193373680114746, -0.00783681869506836, -0.007480263710021973, -0.007123708724975586, -0.006767153739929199, -0.0064105987548828125, -0.006054043769836426, -0.005697488784790039, -0.005340933799743652, -0.004984378814697266, -0.004627823829650879, -0.004271268844604492, -0.0039147138595581055, -0.0035581588745117188, -0.003201603889465332, -0.0028450489044189453, -0.0024884939193725586, -0.002131938934326172, -0.0017753839492797852, -0.0014188289642333984, -0.0010622739791870117, -0.000705718994140625, -0.0003491640090942383, 7.3909759521484375e-06, 0.00036394596099853516, 0.0007205009460449219, 0.0010770559310913086, 0.0014336109161376953, 0.001790165901184082, 0.0021467208862304688, 0.0025032758712768555, 0.002859830856323242, 0.003216385841369629, 0.0035729408264160156, 0.003929495811462402, 0.004286050796508789, 0.004642605781555176, 0.0049991607666015625, 0.005355715751647949, 0.005712270736694336, 0.006068825721740723, 0.006425380706787109, 0.006781935691833496, 0.007138490676879883, 0.0074950456619262695, 0.007851600646972656, 0.008208155632019043, 0.00856471061706543, 0.008921265602111816, 0.009277820587158203, 0.00963437557220459, 0.009990930557250977, 0.010347485542297363, 0.01070404052734375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 11.0, 11.0, 23.0, 26.0, 37.0, 53.0, 66.0, 73.0, 113.0, 119.0, 98.0, 87.0, 69.0, 64.0, 64.0, 35.0, 22.0, 17.0, 9.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00839996337890625, -0.008127093315124512, -0.007854223251342773, -0.007581353187561035, -0.007308483123779297, -0.007035613059997559, -0.00676274299621582, -0.006489872932434082, -0.006217002868652344, -0.0059441328048706055, -0.005671262741088867, -0.005398392677307129, -0.005125522613525391, -0.004852652549743652, -0.004579782485961914, -0.004306912422180176, -0.0040340423583984375, -0.0037611722946166992, -0.003488302230834961, -0.0032154321670532227, -0.0029425621032714844, -0.002669692039489746, -0.002396821975708008, -0.0021239519119262695, -0.0018510818481445312, -0.001578211784362793, -0.0013053417205810547, -0.0010324716567993164, -0.0007596015930175781, -0.00048673152923583984, -0.00021386146545410156, 5.900859832763672e-05, 0.000331878662109375, 0.0006047487258911133, 0.0008776187896728516, 0.0011504888534545898, 0.0014233589172363281, 0.0016962289810180664, 0.0019690990447998047, 0.002241969108581543, 0.0025148391723632812, 0.0027877092361450195, 0.003060579299926758, 0.003333449363708496, 0.0036063194274902344, 0.0038791894912719727, 0.004152059555053711, 0.004424929618835449, 0.0046977996826171875, 0.004970669746398926, 0.005243539810180664, 0.005516409873962402, 0.005789279937744141, 0.006062150001525879, 0.006335020065307617, 0.0066078901290893555, 0.006880760192871094, 0.007153630256652832, 0.00742650032043457, 0.007699370384216309, 0.007972240447998047, 0.008245110511779785, 0.008517980575561523, 0.008790850639343262, 0.009063720703125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 14.0, 8.0, 11.0, 32.0, 50.0, 59.0, 99.0, 170.0, 252.0, 458.0, 792.0, 1613.0, 3473.0, 7448.0, 18464.0, 52578.0, 198791.0, 2017266.0, 1635923.0, 177351.0, 48171.0, 17332.0, 7110.0, 3231.0, 1655.0, 813.0, 444.0, 239.0, 173.0, 100.0, 57.0, 31.0, 24.0, 14.0, 11.0, 5.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006290435791015625, -0.006048142910003662, -0.005805850028991699, -0.005563557147979736, -0.0053212642669677734, -0.0050789713859558105, -0.004836678504943848, -0.004594385623931885, -0.004352092742919922, -0.004109799861907959, -0.003867506980895996, -0.003625214099884033, -0.0033829212188720703, -0.0031406283378601074, -0.0028983354568481445, -0.0026560425758361816, -0.0024137496948242188, -0.002171456813812256, -0.001929163932800293, -0.00168687105178833, -0.0014445781707763672, -0.0012022852897644043, -0.0009599924087524414, -0.0007176995277404785, -0.0004754066467285156, -0.00023311376571655273, 9.179115295410156e-06, 0.00025147199630737305, 0.0004937648773193359, 0.0007360577583312988, 0.0009783506393432617, 0.0012206435203552246, 0.0014629364013671875, 0.0017052292823791504, 0.0019475221633911133, 0.002189815044403076, 0.002432107925415039, 0.002674400806427002, 0.002916693687438965, 0.0031589865684509277, 0.0034012794494628906, 0.0036435723304748535, 0.0038858652114868164, 0.004128158092498779, 0.004370450973510742, 0.004612743854522705, 0.004855036735534668, 0.005097329616546631, 0.005339622497558594, 0.005581915378570557, 0.0058242082595825195, 0.006066501140594482, 0.006308794021606445, 0.006551086902618408, 0.006793379783630371, 0.007035672664642334, 0.007277965545654297, 0.00752025842666626, 0.007762551307678223, 0.008004844188690186, 0.008247137069702148, 0.008489429950714111, 0.008731722831726074, 0.008974015712738037, 0.00921630859375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 8.0, 10.0, 12.0, 15.0, 21.0, 33.0, 52.0, 49.0, 77.0, 124.0, 232.0, 479.0, 880.0, 931.0, 493.0, 223.0, 135.0, 81.0, 63.0, 43.0, 24.0, 17.0, 19.0, 14.0, 13.0, 8.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00957489013671875, -0.009284377098083496, -0.008993864059448242, -0.008703351020812988, -0.008412837982177734, -0.00812232494354248, -0.007831811904907227, -0.007541298866271973, -0.007250785827636719, -0.006960272789001465, -0.006669759750366211, -0.006379246711730957, -0.006088733673095703, -0.005798220634460449, -0.005507707595825195, -0.005217194557189941, -0.0049266815185546875, -0.004636168479919434, -0.00434565544128418, -0.004055142402648926, -0.003764629364013672, -0.003474116325378418, -0.003183603286743164, -0.00289309024810791, -0.0026025772094726562, -0.0023120641708374023, -0.0020215511322021484, -0.0017310380935668945, -0.0014405250549316406, -0.0011500120162963867, -0.0008594989776611328, -0.0005689859390258789, -0.000278472900390625, 1.2040138244628906e-05, 0.0003025531768798828, 0.0005930662155151367, 0.0008835792541503906, 0.0011740922927856445, 0.0014646053314208984, 0.0017551183700561523, 0.0020456314086914062, 0.00233614444732666, 0.002626657485961914, 0.002917170524597168, 0.003207683563232422, 0.0034981966018676758, 0.0037887096405029297, 0.004079222679138184, 0.0043697357177734375, 0.004660248756408691, 0.004950761795043945, 0.005241274833679199, 0.005531787872314453, 0.005822300910949707, 0.006112813949584961, 0.006403326988220215, 0.006693840026855469, 0.006984353065490723, 0.0072748661041259766, 0.0075653791427612305, 0.007855892181396484, 0.008146405220031738, 0.008436918258666992, 0.008727431297302246, 0.0090179443359375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 8.0, 20.0, 18.0, 47.0, 74.0, 152.0, 214.0, 187.0, 116.0, 74.0, 51.0, 13.0, 15.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06653587520122528, -0.064447320997715, -0.06235876679420471, -0.06027021259069443, -0.05818165838718414, -0.05609310418367386, -0.054004549980163574, -0.05191599577665329, -0.049827441573143005, -0.04773888736963272, -0.045650333166122437, -0.04356177896261215, -0.04147322475910187, -0.03938467055559158, -0.0372961163520813, -0.035207562148571014, -0.03311900794506073, -0.031030453741550446, -0.02894189953804016, -0.026853345334529877, -0.024764791131019592, -0.022676236927509308, -0.020587682723999023, -0.01849912852048874, -0.016410574316978455, -0.01432202011346817, -0.012233465909957886, -0.010144911706447601, -0.008056357502937317, -0.0059678032994270325, -0.003879249095916748, -0.0017906948924064636, 0.0002978667616844177, 0.002386420965194702, 0.004474975168704987, 0.006563529372215271, 0.008652083575725555, 0.01074063777923584, 0.012829191982746124, 0.014917746186256409, 0.017006300389766693, 0.019094854593276978, 0.021183408796787262, 0.023271963000297546, 0.02536051720380783, 0.027449071407318115, 0.0295376256108284, 0.031626179814338684, 0.03371473401784897, 0.03580328822135925, 0.03789184242486954, 0.03998039662837982, 0.042068950831890106, 0.04415750503540039, 0.046246059238910675, 0.04833461344242096, 0.050423167645931244, 0.05251172184944153, 0.05460027605295181, 0.0566888302564621, 0.05877738445997238, 0.060865938663482666, 0.06295449286699295, 0.06504304707050323, 0.06713160127401352]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 5.0, 6.0, 8.0, 9.0, 20.0, 14.0, 16.0, 25.0, 25.0, 26.0, 25.0, 27.0, 33.0, 40.0, 41.0, 60.0, 40.0, 49.0, 47.0, 48.0, 52.0, 53.0, 42.0, 34.0, 33.0, 34.0, 25.0, 31.0, 20.0, 27.0, 12.0, 13.0, 18.0, 14.0, 7.0, 4.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023464739322662354, -0.022655023261904716, -0.02184530720114708, -0.021035591140389442, -0.020225875079631805, -0.01941615901887417, -0.01860644295811653, -0.017796726897358894, -0.016987010836601257, -0.01617729477584362, -0.015367578715085983, -0.014557862654328346, -0.01374814659357071, -0.012938430532813072, -0.012128714472055435, -0.011318998411297798, -0.010509282350540161, -0.009699566289782524, -0.008889850229024887, -0.00808013416826725, -0.007270418107509613, -0.006460702046751976, -0.005650985985994339, -0.004841269925236702, -0.004031553864479065, -0.003221837803721428, -0.002412121742963791, -0.0016024056822061539, -0.0007926896214485168, 1.7026439309120178e-05, 0.0008267425000667572, 0.0016364585608243942, 0.0024461746215820312, 0.0032558906823396683, 0.004065606743097305, 0.004875322803854942, 0.005685038864612579, 0.006494754925370216, 0.007304470986127853, 0.00811418704688549, 0.008923903107643127, 0.009733619168400764, 0.010543335229158401, 0.011353051289916039, 0.012162767350673676, 0.012972483411431313, 0.01378219947218895, 0.014591915532946587, 0.015401631593704224, 0.01621134765446186, 0.017021063715219498, 0.017830779775977135, 0.01864049583673477, 0.01945021189749241, 0.020259927958250046, 0.021069644019007683, 0.02187936007976532, 0.022689076140522957, 0.023498792201280594, 0.02430850826203823, 0.025118224322795868, 0.025927940383553505, 0.026737656444311142, 0.02754737250506878, 0.028357088565826416]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 10.0, 13.0, 16.0, 19.0, 27.0, 50.0, 90.0, 153.0, 267.0, 574.0, 1536.0, 5487.0, 33469.0, 391254.0, 560304.0, 45135.0, 6932.0, 1855.0, 651.0, 297.0, 144.0, 99.0, 58.0, 39.0, 19.0, 19.0, 9.0, 3.0, 5.0, 6.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030303955078125, -0.029359102249145508, -0.028414249420166016, -0.027469396591186523, -0.02652454376220703, -0.02557969093322754, -0.024634838104248047, -0.023689985275268555, -0.022745132446289062, -0.02180027961730957, -0.020855426788330078, -0.019910573959350586, -0.018965721130371094, -0.0180208683013916, -0.01707601547241211, -0.016131162643432617, -0.015186309814453125, -0.014241456985473633, -0.01329660415649414, -0.012351751327514648, -0.011406898498535156, -0.010462045669555664, -0.009517192840576172, -0.00857234001159668, -0.0076274871826171875, -0.006682634353637695, -0.005737781524658203, -0.004792928695678711, -0.0038480758666992188, -0.0029032230377197266, -0.0019583702087402344, -0.0010135173797607422, -6.866455078125e-05, 0.0008761882781982422, 0.0018210411071777344, 0.0027658939361572266, 0.0037107467651367188, 0.004655599594116211, 0.005600452423095703, 0.006545305252075195, 0.0074901580810546875, 0.00843501091003418, 0.009379863739013672, 0.010324716567993164, 0.011269569396972656, 0.012214422225952148, 0.01315927505493164, 0.014104127883911133, 0.015048980712890625, 0.015993833541870117, 0.01693868637084961, 0.0178835391998291, 0.018828392028808594, 0.019773244857788086, 0.020718097686767578, 0.02166295051574707, 0.022607803344726562, 0.023552656173706055, 0.024497509002685547, 0.02544236183166504, 0.02638721466064453, 0.027332067489624023, 0.028276920318603516, 0.029221773147583008, 0.0301666259765625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 8.0, 13.0, 18.0, 36.0, 42.0, 61.0, 71.0, 92.0, 99.0, 106.0, 86.0, 96.0, 77.0, 66.0, 42.0, 35.0, 23.0, 15.0, 8.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007396697998046875, -0.007128417491912842, -0.006860136985778809, -0.006591856479644775, -0.006323575973510742, -0.006055295467376709, -0.005787014961242676, -0.005518734455108643, -0.005250453948974609, -0.004982173442840576, -0.004713892936706543, -0.00444561243057251, -0.0041773319244384766, -0.003909051418304443, -0.00364077091217041, -0.003372490406036377, -0.0031042098999023438, -0.0028359293937683105, -0.0025676488876342773, -0.002299368381500244, -0.002031087875366211, -0.0017628073692321777, -0.0014945268630981445, -0.0012262463569641113, -0.0009579658508300781, -0.0006896853446960449, -0.0004214048385620117, -0.00015312433242797852, 0.00011515617370605469, 0.0003834366798400879, 0.0006517171859741211, 0.0009199976921081543, 0.0011882781982421875, 0.0014565587043762207, 0.001724839210510254, 0.001993119716644287, 0.0022614002227783203, 0.0025296807289123535, 0.0027979612350463867, 0.00306624174118042, 0.003334522247314453, 0.0036028027534484863, 0.0038710832595825195, 0.004139363765716553, 0.004407644271850586, 0.004675924777984619, 0.004944205284118652, 0.0052124857902526855, 0.005480766296386719, 0.005749046802520752, 0.006017327308654785, 0.006285607814788818, 0.0065538883209228516, 0.006822168827056885, 0.007090449333190918, 0.007358729839324951, 0.007627010345458984, 0.007895290851593018, 0.00816357135772705, 0.008431851863861084, 0.008700132369995117, 0.00896841287612915, 0.009236693382263184, 0.009504973888397217, 0.00977325439453125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 4.0, 9.0, 8.0, 14.0, 14.0, 19.0, 29.0, 31.0, 58.0, 87.0, 119.0, 203.0, 368.0, 735.0, 1560.0, 3835.0, 9957.0, 30805.0, 116206.0, 554295.0, 249760.0, 54020.0, 16090.0, 5710.0, 2281.0, 1013.0, 515.0, 281.0, 174.0, 85.0, 78.0, 48.0, 31.0, 20.0, 21.0, 14.0, 13.0, 10.0, 7.0, 7.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.017578125, -0.01704096794128418, -0.01650381088256836, -0.01596665382385254, -0.015429496765136719, -0.014892339706420898, -0.014355182647705078, -0.013818025588989258, -0.013280868530273438, -0.012743711471557617, -0.012206554412841797, -0.011669397354125977, -0.011132240295410156, -0.010595083236694336, -0.010057926177978516, -0.009520769119262695, -0.008983612060546875, -0.008446455001831055, -0.007909297943115234, -0.007372140884399414, -0.006834983825683594, -0.0062978267669677734, -0.005760669708251953, -0.005223512649536133, -0.0046863555908203125, -0.004149198532104492, -0.003612041473388672, -0.0030748844146728516, -0.0025377273559570312, -0.002000570297241211, -0.0014634132385253906, -0.0009262561798095703, -0.00038909912109375, 0.0001480579376220703, 0.0006852149963378906, 0.001222372055053711, 0.0017595291137695312, 0.0022966861724853516, 0.002833843231201172, 0.003371000289916992, 0.0039081573486328125, 0.004445314407348633, 0.004982471466064453, 0.0055196285247802734, 0.006056785583496094, 0.006593942642211914, 0.007131099700927734, 0.007668256759643555, 0.008205413818359375, 0.008742570877075195, 0.009279727935791016, 0.009816884994506836, 0.010354042053222656, 0.010891199111938477, 0.011428356170654297, 0.011965513229370117, 0.012502670288085938, 0.013039827346801758, 0.013576984405517578, 0.014114141464233398, 0.014651298522949219, 0.015188455581665039, 0.01572561264038086, 0.01626276969909668, 0.0167999267578125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 2.0, 3.0, 9.0, 5.0, 16.0, 15.0, 12.0, 17.0, 11.0, 25.0, 28.0, 22.0, 45.0, 36.0, 41.0, 50.0, 48.0, 51.0, 60.0, 54.0, 52.0, 53.0, 50.0, 31.0, 38.0, 35.0, 34.0, 27.0, 25.0, 22.0, 16.0, 18.0, 7.0, 9.0, 8.0, 4.0, 2.0, 11.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.01390838623046875, -0.01349496841430664, -0.013081550598144531, -0.012668132781982422, -0.012254714965820312, -0.011841297149658203, -0.011427879333496094, -0.011014461517333984, -0.010601043701171875, -0.010187625885009766, -0.009774208068847656, -0.009360790252685547, -0.008947372436523438, -0.008533954620361328, -0.008120536804199219, -0.007707118988037109, -0.007293701171875, -0.006880283355712891, -0.006466865539550781, -0.006053447723388672, -0.0056400299072265625, -0.005226612091064453, -0.004813194274902344, -0.004399776458740234, -0.003986358642578125, -0.0035729408264160156, -0.0031595230102539062, -0.002746105194091797, -0.0023326873779296875, -0.0019192695617675781, -0.0015058517456054688, -0.0010924339294433594, -0.00067901611328125, -0.0002655982971191406, 0.00014781951904296875, 0.0005612373352050781, 0.0009746551513671875, 0.0013880729675292969, 0.0018014907836914062, 0.0022149085998535156, 0.002628326416015625, 0.0030417442321777344, 0.0034551620483398438, 0.003868579864501953, 0.0042819976806640625, 0.004695415496826172, 0.005108833312988281, 0.005522251129150391, 0.0059356689453125, 0.006349086761474609, 0.006762504577636719, 0.007175922393798828, 0.0075893402099609375, 0.008002758026123047, 0.008416175842285156, 0.008829593658447266, 0.009243011474609375, 0.009656429290771484, 0.010069847106933594, 0.010483264923095703, 0.010896682739257812, 0.011310100555419922, 0.011723518371582031, 0.01213693618774414, 0.01255035400390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 9.0, 15.0, 21.0, 27.0, 31.0, 72.0, 92.0, 161.0, 306.0, 491.0, 1158.0, 2820.0, 7541.0, 21723.0, 71591.0, 340874.0, 461484.0, 96635.0, 27752.0, 9452.0, 3496.0, 1399.0, 631.0, 309.0, 150.0, 104.0, 63.0, 41.0, 36.0, 10.0, 14.0, 7.0, 7.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004787445068359375, -0.004633545875549316, -0.004479646682739258, -0.004325747489929199, -0.004171848297119141, -0.004017949104309082, -0.0038640499114990234, -0.003710150718688965, -0.0035562515258789062, -0.0034023523330688477, -0.003248453140258789, -0.0030945539474487305, -0.002940654754638672, -0.0027867555618286133, -0.0026328563690185547, -0.002478957176208496, -0.0023250579833984375, -0.002171158790588379, -0.0020172595977783203, -0.0018633604049682617, -0.0017094612121582031, -0.0015555620193481445, -0.001401662826538086, -0.0012477636337280273, -0.0010938644409179688, -0.0009399652481079102, -0.0007860660552978516, -0.000632166862487793, -0.0004782676696777344, -0.0003243684768676758, -0.0001704692840576172, -1.6570091247558594e-05, 0.0001373291015625, 0.0002912282943725586, 0.0004451274871826172, 0.0005990266799926758, 0.0007529258728027344, 0.000906825065612793, 0.0010607242584228516, 0.0012146234512329102, 0.0013685226440429688, 0.0015224218368530273, 0.001676321029663086, 0.0018302202224731445, 0.001984119415283203, 0.0021380186080932617, 0.0022919178009033203, 0.002445816993713379, 0.0025997161865234375, 0.002753615379333496, 0.0029075145721435547, 0.0030614137649536133, 0.003215312957763672, 0.0033692121505737305, 0.003523111343383789, 0.0036770105361938477, 0.0038309097290039062, 0.003984808921813965, 0.0041387081146240234, 0.004292607307434082, 0.004446506500244141, 0.004600405693054199, 0.004754304885864258, 0.004908204078674316, 0.005062103271484375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 9.0, 0.0, 6.0, 3.0, 12.0, 12.0, 15.0, 0.0, 23.0, 32.0, 27.0, 29.0, 0.0, 34.0, 33.0, 63.0, 58.0, 0.0, 64.0, 51.0, 74.0, 56.0, 55.0, 0.0, 48.0, 54.0, 48.0, 46.0, 0.0, 20.0, 29.0, 20.0, 16.0, 0.0, 12.0, 14.0, 8.0, 9.0, 8.0, 0.0, 3.0, 6.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.6689300537109375e-06, -1.6205012798309326e-06, -1.5720725059509277e-06, -1.5236437320709229e-06, -1.475214958190918e-06, -1.426786184310913e-06, -1.3783574104309082e-06, -1.3299286365509033e-06, -1.2814998626708984e-06, -1.2330710887908936e-06, -1.1846423149108887e-06, -1.1362135410308838e-06, -1.087784767150879e-06, -1.039355993270874e-06, -9.909272193908691e-07, -9.424984455108643e-07, -8.940696716308594e-07, -8.456408977508545e-07, -7.972121238708496e-07, -7.487833499908447e-07, -7.003545761108398e-07, -6.51925802230835e-07, -6.034970283508301e-07, -5.550682544708252e-07, -5.066394805908203e-07, -4.5821070671081543e-07, -4.0978193283081055e-07, -3.6135315895080566e-07, -3.129243850708008e-07, -2.644956111907959e-07, -2.1606683731079102e-07, -1.6763806343078613e-07, -1.1920928955078125e-07, -7.078051567077637e-08, -2.2351741790771484e-08, 2.60770320892334e-08, 7.450580596923828e-08, 1.2293457984924316e-07, 1.7136335372924805e-07, 2.1979212760925293e-07, 2.682209014892578e-07, 3.166496753692627e-07, 3.650784492492676e-07, 4.1350722312927246e-07, 4.6193599700927734e-07, 5.103647708892822e-07, 5.587935447692871e-07, 6.07222318649292e-07, 6.556510925292969e-07, 7.040798664093018e-07, 7.525086402893066e-07, 8.009374141693115e-07, 8.493661880493164e-07, 8.977949619293213e-07, 9.462237358093262e-07, 9.94652509689331e-07, 1.043081283569336e-06, 1.0915100574493408e-06, 1.1399388313293457e-06, 1.1883676052093506e-06, 1.2367963790893555e-06, 1.2852251529693604e-06, 1.3336539268493652e-06, 1.3820827007293701e-06, 1.430511474609375e-06]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 7.0, 16.0, 26.0, 33.0, 56.0, 122.0, 263.0, 577.0, 1496.0, 5029.0, 24153.0, 182338.0, 727478.0, 87377.0, 14382.0, 3293.0, 1047.0, 438.0, 185.0, 93.0, 56.0, 30.0, 20.0, 14.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00771331787109375, -0.007441163063049316, -0.007169008255004883, -0.006896853446960449, -0.006624698638916016, -0.006352543830871582, -0.0060803890228271484, -0.005808234214782715, -0.005536079406738281, -0.005263924598693848, -0.004991769790649414, -0.0047196149826049805, -0.004447460174560547, -0.004175305366516113, -0.0039031505584716797, -0.003630995750427246, -0.0033588409423828125, -0.003086686134338379, -0.0028145313262939453, -0.0025423765182495117, -0.002270221710205078, -0.0019980669021606445, -0.001725912094116211, -0.0014537572860717773, -0.0011816024780273438, -0.0009094476699829102, -0.0006372928619384766, -0.00036513805389404297, -9.298324584960938e-05, 0.00017917156219482422, 0.0004513263702392578, 0.0007234811782836914, 0.000995635986328125, 0.0012677907943725586, 0.0015399456024169922, 0.0018121004104614258, 0.0020842552185058594, 0.002356410026550293, 0.0026285648345947266, 0.00290071964263916, 0.0031728744506835938, 0.0034450292587280273, 0.003717184066772461, 0.0039893388748168945, 0.004261493682861328, 0.004533648490905762, 0.004805803298950195, 0.005077958106994629, 0.0053501129150390625, 0.005622267723083496, 0.00589442253112793, 0.006166577339172363, 0.006438732147216797, 0.0067108869552612305, 0.006983041763305664, 0.007255196571350098, 0.007527351379394531, 0.007799506187438965, 0.008071660995483398, 0.008343815803527832, 0.008615970611572266, 0.0088881254196167, 0.009160280227661133, 0.009432435035705566, 0.00970458984375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 4.0, 6.0, 13.0, 12.0, 21.0, 26.0, 38.0, 54.0, 71.0, 102.0, 143.0, 119.0, 120.0, 69.0, 49.0, 39.0, 23.0, 20.0, 13.0, 16.0, 13.0, 6.0, 8.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005054473876953125, -0.004873991012573242, -0.004693508148193359, -0.0045130252838134766, -0.004332542419433594, -0.004152059555053711, -0.003971576690673828, -0.0037910938262939453, -0.0036106109619140625, -0.0034301280975341797, -0.003249645233154297, -0.003069162368774414, -0.0028886795043945312, -0.0027081966400146484, -0.0025277137756347656, -0.002347230911254883, -0.002166748046875, -0.001986265182495117, -0.0018057823181152344, -0.0016252994537353516, -0.0014448165893554688, -0.001264333724975586, -0.0010838508605957031, -0.0009033679962158203, -0.0007228851318359375, -0.0005424022674560547, -0.0003619194030761719, -0.00018143653869628906, -9.5367431640625e-07, 0.00017952919006347656, 0.0003600120544433594, 0.0005404949188232422, 0.000720977783203125, 0.0009014606475830078, 0.0010819435119628906, 0.0012624263763427734, 0.0014429092407226562, 0.001623392105102539, 0.0018038749694824219, 0.0019843578338623047, 0.0021648406982421875, 0.0023453235626220703, 0.002525806427001953, 0.002706289291381836, 0.0028867721557617188, 0.0030672550201416016, 0.0032477378845214844, 0.003428220748901367, 0.00360870361328125, 0.003789186477661133, 0.003969669342041016, 0.0041501522064208984, 0.004330635070800781, 0.004511117935180664, 0.004691600799560547, 0.00487208366394043, 0.0050525665283203125, 0.005233049392700195, 0.005413532257080078, 0.005594015121459961, 0.005774497985839844, 0.0059549808502197266, 0.006135463714599609, 0.006315946578979492, 0.006496429443359375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 12.0, 11.0, 23.0, 84.0, 160.0, 260.0, 195.0, 134.0, 59.0, 27.0, 15.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08269111812114716, -0.0799342468380928, -0.07717737555503845, -0.0744204968214035, -0.07166362553834915, -0.0689067542552948, -0.06614987552165985, -0.0633930042386055, -0.06063613295555115, -0.057879261672496796, -0.055122386664152145, -0.052365511655807495, -0.04960864037275314, -0.04685176908969879, -0.04409489408135414, -0.04133801907300949, -0.03858114778995514, -0.03582427650690079, -0.03306740149855614, -0.030310528352856636, -0.027553655207157135, -0.024796782061457634, -0.022039908915758133, -0.019283035770058632, -0.01652616262435913, -0.01376928947865963, -0.011012416332960129, -0.008255543187260628, -0.005498670041561127, -0.0027417968958616257, 1.5076249837875366e-05, 0.0027719493955373764, 0.005528829991817474, 0.008285703137516975, 0.011042576283216476, 0.013799449428915977, 0.01655632257461548, 0.01931319572031498, 0.02207006886601448, 0.02482694201171398, 0.027583815157413483, 0.030340688303112984, 0.033097561448812485, 0.035854436457157135, 0.03861130774021149, 0.04136817902326584, 0.04412505403161049, 0.04688192903995514, 0.04963880032300949, 0.05239567160606384, 0.05515254661440849, 0.05790942162275314, 0.060666292905807495, 0.06342316418886185, 0.0661800354719162, 0.06893691420555115, 0.0716937854886055, 0.07445065677165985, 0.0772075355052948, 0.07996440678834915, 0.0827212780714035, 0.08547814935445786, 0.08823502063751221, 0.09099189937114716, 0.09374877065420151]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 6.0, 8.0, 9.0, 13.0, 14.0, 22.0, 17.0, 28.0, 34.0, 40.0, 37.0, 37.0, 40.0, 43.0, 39.0, 56.0, 46.0, 48.0, 48.0, 51.0, 41.0, 37.0, 43.0, 31.0, 39.0, 28.0, 28.0, 20.0, 23.0, 15.0, 16.0, 8.0, 10.0, 10.0, 5.0, 1.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03858065605163574, -0.03752383217215538, -0.03646700829267502, -0.03541018068790436, -0.034353356808423996, -0.033296532928943634, -0.032239705324172974, -0.03118288144469261, -0.03012605756521225, -0.029069233685731888, -0.028012407943606377, -0.026955582201480865, -0.025898758322000504, -0.02484193444252014, -0.02378510870039463, -0.02272828295826912, -0.021671459078788757, -0.020614635199308395, -0.019557809457182884, -0.018500983715057373, -0.01744415983557701, -0.01638733595609665, -0.015330510213971138, -0.014273685403168201, -0.013216860592365265, -0.012160035781562328, -0.011103210970759392, -0.010046386159956455, -0.008989561349153519, -0.007932736538350582, -0.006875911727547646, -0.005819086916744709, -0.0047622621059417725, -0.003705437295138836, -0.0026486124843358994, -0.0015917876735329628, -0.0005349628627300262, 0.0005218619480729103, 0.0015786867588758469, 0.0026355115696787834, 0.00369233638048172, 0.0047491611912846565, 0.005805986002087593, 0.00686281081289053, 0.007919635623693466, 0.008976460434496403, 0.01003328524529934, 0.011090110056102276, 0.012146934866905212, 0.013203759677708149, 0.014260584488511086, 0.015317409299314022, 0.01637423411011696, 0.01743105798959732, 0.01848788373172283, 0.019544709473848343, 0.020601533353328705, 0.021658357232809067, 0.022715182974934578, 0.02377200871706009, 0.02482883259654045, 0.025885656476020813, 0.026942482218146324, 0.027999307960271835, 0.029056131839752197]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 7.0, 10.0, 13.0, 8.0, 28.0, 25.0, 34.0, 73.0, 84.0, 152.0, 293.0, 522.0, 1321.0, 3874.0, 13808.0, 58182.0, 831422.0, 3040269.0, 204989.0, 27545.0, 7228.0, 2345.0, 928.0, 432.0, 221.0, 161.0, 92.0, 56.0, 34.0, 32.0, 22.0, 20.0, 15.0, 16.0, 3.0, 6.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0107574462890625, -0.010377049446105957, -0.009996652603149414, -0.009616255760192871, -0.009235858917236328, -0.008855462074279785, -0.008475065231323242, -0.0080946683883667, -0.007714271545410156, -0.007333874702453613, -0.00695347785949707, -0.006573081016540527, -0.006192684173583984, -0.005812287330627441, -0.0054318904876708984, -0.0050514936447143555, -0.0046710968017578125, -0.0042906999588012695, -0.0039103031158447266, -0.0035299062728881836, -0.0031495094299316406, -0.0027691125869750977, -0.0023887157440185547, -0.0020083189010620117, -0.0016279220581054688, -0.0012475252151489258, -0.0008671283721923828, -0.00048673152923583984, -0.00010633468627929688, 0.0002740621566772461, 0.0006544589996337891, 0.001034855842590332, 0.001415252685546875, 0.001795649528503418, 0.002176046371459961, 0.002556443214416504, 0.002936840057373047, 0.00331723690032959, 0.003697633743286133, 0.004078030586242676, 0.004458427429199219, 0.004838824272155762, 0.005219221115112305, 0.005599617958068848, 0.005980014801025391, 0.006360411643981934, 0.0067408084869384766, 0.0071212053298950195, 0.0075016021728515625, 0.007881999015808105, 0.008262395858764648, 0.008642792701721191, 0.009023189544677734, 0.009403586387634277, 0.00978398323059082, 0.010164380073547363, 0.010544776916503906, 0.01092517375946045, 0.011305570602416992, 0.011685967445373535, 0.012066364288330078, 0.012446761131286621, 0.012827157974243164, 0.013207554817199707, 0.01358795166015625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 8.0, 16.0, 7.0, 44.0, 43.0, 57.0, 70.0, 88.0, 80.0, 93.0, 103.0, 96.0, 86.0, 70.0, 45.0, 26.0, 21.0, 17.0, 9.0, 4.0, 5.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00768280029296875, -0.007415175437927246, -0.007147550582885742, -0.006879925727844238, -0.006612300872802734, -0.0063446760177612305, -0.0060770511627197266, -0.005809426307678223, -0.005541801452636719, -0.005274176597595215, -0.005006551742553711, -0.004738926887512207, -0.004471302032470703, -0.004203677177429199, -0.003936052322387695, -0.0036684274673461914, -0.0034008026123046875, -0.0031331777572631836, -0.0028655529022216797, -0.0025979280471801758, -0.002330303192138672, -0.002062678337097168, -0.001795053482055664, -0.0015274286270141602, -0.0012598037719726562, -0.0009921789169311523, -0.0007245540618896484, -0.00045692920684814453, -0.00018930435180664062, 7.832050323486328e-05, 0.0003459453582763672, 0.0006135702133178711, 0.000881195068359375, 0.001148819923400879, 0.0014164447784423828, 0.0016840696334838867, 0.0019516944885253906, 0.0022193193435668945, 0.0024869441986083984, 0.0027545690536499023, 0.0030221939086914062, 0.00328981876373291, 0.003557443618774414, 0.003825068473815918, 0.004092693328857422, 0.004360318183898926, 0.00462794303894043, 0.004895567893981934, 0.0051631927490234375, 0.005430817604064941, 0.005698442459106445, 0.005966067314147949, 0.006233692169189453, 0.006501317024230957, 0.006768941879272461, 0.007036566734313965, 0.007304191589355469, 0.007571816444396973, 0.007839441299438477, 0.00810706615447998, 0.008374691009521484, 0.008642315864562988, 0.008909940719604492, 0.009177565574645996, 0.0094451904296875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 10.0, 10.0, 10.0, 22.0, 18.0, 23.0, 47.0, 46.0, 76.0, 122.0, 178.0, 352.0, 740.0, 2055.0, 6395.0, 24269.0, 135816.0, 2528974.0, 1372190.0, 95916.0, 18570.0, 5202.0, 1654.0, 651.0, 332.0, 191.0, 112.0, 65.0, 61.0, 34.0, 34.0, 22.0, 16.0, 9.0, 14.0, 8.0, 12.0, 5.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01300048828125, -0.012579917907714844, -0.012159347534179688, -0.011738777160644531, -0.011318206787109375, -0.010897636413574219, -0.010477066040039062, -0.010056495666503906, -0.00963592529296875, -0.009215354919433594, -0.008794784545898438, -0.008374214172363281, -0.007953643798828125, -0.007533073425292969, -0.0071125030517578125, -0.006691932678222656, -0.0062713623046875, -0.005850791931152344, -0.0054302215576171875, -0.005009651184082031, -0.004589080810546875, -0.004168510437011719, -0.0037479400634765625, -0.0033273696899414062, -0.00290679931640625, -0.0024862289428710938, -0.0020656585693359375, -0.0016450881958007812, -0.001224517822265625, -0.0008039474487304688, -0.0003833770751953125, 3.719329833984375e-05, 0.000457763671875, 0.0008783340454101562, 0.0012989044189453125, 0.0017194747924804688, 0.002140045166015625, 0.0025606155395507812, 0.0029811859130859375, 0.0034017562866210938, 0.00382232666015625, 0.004242897033691406, 0.0046634674072265625, 0.005084037780761719, 0.005504608154296875, 0.005925178527832031, 0.0063457489013671875, 0.006766319274902344, 0.0071868896484375, 0.007607460021972656, 0.008028030395507812, 0.008448600769042969, 0.008869171142578125, 0.009289741516113281, 0.009710311889648438, 0.010130882263183594, 0.01055145263671875, 0.010972023010253906, 0.011392593383789062, 0.011813163757324219, 0.012233734130859375, 0.012654304504394531, 0.013074874877929688, 0.013495445251464844, 0.013916015625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 7.0, 12.0, 22.0, 24.0, 32.0, 48.0, 53.0, 91.0, 140.0, 223.0, 392.0, 813.0, 948.0, 508.0, 276.0, 156.0, 93.0, 72.0, 60.0, 23.0, 15.0, 17.0, 13.0, 6.0, 11.0, 7.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007625579833984375, -0.007265269756317139, -0.006904959678649902, -0.006544649600982666, -0.00618433952331543, -0.005824029445648193, -0.005463719367980957, -0.005103409290313721, -0.004743099212646484, -0.004382789134979248, -0.004022479057312012, -0.0036621689796447754, -0.003301858901977539, -0.0029415488243103027, -0.0025812387466430664, -0.00222092866897583, -0.0018606185913085938, -0.0015003085136413574, -0.001139998435974121, -0.0007796883583068848, -0.00041937828063964844, -5.906820297241211e-05, 0.0003012418746948242, 0.0006615519523620605, 0.0010218620300292969, 0.0013821721076965332, 0.0017424821853637695, 0.002102792263031006, 0.002463102340698242, 0.0028234124183654785, 0.003183722496032715, 0.003544032573699951, 0.0039043426513671875, 0.004264652729034424, 0.00462496280670166, 0.0049852728843688965, 0.005345582962036133, 0.005705893039703369, 0.0060662031173706055, 0.006426513195037842, 0.006786823272705078, 0.0071471333503723145, 0.007507443428039551, 0.007867753505706787, 0.008228063583374023, 0.00858837366104126, 0.008948683738708496, 0.009308993816375732, 0.009669303894042969, 0.010029613971710205, 0.010389924049377441, 0.010750234127044678, 0.011110544204711914, 0.01147085428237915, 0.011831164360046387, 0.012191474437713623, 0.01255178451538086, 0.012912094593048096, 0.013272404670715332, 0.013632714748382568, 0.013993024826049805, 0.014353334903717041, 0.014713644981384277, 0.015073955059051514, 0.01543426513671875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 16.0, 41.0, 93.0, 187.0, 224.0, 215.0, 128.0, 39.0, 25.0, 13.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09859433025121689, -0.09526361525058746, -0.09193290770053864, -0.08860219269990921, -0.08527148514986038, -0.08194077014923096, -0.07861006259918213, -0.0752793475985527, -0.07194863259792328, -0.06861791759729385, -0.06528721004724503, -0.0619564950466156, -0.058625783771276474, -0.05529507249593735, -0.05196436122059822, -0.048633649945259094, -0.04530293866991997, -0.04197222739458084, -0.038641516119241714, -0.03531080484390259, -0.03198008984327316, -0.028649378567934036, -0.02531866729259491, -0.021987954154610634, -0.018657242879271507, -0.015326530672609806, -0.011995818465948105, -0.008665107190608978, -0.005334394983947277, -0.002003682777285576, 0.0013270284980535507, 0.0046577416360378265, 0.007988452911376953, 0.011319165118038654, 0.014649877324700356, 0.017980588600039482, 0.021311301738023758, 0.024642013013362885, 0.02797272428870201, 0.03130343556404114, 0.03463415056467056, 0.03796486184000969, 0.041295573115348816, 0.04462628811597824, 0.04795699939131737, 0.051287710666656494, 0.05461842194199562, 0.05794913321733475, 0.061279844492673874, 0.064610555768013, 0.06794127076864243, 0.07127197831869125, 0.07460269331932068, 0.0779334008693695, 0.08126411586999893, 0.08459483087062836, 0.08792553842067719, 0.09125625342130661, 0.09458696097135544, 0.09791767597198486, 0.10124838352203369, 0.10457909852266312, 0.10790981352329254, 0.11124052107334137, 0.1145712360739708]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 6.0, 8.0, 9.0, 4.0, 14.0, 11.0, 20.0, 14.0, 20.0, 30.0, 17.0, 35.0, 44.0, 30.0, 44.0, 38.0, 41.0, 42.0, 45.0, 49.0, 33.0, 54.0, 51.0, 35.0, 48.0, 31.0, 34.0, 24.0, 32.0, 25.0, 26.0, 16.0, 15.0, 7.0, 7.0, 8.0, 10.0, 4.0, 4.0, 4.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030428409576416016, -0.029482223093509674, -0.028536038473248482, -0.02758985385298729, -0.026643667370080948, -0.025697480887174606, -0.024751296266913414, -0.02380511164665222, -0.02285892516374588, -0.02191273868083954, -0.020966554060578346, -0.020020369440317154, -0.019074182957410812, -0.01812799647450447, -0.01718181185424328, -0.016235627233982086, -0.015289440751075745, -0.014343255199491978, -0.01339706964790821, -0.012450884096324444, -0.011504698544740677, -0.01055851299315691, -0.009612327441573143, -0.008666141889989376, -0.007719956338405609, -0.006773770786821842, -0.005827585235238075, -0.004881399683654308, -0.003935214132070541, -0.0029890285804867744, -0.0020428430289030075, -0.0010966574773192406, -0.00015047192573547363, 0.0007957136258482933, 0.0017418991774320602, 0.002688084729015827, 0.003634270280599594, 0.004580455832183361, 0.005526641383767128, 0.006472826935350895, 0.007419012486934662, 0.008365198038518429, 0.009311383590102196, 0.010257569141685963, 0.01120375469326973, 0.012149940244853497, 0.013096125796437263, 0.01404231134802103, 0.014988496899604797, 0.01593468338251114, 0.01688086800277233, 0.017827052623033524, 0.018773239105939865, 0.019719425588846207, 0.0206656102091074, 0.02161179482936859, 0.022557981312274933, 0.023504167795181274, 0.024450352415442467, 0.02539653703570366, 0.02634272351861, 0.027288910001516342, 0.028235094621777534, 0.029181279242038727, 0.03012746572494507]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 6.0, 9.0, 36.0, 40.0, 68.0, 114.0, 194.0, 500.0, 1393.0, 6338.0, 49204.0, 599982.0, 354515.0, 29983.0, 4280.0, 1060.0, 413.0, 177.0, 82.0, 63.0, 36.0, 19.0, 23.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.032745361328125, -0.03177905082702637, -0.030812740325927734, -0.0298464298248291, -0.02888011932373047, -0.027913808822631836, -0.026947498321533203, -0.02598118782043457, -0.025014877319335938, -0.024048566818237305, -0.023082256317138672, -0.02211594581604004, -0.021149635314941406, -0.020183324813842773, -0.01921701431274414, -0.018250703811645508, -0.017284393310546875, -0.016318082809448242, -0.01535177230834961, -0.014385461807250977, -0.013419151306152344, -0.012452840805053711, -0.011486530303955078, -0.010520219802856445, -0.009553909301757812, -0.00858759880065918, -0.007621288299560547, -0.006654977798461914, -0.005688667297363281, -0.0047223567962646484, -0.0037560462951660156, -0.002789735794067383, -0.00182342529296875, -0.0008571147918701172, 0.00010919570922851562, 0.0010755062103271484, 0.0020418167114257812, 0.003008127212524414, 0.003974437713623047, 0.00494074821472168, 0.0059070587158203125, 0.006873369216918945, 0.007839679718017578, 0.008805990219116211, 0.009772300720214844, 0.010738611221313477, 0.01170492172241211, 0.012671232223510742, 0.013637542724609375, 0.014603853225708008, 0.01557016372680664, 0.016536474227905273, 0.017502784729003906, 0.01846909523010254, 0.019435405731201172, 0.020401716232299805, 0.021368026733398438, 0.02233433723449707, 0.023300647735595703, 0.024266958236694336, 0.02523326873779297, 0.0261995792388916, 0.027165889739990234, 0.028132200241088867, 0.0290985107421875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 9.0, 12.0, 24.0, 31.0, 49.0, 57.0, 76.0, 90.0, 101.0, 109.0, 73.0, 101.0, 71.0, 54.0, 53.0, 33.0, 23.0, 10.0, 10.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00751495361328125, -0.0072422027587890625, -0.006969451904296875, -0.0066967010498046875, -0.0064239501953125, -0.0061511993408203125, -0.005878448486328125, -0.0056056976318359375, -0.00533294677734375, -0.0050601959228515625, -0.004787445068359375, -0.0045146942138671875, -0.004241943359375, -0.0039691925048828125, -0.003696441650390625, -0.0034236907958984375, -0.00315093994140625, -0.0028781890869140625, -0.002605438232421875, -0.0023326873779296875, -0.0020599365234375, -0.0017871856689453125, -0.001514434814453125, -0.0012416839599609375, -0.00096893310546875, -0.0006961822509765625, -0.000423431396484375, -0.0001506805419921875, 0.0001220703125, 0.0003948211669921875, 0.000667572021484375, 0.0009403228759765625, 0.00121307373046875, 0.0014858245849609375, 0.001758575439453125, 0.0020313262939453125, 0.0023040771484375, 0.0025768280029296875, 0.002849578857421875, 0.0031223297119140625, 0.00339508056640625, 0.0036678314208984375, 0.003940582275390625, 0.0042133331298828125, 0.004486083984375, 0.0047588348388671875, 0.005031585693359375, 0.0053043365478515625, 0.00557708740234375, 0.0058498382568359375, 0.006122589111328125, 0.0063953399658203125, 0.0066680908203125, 0.0069408416748046875, 0.007213592529296875, 0.0074863433837890625, 0.00775909423828125, 0.008031845092773438, 0.008304595947265625, 0.008577346801757812, 0.00885009765625, 0.009122848510742188, 0.009395599365234375, 0.009668350219726562, 0.00994110107421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 10.0, 10.0, 15.0, 24.0, 34.0, 75.0, 100.0, 146.0, 309.0, 637.0, 1429.0, 3536.0, 9448.0, 29098.0, 103308.0, 422514.0, 353901.0, 85763.0, 24534.0, 8187.0, 2953.0, 1267.0, 558.0, 267.0, 138.0, 86.0, 73.0, 37.0, 23.0, 18.0, 13.0, 8.0, 10.0, 7.0, 2.0, 6.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.0198822021484375, -0.019384264945983887, -0.018886327743530273, -0.01838839054107666, -0.017890453338623047, -0.017392516136169434, -0.01689457893371582, -0.016396641731262207, -0.015898704528808594, -0.01540076732635498, -0.014902830123901367, -0.014404892921447754, -0.01390695571899414, -0.013409018516540527, -0.012911081314086914, -0.0124131441116333, -0.011915206909179688, -0.011417269706726074, -0.010919332504272461, -0.010421395301818848, -0.009923458099365234, -0.009425520896911621, -0.008927583694458008, -0.008429646492004395, -0.007931709289550781, -0.007433772087097168, -0.006935834884643555, -0.006437897682189941, -0.005939960479736328, -0.005442023277282715, -0.0049440860748291016, -0.004446148872375488, -0.003948211669921875, -0.0034502744674682617, -0.0029523372650146484, -0.002454400062561035, -0.001956462860107422, -0.0014585256576538086, -0.0009605884552001953, -0.00046265125274658203, 3.528594970703125e-05, 0.0005332231521606445, 0.0010311603546142578, 0.001529097557067871, 0.0020270347595214844, 0.0025249719619750977, 0.003022909164428711, 0.0035208463668823242, 0.0040187835693359375, 0.004516720771789551, 0.005014657974243164, 0.005512595176696777, 0.006010532379150391, 0.006508469581604004, 0.007006406784057617, 0.0075043439865112305, 0.008002281188964844, 0.008500218391418457, 0.00899815559387207, 0.009496092796325684, 0.009994029998779297, 0.01049196720123291, 0.010989904403686523, 0.011487841606140137, 0.01198577880859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 5.0, 7.0, 8.0, 6.0, 9.0, 11.0, 10.0, 20.0, 19.0, 10.0, 24.0, 23.0, 25.0, 25.0, 45.0, 43.0, 46.0, 53.0, 37.0, 50.0, 47.0, 54.0, 34.0, 40.0, 32.0, 26.0, 39.0, 33.0, 36.0, 25.0, 23.0, 18.0, 19.0, 18.0, 19.0, 12.0, 9.0, 12.0, 5.0, 4.0, 5.0, 5.0, 4.0, 8.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0120391845703125, -0.011681556701660156, -0.011323928833007812, -0.010966300964355469, -0.010608673095703125, -0.010251045227050781, -0.009893417358398438, -0.009535789489746094, -0.00917816162109375, -0.008820533752441406, -0.008462905883789062, -0.008105278015136719, -0.007747650146484375, -0.007390022277832031, -0.0070323944091796875, -0.006674766540527344, -0.006317138671875, -0.005959510803222656, -0.0056018829345703125, -0.005244255065917969, -0.004886627197265625, -0.004528999328613281, -0.0041713714599609375, -0.0038137435913085938, -0.00345611572265625, -0.0030984878540039062, -0.0027408599853515625, -0.0023832321166992188, -0.002025604248046875, -0.0016679763793945312, -0.0013103485107421875, -0.0009527206420898438, -0.0005950927734375, -0.00023746490478515625, 0.0001201629638671875, 0.00047779083251953125, 0.000835418701171875, 0.0011930465698242188, 0.0015506744384765625, 0.0019083023071289062, 0.00226593017578125, 0.0026235580444335938, 0.0029811859130859375, 0.0033388137817382812, 0.003696441650390625, 0.004054069519042969, 0.0044116973876953125, 0.004769325256347656, 0.005126953125, 0.005484580993652344, 0.0058422088623046875, 0.006199836730957031, 0.006557464599609375, 0.006915092468261719, 0.0072727203369140625, 0.007630348205566406, 0.00798797607421875, 0.008345603942871094, 0.008703231811523438, 0.009060859680175781, 0.009418487548828125, 0.009776115417480469, 0.010133743286132812, 0.010491371154785156, 0.0108489990234375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 7.0, 10.0, 21.0, 35.0, 58.0, 100.0, 213.0, 366.0, 650.0, 1414.0, 3051.0, 7369.0, 22327.0, 122312.0, 653886.0, 190880.0, 29768.0, 8900.0, 3692.0, 1718.0, 817.0, 422.0, 238.0, 115.0, 66.0, 41.0, 28.0, 18.0, 10.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00789642333984375, -0.007686436176300049, -0.007476449012756348, -0.0072664618492126465, -0.007056474685668945, -0.006846487522125244, -0.006636500358581543, -0.006426513195037842, -0.006216526031494141, -0.0060065388679504395, -0.005796551704406738, -0.005586564540863037, -0.005376577377319336, -0.005166590213775635, -0.004956603050231934, -0.004746615886688232, -0.004536628723144531, -0.00432664155960083, -0.004116654396057129, -0.003906667232513428, -0.0036966800689697266, -0.0034866929054260254, -0.0032767057418823242, -0.003066718578338623, -0.002856731414794922, -0.0026467442512512207, -0.0024367570877075195, -0.0022267699241638184, -0.002016782760620117, -0.001806795597076416, -0.0015968084335327148, -0.0013868212699890137, -0.0011768341064453125, -0.0009668469429016113, -0.0007568597793579102, -0.000546872615814209, -0.0003368854522705078, -0.00012689828872680664, 8.308887481689453e-05, 0.0002930760383605957, 0.0005030632019042969, 0.000713050365447998, 0.0009230375289916992, 0.0011330246925354004, 0.0013430118560791016, 0.0015529990196228027, 0.001762986183166504, 0.001972973346710205, 0.0021829605102539062, 0.0023929476737976074, 0.0026029348373413086, 0.0028129220008850098, 0.003022909164428711, 0.003232896327972412, 0.0034428834915161133, 0.0036528706550598145, 0.0038628578186035156, 0.004072844982147217, 0.004282832145690918, 0.004492819309234619, 0.00470280647277832, 0.0049127936363220215, 0.005122780799865723, 0.005332767963409424, 0.005542755126953125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 5.0, 7.0, 10.0, 15.0, 10.0, 23.0, 22.0, 0.0, 35.0, 32.0, 38.0, 48.0, 42.0, 54.0, 60.0, 61.0, 60.0, 59.0, 78.0, 53.0, 0.0, 42.0, 52.0, 36.0, 27.0, 26.0, 22.0, 17.0, 17.0, 10.0, 4.0, 9.0, 6.0, 0.0, 5.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9073486328125e-06, -1.8524006009101868e-06, -1.7974525690078735e-06, -1.7425045371055603e-06, -1.687556505203247e-06, -1.6326084733009338e-06, -1.5776604413986206e-06, -1.5227124094963074e-06, -1.4677643775939941e-06, -1.412816345691681e-06, -1.3578683137893677e-06, -1.3029202818870544e-06, -1.2479722499847412e-06, -1.193024218082428e-06, -1.1380761861801147e-06, -1.0831281542778015e-06, -1.0281801223754883e-06, -9.73232090473175e-07, -9.182840585708618e-07, -8.633360266685486e-07, -8.083879947662354e-07, -7.534399628639221e-07, -6.984919309616089e-07, -6.435438990592957e-07, -5.885958671569824e-07, -5.336478352546692e-07, -4.78699803352356e-07, -4.237517714500427e-07, -3.688037395477295e-07, -3.1385570764541626e-07, -2.5890767574310303e-07, -2.039596438407898e-07, -1.4901161193847656e-07, -9.406358003616333e-08, -3.91155481338501e-08, 1.5832483768463135e-08, 7.078051567077637e-08, 1.257285475730896e-07, 1.8067657947540283e-07, 2.3562461137771606e-07, 2.905726432800293e-07, 3.4552067518234253e-07, 4.0046870708465576e-07, 4.55416738986969e-07, 5.103647708892822e-07, 5.653128027915955e-07, 6.202608346939087e-07, 6.752088665962219e-07, 7.301568984985352e-07, 7.851049304008484e-07, 8.400529623031616e-07, 8.950009942054749e-07, 9.499490261077881e-07, 1.0048970580101013e-06, 1.0598450899124146e-06, 1.1147931218147278e-06, 1.169741153717041e-06, 1.2246891856193542e-06, 1.2796372175216675e-06, 1.3345852494239807e-06, 1.389533281326294e-06, 1.4444813132286072e-06, 1.4994293451309204e-06, 1.5543773770332336e-06, 1.6093254089355469e-06]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 14.0, 9.0, 23.0, 16.0, 32.0, 50.0, 71.0, 123.0, 170.0, 282.0, 399.0, 695.0, 1388.0, 2835.0, 7362.0, 24193.0, 129244.0, 656209.0, 179918.0, 29987.0, 8636.0, 3217.0, 1523.0, 836.0, 495.0, 299.0, 170.0, 116.0, 79.0, 33.0, 34.0, 22.0, 18.0, 10.0, 10.0, 6.0, 4.0, 5.0, 2.0, 1.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.006267547607421875, -0.006055653095245361, -0.005843758583068848, -0.005631864070892334, -0.00541996955871582, -0.005208075046539307, -0.004996180534362793, -0.004784286022186279, -0.004572391510009766, -0.004360496997833252, -0.004148602485656738, -0.003936707973480225, -0.003724813461303711, -0.0035129189491271973, -0.0033010244369506836, -0.00308912992477417, -0.0028772354125976562, -0.0026653409004211426, -0.002453446388244629, -0.0022415518760681152, -0.0020296573638916016, -0.0018177628517150879, -0.0016058683395385742, -0.0013939738273620605, -0.0011820793151855469, -0.0009701848030090332, -0.0007582902908325195, -0.0005463957786560059, -0.0003345012664794922, -0.00012260675430297852, 8.928775787353516e-05, 0.00030118227005004883, 0.0005130767822265625, 0.0007249712944030762, 0.0009368658065795898, 0.0011487603187561035, 0.0013606548309326172, 0.0015725493431091309, 0.0017844438552856445, 0.001996338367462158, 0.002208232879638672, 0.0024201273918151855, 0.0026320219039916992, 0.002843916416168213, 0.0030558109283447266, 0.0032677054405212402, 0.003479599952697754, 0.0036914944648742676, 0.0039033889770507812, 0.004115283489227295, 0.004327178001403809, 0.004539072513580322, 0.004750967025756836, 0.00496286153793335, 0.005174756050109863, 0.005386650562286377, 0.005598545074462891, 0.005810439586639404, 0.006022334098815918, 0.006234228610992432, 0.006446123123168945, 0.006658017635345459, 0.006869912147521973, 0.007081806659698486, 0.007293701171875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 11.0, 11.0, 17.0, 29.0, 38.0, 44.0, 107.0, 154.0, 180.0, 147.0, 101.0, 61.0, 24.0, 17.0, 11.0, 11.0, 13.0, 10.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00771331787109375, -0.00746917724609375, -0.00722503662109375, -0.00698089599609375, -0.00673675537109375, -0.00649261474609375, -0.00624847412109375, -0.00600433349609375, -0.00576019287109375, -0.00551605224609375, -0.00527191162109375, -0.00502777099609375, -0.00478363037109375, -0.00453948974609375, -0.00429534912109375, -0.00405120849609375, -0.00380706787109375, -0.00356292724609375, -0.00331878662109375, -0.00307464599609375, -0.00283050537109375, -0.00258636474609375, -0.00234222412109375, -0.00209808349609375, -0.00185394287109375, -0.00160980224609375, -0.00136566162109375, -0.00112152099609375, -0.00087738037109375, -0.00063323974609375, -0.00038909912109375, -0.00014495849609375, 9.918212890625e-05, 0.00034332275390625, 0.00058746337890625, 0.00083160400390625, 0.00107574462890625, 0.00131988525390625, 0.00156402587890625, 0.00180816650390625, 0.00205230712890625, 0.00229644775390625, 0.00254058837890625, 0.00278472900390625, 0.00302886962890625, 0.00327301025390625, 0.00351715087890625, 0.00376129150390625, 0.00400543212890625, 0.00424957275390625, 0.00449371337890625, 0.00473785400390625, 0.00498199462890625, 0.00522613525390625, 0.00547027587890625, 0.00571441650390625, 0.00595855712890625, 0.00620269775390625, 0.00644683837890625, 0.00669097900390625, 0.00693511962890625, 0.00717926025390625, 0.00742340087890625, 0.00766754150390625, 0.00791168212890625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 27.0, 65.0, 132.0, 219.0, 251.0, 145.0, 86.0, 34.0, 16.0, 14.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05695367977023125, -0.05362071096897125, -0.05028773844242096, -0.046954769641160965, -0.04362180083990097, -0.04028882831335068, -0.03695585951209068, -0.03362289071083069, -0.030289920046925545, -0.0269569493830204, -0.023623980581760406, -0.020291009917855263, -0.01695803925395012, -0.013625070452690125, -0.01029209978878498, -0.006959130987524986, -0.0036261603236198425, -0.00029319035820662975, 0.003039779607206583, 0.0063727498054504395, 0.009705719538033009, 0.013038689270615578, 0.01637165993452072, 0.019704628735780716, 0.02303759939968586, 0.026370570063591003, 0.029703538864850998, 0.03303650766611099, 0.036369480192661285, 0.03970244899392128, 0.043035417795181274, 0.04636839032173157, 0.04970135539770126, 0.05303432419896126, 0.05636729672551155, 0.059700265526771545, 0.06303323805332184, 0.06636620312929153, 0.06969917565584183, 0.07303214073181152, 0.07636511325836182, 0.07969808578491211, 0.0830310508608818, 0.0863640233874321, 0.08969699591398239, 0.09302996098995209, 0.09636293351650238, 0.09969590604305267, 0.10302887856960297, 0.10636185109615326, 0.10969481617212296, 0.11302778869867325, 0.11636076122522354, 0.11969372630119324, 0.12302669882774353, 0.12635967135429382, 0.12969262897968292, 0.13302560150623322, 0.1363585740327835, 0.1396915316581726, 0.1430245041847229, 0.1463574767112732, 0.1496904492378235, 0.15302342176437378, 0.15635639429092407]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 7.0, 5.0, 11.0, 7.0, 3.0, 12.0, 11.0, 18.0, 11.0, 14.0, 18.0, 22.0, 29.0, 25.0, 31.0, 32.0, 33.0, 33.0, 36.0, 33.0, 45.0, 38.0, 38.0, 48.0, 37.0, 36.0, 44.0, 38.0, 34.0, 36.0, 24.0, 32.0, 27.0, 18.0, 20.0, 24.0, 16.0, 16.0, 12.0, 5.0, 5.0, 6.0, 4.0, 3.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03128767013549805, -0.030349910259246826, -0.029412148520350456, -0.028474386781454086, -0.027536626905202866, -0.026598867028951645, -0.025661105290055275, -0.024723343551158905, -0.023785583674907684, -0.022847823798656464, -0.021910062059760094, -0.020972300320863724, -0.020034540444612503, -0.019096780568361282, -0.018159018829464912, -0.017221257090568542, -0.016283497214317322, -0.015345736406743526, -0.014407975599169731, -0.013470214791595936, -0.01253245398402214, -0.011594693176448345, -0.01065693236887455, -0.009719171561300755, -0.00878141075372696, -0.007843649946153164, -0.006905889138579369, -0.005968128331005573, -0.005030367523431778, -0.004092606715857983, -0.0031548459082841873, -0.002217085100710392, -0.0012793242931365967, -0.00034156348556280136, 0.000596197322010994, 0.0015339581295847893, 0.0024717189371585846, 0.00340947974473238, 0.004347240552306175, 0.0052850013598799706, 0.006222762167453766, 0.007160522975027561, 0.008098283782601357, 0.009036044590175152, 0.009973805397748947, 0.010911566205322742, 0.011849327012896538, 0.012787087820470333, 0.013724848628044128, 0.014662609435617924, 0.015600370243191719, 0.01653813198208809, 0.01747589185833931, 0.01841365173459053, 0.0193514134734869, 0.02028917521238327, 0.02122693508863449, 0.02216469496488571, 0.02310245670378208, 0.02404021844267845, 0.024977978318929672, 0.025915738195180893, 0.026853499934077263, 0.027791261672973633, 0.028729021549224854]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 2.0, 3.0, 6.0, 3.0, 10.0, 8.0, 19.0, 21.0, 25.0, 30.0, 44.0, 74.0, 122.0, 199.0, 402.0, 808.0, 2066.0, 6417.0, 26002.0, 181690.0, 3359389.0, 559682.0, 42276.0, 9709.0, 2874.0, 1084.0, 530.0, 286.0, 155.0, 104.0, 66.0, 45.0, 34.0, 21.0, 17.0, 17.0, 6.0, 10.0, 8.0, 6.0, 6.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0159149169921875, -0.015412330627441406, -0.014909744262695312, -0.014407157897949219, -0.013904571533203125, -0.013401985168457031, -0.012899398803710938, -0.012396812438964844, -0.01189422607421875, -0.011391639709472656, -0.010889053344726562, -0.010386466979980469, -0.009883880615234375, -0.009381294250488281, -0.008878707885742188, -0.008376121520996094, -0.00787353515625, -0.007370948791503906, -0.0068683624267578125, -0.006365776062011719, -0.005863189697265625, -0.005360603332519531, -0.0048580169677734375, -0.004355430603027344, -0.00385284423828125, -0.0033502578735351562, -0.0028476715087890625, -0.0023450851440429688, -0.001842498779296875, -0.0013399124145507812, -0.0008373260498046875, -0.00033473968505859375, 0.0001678466796875, 0.0006704330444335938, 0.0011730194091796875, 0.0016756057739257812, 0.002178192138671875, 0.0026807785034179688, 0.0031833648681640625, 0.0036859512329101562, 0.00418853759765625, 0.004691123962402344, 0.0051937103271484375, 0.005696296691894531, 0.006198883056640625, 0.006701469421386719, 0.0072040557861328125, 0.007706642150878906, 0.008209228515625, 0.008711814880371094, 0.009214401245117188, 0.009716987609863281, 0.010219573974609375, 0.010722160339355469, 0.011224746704101562, 0.011727333068847656, 0.01222991943359375, 0.012732505798339844, 0.013235092163085938, 0.013737678527832031, 0.014240264892578125, 0.014742851257324219, 0.015245437622070312, 0.015748023986816406, 0.0162506103515625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 11.0, 19.0, 32.0, 28.0, 49.0, 66.0, 78.0, 94.0, 106.0, 102.0, 97.0, 72.0, 77.0, 50.0, 46.0, 24.0, 18.0, 21.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008026123046875, -0.007742047309875488, -0.0074579715728759766, -0.007173895835876465, -0.006889820098876953, -0.006605744361877441, -0.00632166862487793, -0.006037592887878418, -0.005753517150878906, -0.0054694414138793945, -0.005185365676879883, -0.004901289939880371, -0.004617214202880859, -0.004333138465881348, -0.004049062728881836, -0.0037649869918823242, -0.0034809112548828125, -0.0031968355178833008, -0.002912759780883789, -0.0026286840438842773, -0.0023446083068847656, -0.002060532569885254, -0.0017764568328857422, -0.0014923810958862305, -0.0012083053588867188, -0.000924229621887207, -0.0006401538848876953, -0.0003560781478881836, -7.200241088867188e-05, 0.00021207332611083984, 0.0004961490631103516, 0.0007802248001098633, 0.001064300537109375, 0.0013483762741088867, 0.0016324520111083984, 0.0019165277481079102, 0.002200603485107422, 0.0024846792221069336, 0.0027687549591064453, 0.003052830696105957, 0.0033369064331054688, 0.0036209821701049805, 0.003905057907104492, 0.004189133644104004, 0.004473209381103516, 0.004757285118103027, 0.005041360855102539, 0.005325436592102051, 0.0056095123291015625, 0.005893588066101074, 0.006177663803100586, 0.006461739540100098, 0.006745815277099609, 0.007029891014099121, 0.007313966751098633, 0.0075980424880981445, 0.007882118225097656, 0.008166193962097168, 0.00845026969909668, 0.008734345436096191, 0.009018421173095703, 0.009302496910095215, 0.009586572647094727, 0.009870648384094238, 0.01015472412109375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 2.0, 12.0, 11.0, 10.0, 12.0, 37.0, 46.0, 87.0, 165.0, 254.0, 495.0, 961.0, 1842.0, 4398.0, 10717.0, 30442.0, 103747.0, 571073.0, 2954949.0, 390583.0, 82568.0, 25265.0, 9381.0, 3806.0, 1666.0, 838.0, 367.0, 224.0, 119.0, 60.0, 56.0, 36.0, 8.0, 11.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.01290130615234375, -0.012573957443237305, -0.01224660873413086, -0.011919260025024414, -0.011591911315917969, -0.011264562606811523, -0.010937213897705078, -0.010609865188598633, -0.010282516479492188, -0.009955167770385742, -0.009627819061279297, -0.009300470352172852, -0.008973121643066406, -0.008645772933959961, -0.008318424224853516, -0.00799107551574707, -0.007663726806640625, -0.00733637809753418, -0.007009029388427734, -0.006681680679321289, -0.006354331970214844, -0.0060269832611083984, -0.005699634552001953, -0.005372285842895508, -0.0050449371337890625, -0.004717588424682617, -0.004390239715576172, -0.0040628910064697266, -0.0037355422973632812, -0.003408193588256836, -0.0030808448791503906, -0.0027534961700439453, -0.0024261474609375, -0.0020987987518310547, -0.0017714500427246094, -0.001444101333618164, -0.0011167526245117188, -0.0007894039154052734, -0.0004620552062988281, -0.0001347064971923828, 0.0001926422119140625, 0.0005199909210205078, 0.0008473396301269531, 0.0011746883392333984, 0.0015020370483398438, 0.001829385757446289, 0.0021567344665527344, 0.0024840831756591797, 0.002811431884765625, 0.0031387805938720703, 0.0034661293029785156, 0.003793478012084961, 0.004120826721191406, 0.0044481754302978516, 0.004775524139404297, 0.005102872848510742, 0.0054302215576171875, 0.005757570266723633, 0.006084918975830078, 0.0064122676849365234, 0.006739616394042969, 0.007066965103149414, 0.007394313812255859, 0.007721662521362305, 0.00804901123046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 8.0, 8.0, 6.0, 7.0, 16.0, 17.0, 16.0, 31.0, 33.0, 41.0, 67.0, 72.0, 93.0, 136.0, 191.0, 331.0, 526.0, 652.0, 565.0, 356.0, 238.0, 143.0, 106.0, 80.0, 74.0, 58.0, 37.0, 24.0, 30.0, 21.0, 12.0, 12.0, 14.0, 12.0, 11.0, 7.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.00875091552734375, -0.008504986763000488, -0.008259057998657227, -0.008013129234313965, -0.007767200469970703, -0.007521271705627441, -0.00727534294128418, -0.007029414176940918, -0.006783485412597656, -0.0065375566482543945, -0.006291627883911133, -0.006045699119567871, -0.005799770355224609, -0.005553841590881348, -0.005307912826538086, -0.005061984062194824, -0.0048160552978515625, -0.004570126533508301, -0.004324197769165039, -0.004078269004821777, -0.0038323402404785156, -0.003586411476135254, -0.003340482711791992, -0.0030945539474487305, -0.0028486251831054688, -0.002602696418762207, -0.0023567676544189453, -0.0021108388900756836, -0.0018649101257324219, -0.0016189813613891602, -0.0013730525970458984, -0.0011271238327026367, -0.000881195068359375, -0.0006352663040161133, -0.00038933753967285156, -0.00014340877532958984, 0.00010251998901367188, 0.0003484487533569336, 0.0005943775177001953, 0.000840306282043457, 0.0010862350463867188, 0.0013321638107299805, 0.0015780925750732422, 0.001824021339416504, 0.0020699501037597656, 0.0023158788681030273, 0.002561807632446289, 0.0028077363967895508, 0.0030536651611328125, 0.0032995939254760742, 0.003545522689819336, 0.0037914514541625977, 0.004037380218505859, 0.004283308982849121, 0.004529237747192383, 0.0047751665115356445, 0.005021095275878906, 0.005267024040222168, 0.00551295280456543, 0.005758881568908691, 0.006004810333251953, 0.006250739097595215, 0.0064966678619384766, 0.006742596626281738, 0.006988525390625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 12.0, 14.0, 32.0, 64.0, 111.0, 153.0, 184.0, 164.0, 116.0, 66.0, 27.0, 24.0, 9.0, 8.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11252281814813614, -0.11000123620033264, -0.10747965425252914, -0.10495807230472565, -0.10243649035692215, -0.09991490840911865, -0.09739332646131516, -0.09487174451351166, -0.09235016256570816, -0.08982858061790466, -0.08730699867010117, -0.08478541672229767, -0.08226383477449417, -0.07974225282669067, -0.07722067087888718, -0.07469908893108368, -0.07217749953269958, -0.06965591758489609, -0.06713433563709259, -0.06461275368928909, -0.062091171741485596, -0.0595695897936821, -0.0570480078458786, -0.054526425898075104, -0.052004843950271606, -0.04948326200246811, -0.04696168005466461, -0.044440098106861115, -0.04191851615905762, -0.03939693421125412, -0.03687535226345062, -0.034353770315647125, -0.031832192093133926, -0.02931061014533043, -0.026789028197526932, -0.024267446249723434, -0.021745864301919937, -0.01922428235411644, -0.016702698543667793, -0.014181116595864296, -0.011659534648060799, -0.009137952700257301, -0.006616370286792517, -0.004094787873327732, -0.0015732059255242348, 0.0009483760222792625, 0.0034699589014053345, 0.005991540849208832, 0.008513122797012329, 0.011034704744815826, 0.013556286692619324, 0.01607786864042282, 0.01859945058822632, 0.021121032536029816, 0.023642616346478462, 0.02616419829428196, 0.028685780242085457, 0.031207362189888954, 0.0337289460003376, 0.0362505279481411, 0.038772109895944595, 0.04129369184374809, 0.04381527379155159, 0.04633685573935509, 0.048858437687158585]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 0.0, 4.0, 4.0, 7.0, 7.0, 7.0, 4.0, 12.0, 13.0, 11.0, 15.0, 22.0, 20.0, 33.0, 38.0, 31.0, 37.0, 40.0, 44.0, 46.0, 45.0, 41.0, 42.0, 36.0, 41.0, 37.0, 39.0, 40.0, 31.0, 26.0, 27.0, 20.0, 26.0, 27.0, 29.0, 21.0, 13.0, 14.0, 10.0, 12.0, 8.0, 7.0, 1.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.02799767255783081, -0.0271872840821743, -0.02637689746916294, -0.02556651085615158, -0.02475612238049507, -0.023945733904838562, -0.023135347291827202, -0.02232496067881584, -0.021514572203159332, -0.020704183727502823, -0.019893797114491463, -0.019083410501480103, -0.018273022025823593, -0.017462633550167084, -0.016652246937155724, -0.015841860324144363, -0.015031471848487854, -0.01422108430415392, -0.013410696759819984, -0.01260030921548605, -0.011789921671152115, -0.01097953412681818, -0.010169146582484245, -0.00935875903815031, -0.008548371493816376, -0.007737983949482441, -0.006927596405148506, -0.006117208860814571, -0.005306821316480637, -0.004496433772146702, -0.003686046227812767, -0.0028756586834788322, -0.0020652711391448975, -0.0012548835948109627, -0.0004444960504770279, 0.0003658914938569069, 0.0011762790381908417, 0.0019866665825247765, 0.0027970541268587112, 0.003607441671192646, 0.004417829215526581, 0.005228216759860516, 0.00603860430419445, 0.006848991848528385, 0.00765937939286232, 0.008469766937196255, 0.00928015448153019, 0.010090542025864124, 0.010900929570198059, 0.011711317114531994, 0.012521704658865929, 0.013332092203199863, 0.014142479747533798, 0.014952867291867733, 0.015763254836201668, 0.016573641449213028, 0.017384029924869537, 0.018194418400526047, 0.019004805013537407, 0.019815191626548767, 0.020625580102205276, 0.021435968577861786, 0.022246355190873146, 0.023056741803884506, 0.023867130279541016]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 8.0, 5.0, 8.0, 4.0, 9.0, 18.0, 17.0, 25.0, 37.0, 63.0, 66.0, 107.0, 139.0, 262.0, 390.0, 713.0, 1769.0, 5370.0, 20114.0, 93108.0, 436446.0, 386032.0, 78262.0, 17539.0, 4733.0, 1514.0, 680.0, 395.0, 223.0, 136.0, 94.0, 75.0, 53.0, 40.0, 27.0, 25.0, 9.0, 13.0, 10.0, 9.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0185699462890625, -0.01798868179321289, -0.01740741729736328, -0.016826152801513672, -0.016244888305664062, -0.015663623809814453, -0.015082359313964844, -0.014501094818115234, -0.013919830322265625, -0.013338565826416016, -0.012757301330566406, -0.012176036834716797, -0.011594772338867188, -0.011013507843017578, -0.010432243347167969, -0.00985097885131836, -0.00926971435546875, -0.00868844985961914, -0.008107185363769531, -0.007525920867919922, -0.0069446563720703125, -0.006363391876220703, -0.005782127380371094, -0.005200862884521484, -0.004619598388671875, -0.004038333892822266, -0.0034570693969726562, -0.002875804901123047, -0.0022945404052734375, -0.0017132759094238281, -0.0011320114135742188, -0.0005507469177246094, 3.0517578125e-05, 0.0006117820739746094, 0.0011930465698242188, 0.0017743110656738281, 0.0023555755615234375, 0.002936840057373047, 0.0035181045532226562, 0.004099369049072266, 0.004680633544921875, 0.005261898040771484, 0.005843162536621094, 0.006424427032470703, 0.0070056915283203125, 0.007586956024169922, 0.008168220520019531, 0.00874948501586914, 0.00933074951171875, 0.00991201400756836, 0.010493278503417969, 0.011074542999267578, 0.011655807495117188, 0.012237071990966797, 0.012818336486816406, 0.013399600982666016, 0.013980865478515625, 0.014562129974365234, 0.015143394470214844, 0.015724658966064453, 0.016305923461914062, 0.016887187957763672, 0.01746845245361328, 0.01804971694946289, 0.0186309814453125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 12.0, 19.0, 25.0, 44.0, 55.0, 73.0, 86.0, 105.0, 99.0, 114.0, 104.0, 73.0, 61.0, 47.0, 31.0, 22.0, 16.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00841522216796875, -0.008121967315673828, -0.007828712463378906, -0.007535457611083984, -0.0072422027587890625, -0.006948947906494141, -0.006655693054199219, -0.006362438201904297, -0.006069183349609375, -0.005775928497314453, -0.005482673645019531, -0.005189418792724609, -0.0048961639404296875, -0.004602909088134766, -0.004309654235839844, -0.004016399383544922, -0.00372314453125, -0.003429889678955078, -0.0031366348266601562, -0.0028433799743652344, -0.0025501251220703125, -0.0022568702697753906, -0.0019636154174804688, -0.0016703605651855469, -0.001377105712890625, -0.0010838508605957031, -0.0007905960083007812, -0.0004973411560058594, -0.0002040863037109375, 8.916854858398438e-05, 0.00038242340087890625, 0.0006756782531738281, 0.00096893310546875, 0.0012621879577636719, 0.0015554428100585938, 0.0018486976623535156, 0.0021419525146484375, 0.0024352073669433594, 0.0027284622192382812, 0.003021717071533203, 0.003314971923828125, 0.003608226776123047, 0.0039014816284179688, 0.004194736480712891, 0.0044879913330078125, 0.004781246185302734, 0.005074501037597656, 0.005367755889892578, 0.0056610107421875, 0.005954265594482422, 0.006247520446777344, 0.006540775299072266, 0.0068340301513671875, 0.007127285003662109, 0.007420539855957031, 0.007713794708251953, 0.008007049560546875, 0.008300304412841797, 0.008593559265136719, 0.00888681411743164, 0.009180068969726562, 0.009473323822021484, 0.009766578674316406, 0.010059833526611328, 0.01035308837890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 8.0, 13.0, 14.0, 11.0, 24.0, 32.0, 58.0, 82.0, 144.0, 298.0, 698.0, 1434.0, 3587.0, 9409.0, 26572.0, 79724.0, 247992.0, 409708.0, 179680.0, 57346.0, 19620.0, 6994.0, 2744.0, 1220.0, 537.0, 232.0, 124.0, 84.0, 50.0, 25.0, 18.0, 12.0, 10.0, 14.0, 7.0, 8.0, 5.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01324462890625, -0.012847542762756348, -0.012450456619262695, -0.012053370475769043, -0.01165628433227539, -0.011259198188781738, -0.010862112045288086, -0.010465025901794434, -0.010067939758300781, -0.009670853614807129, -0.009273767471313477, -0.008876681327819824, -0.008479595184326172, -0.00808250904083252, -0.007685422897338867, -0.007288336753845215, -0.0068912506103515625, -0.00649416446685791, -0.006097078323364258, -0.0056999921798706055, -0.005302906036376953, -0.004905819892883301, -0.0045087337493896484, -0.004111647605895996, -0.0037145614624023438, -0.0033174753189086914, -0.002920389175415039, -0.0025233030319213867, -0.0021262168884277344, -0.001729130744934082, -0.0013320446014404297, -0.0009349584579467773, -0.000537872314453125, -0.00014078617095947266, 0.0002562999725341797, 0.000653386116027832, 0.0010504722595214844, 0.0014475584030151367, 0.001844644546508789, 0.0022417306900024414, 0.0026388168334960938, 0.003035902976989746, 0.0034329891204833984, 0.0038300752639770508, 0.004227161407470703, 0.0046242475509643555, 0.005021333694458008, 0.00541841983795166, 0.0058155059814453125, 0.006212592124938965, 0.006609678268432617, 0.0070067644119262695, 0.007403850555419922, 0.007800936698913574, 0.008198022842407227, 0.008595108985900879, 0.008992195129394531, 0.009389281272888184, 0.009786367416381836, 0.010183453559875488, 0.01058053970336914, 0.010977625846862793, 0.011374711990356445, 0.011771798133850098, 0.01216888427734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 3.0, 8.0, 23.0, 16.0, 20.0, 21.0, 23.0, 15.0, 29.0, 36.0, 38.0, 36.0, 44.0, 38.0, 41.0, 55.0, 46.0, 41.0, 42.0, 45.0, 40.0, 37.0, 31.0, 25.0, 39.0, 36.0, 25.0, 17.0, 16.0, 24.0, 16.0, 8.0, 11.0, 12.0, 8.0, 6.0, 4.0, 2.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0112457275390625, -0.010895967483520508, -0.010546207427978516, -0.010196447372436523, -0.009846687316894531, -0.009496927261352539, -0.009147167205810547, -0.008797407150268555, -0.008447647094726562, -0.00809788703918457, -0.007748126983642578, -0.007398366928100586, -0.007048606872558594, -0.0066988468170166016, -0.006349086761474609, -0.005999326705932617, -0.005649566650390625, -0.005299806594848633, -0.004950046539306641, -0.0046002864837646484, -0.004250526428222656, -0.003900766372680664, -0.003551006317138672, -0.0032012462615966797, -0.0028514862060546875, -0.0025017261505126953, -0.002151966094970703, -0.001802206039428711, -0.0014524459838867188, -0.0011026859283447266, -0.0007529258728027344, -0.0004031658172607422, -5.340576171875e-05, 0.0002963542938232422, 0.0006461143493652344, 0.0009958744049072266, 0.0013456344604492188, 0.001695394515991211, 0.002045154571533203, 0.0023949146270751953, 0.0027446746826171875, 0.0030944347381591797, 0.003444194793701172, 0.003793954849243164, 0.004143714904785156, 0.0044934749603271484, 0.004843235015869141, 0.005192995071411133, 0.005542755126953125, 0.005892515182495117, 0.006242275238037109, 0.0065920352935791016, 0.006941795349121094, 0.007291555404663086, 0.007641315460205078, 0.00799107551574707, 0.008340835571289062, 0.008690595626831055, 0.009040355682373047, 0.009390115737915039, 0.009739875793457031, 0.010089635848999023, 0.010439395904541016, 0.010789155960083008, 0.011138916015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 9.0, 9.0, 20.0, 20.0, 31.0, 50.0, 84.0, 129.0, 197.0, 403.0, 829.0, 1731.0, 4153.0, 11129.0, 33171.0, 122405.0, 397925.0, 339554.0, 94443.0, 26596.0, 8979.0, 3584.0, 1523.0, 679.0, 341.0, 200.0, 119.0, 76.0, 50.0, 25.0, 21.0, 19.0, 13.0, 11.0, 11.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.00588226318359375, -0.005734860897064209, -0.005587458610534668, -0.005440056324005127, -0.005292654037475586, -0.005145251750946045, -0.004997849464416504, -0.004850447177886963, -0.004703044891357422, -0.004555642604827881, -0.00440824031829834, -0.004260838031768799, -0.004113435745239258, -0.003966033458709717, -0.0038186311721801758, -0.0036712288856506348, -0.0035238265991210938, -0.0033764243125915527, -0.0032290220260620117, -0.0030816197395324707, -0.0029342174530029297, -0.0027868151664733887, -0.0026394128799438477, -0.0024920105934143066, -0.0023446083068847656, -0.0021972060203552246, -0.0020498037338256836, -0.0019024014472961426, -0.0017549991607666016, -0.0016075968742370605, -0.0014601945877075195, -0.0013127923011779785, -0.0011653900146484375, -0.0010179877281188965, -0.0008705854415893555, -0.0007231831550598145, -0.0005757808685302734, -0.0004283785820007324, -0.0002809762954711914, -0.0001335740089416504, 1.3828277587890625e-05, 0.00016123056411743164, 0.00030863285064697266, 0.00045603513717651367, 0.0006034374237060547, 0.0007508397102355957, 0.0008982419967651367, 0.0010456442832946777, 0.0011930465698242188, 0.0013404488563537598, 0.0014878511428833008, 0.0016352534294128418, 0.0017826557159423828, 0.0019300580024719238, 0.002077460289001465, 0.002224862575531006, 0.002372264862060547, 0.002519667148590088, 0.002667069435119629, 0.00281447172164917, 0.002961874008178711, 0.003109276294708252, 0.003256678581237793, 0.003404080867767334, 0.003551483154296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 13.0, 0.0, 12.0, 17.0, 15.0, 0.0, 32.0, 24.0, 0.0, 49.0, 41.0, 33.0, 0.0, 42.0, 48.0, 46.0, 0.0, 81.0, 54.0, 75.0, 0.0, 57.0, 51.0, 0.0, 55.0, 57.0, 34.0, 0.0, 43.0, 28.0, 24.0, 0.0, 20.0, 18.0, 12.0, 0.0, 6.0, 5.0, 0.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2079253792762756e-06, -1.1641532182693481e-06, -1.1203810572624207e-06, -1.0766088962554932e-06, -1.0328367352485657e-06, -9.890645742416382e-07, -9.452924132347107e-07, -9.015202522277832e-07, -8.577480912208557e-07, -8.139759302139282e-07, -7.702037692070007e-07, -7.264316082000732e-07, -6.826594471931458e-07, -6.388872861862183e-07, -5.951151251792908e-07, -5.513429641723633e-07, -5.075708031654358e-07, -4.637986421585083e-07, -4.200264811515808e-07, -3.762543201446533e-07, -3.3248215913772583e-07, -2.8870999813079834e-07, -2.4493783712387085e-07, -2.0116567611694336e-07, -1.5739351511001587e-07, -1.1362135410308838e-07, -6.984919309616089e-08, -2.60770320892334e-08, 1.7695128917694092e-08, 6.146728992462158e-08, 1.0523945093154907e-07, 1.4901161193847656e-07, 1.9278377294540405e-07, 2.3655593395233154e-07, 2.8032809495925903e-07, 3.241002559661865e-07, 3.67872416973114e-07, 4.116445779800415e-07, 4.55416738986969e-07, 4.991888999938965e-07, 5.42961061000824e-07, 5.867332220077515e-07, 6.30505383014679e-07, 6.742775440216064e-07, 7.180497050285339e-07, 7.618218660354614e-07, 8.055940270423889e-07, 8.493661880493164e-07, 8.931383490562439e-07, 9.369105100631714e-07, 9.806826710700989e-07, 1.0244548320770264e-06, 1.0682269930839539e-06, 1.1119991540908813e-06, 1.1557713150978088e-06, 1.1995434761047363e-06, 1.2433156371116638e-06, 1.2870877981185913e-06, 1.3308599591255188e-06, 1.3746321201324463e-06, 1.4184042811393738e-06, 1.4621764421463013e-06, 1.5059486031532288e-06, 1.5497207641601562e-06]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 12.0, 17.0, 20.0, 48.0, 84.0, 149.0, 244.0, 454.0, 974.0, 2291.0, 5780.0, 16753.0, 59111.0, 260952.0, 487572.0, 157713.0, 37613.0, 11405.0, 4081.0, 1691.0, 713.0, 388.0, 200.0, 108.0, 70.0, 33.0, 29.0, 9.0, 8.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005687713623046875, -0.005517065525054932, -0.005346417427062988, -0.005175769329071045, -0.0050051212310791016, -0.004834473133087158, -0.004663825035095215, -0.0044931769371032715, -0.004322528839111328, -0.004151880741119385, -0.003981232643127441, -0.003810584545135498, -0.0036399364471435547, -0.0034692883491516113, -0.003298640251159668, -0.0031279921531677246, -0.0029573440551757812, -0.002786695957183838, -0.0026160478591918945, -0.002445399761199951, -0.002274751663208008, -0.0021041035652160645, -0.001933455467224121, -0.0017628073692321777, -0.0015921592712402344, -0.001421511173248291, -0.0012508630752563477, -0.0010802149772644043, -0.0009095668792724609, -0.0007389187812805176, -0.0005682706832885742, -0.00039762258529663086, -0.0002269744873046875, -5.632638931274414e-05, 0.00011432170867919922, 0.0002849698066711426, 0.00045561790466308594, 0.0006262660026550293, 0.0007969141006469727, 0.000967562198638916, 0.0011382102966308594, 0.0013088583946228027, 0.001479506492614746, 0.0016501545906066895, 0.0018208026885986328, 0.001991450786590576, 0.0021620988845825195, 0.002332746982574463, 0.0025033950805664062, 0.0026740431785583496, 0.002844691276550293, 0.0030153393745422363, 0.0031859874725341797, 0.003356635570526123, 0.0035272836685180664, 0.0036979317665100098, 0.003868579864501953, 0.0040392279624938965, 0.00420987606048584, 0.004380524158477783, 0.0045511722564697266, 0.00472182035446167, 0.004892468452453613, 0.005063116550445557, 0.0052337646484375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 10.0, 13.0, 12.0, 6.0, 8.0, 17.0, 33.0, 35.0, 43.0, 52.0, 41.0, 68.0, 64.0, 80.0, 71.0, 73.0, 70.0, 59.0, 47.0, 49.0, 34.0, 30.0, 14.0, 13.0, 9.0, 8.0, 5.0, 5.0, 6.0, 5.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029201507568359375, -0.0028125345706939697, -0.002704918384552002, -0.002597302198410034, -0.0024896860122680664, -0.0023820698261260986, -0.002274453639984131, -0.002166837453842163, -0.0020592212677001953, -0.0019516050815582275, -0.0018439888954162598, -0.001736372709274292, -0.0016287565231323242, -0.0015211403369903564, -0.0014135241508483887, -0.001305907964706421, -0.0011982917785644531, -0.0010906755924224854, -0.0009830594062805176, -0.0008754432201385498, -0.000767827033996582, -0.0006602108478546143, -0.0005525946617126465, -0.0004449784755706787, -0.00033736228942871094, -0.00022974610328674316, -0.0001221299171447754, -1.4513731002807617e-05, 9.310245513916016e-05, 0.00020071864128112793, 0.0003083348274230957, 0.0004159510135650635, 0.0005235671997070312, 0.000631183385848999, 0.0007387995719909668, 0.0008464157581329346, 0.0009540319442749023, 0.0010616481304168701, 0.0011692643165588379, 0.0012768805027008057, 0.0013844966888427734, 0.0014921128749847412, 0.001599729061126709, 0.0017073452472686768, 0.0018149614334106445, 0.0019225776195526123, 0.00203019380569458, 0.002137809991836548, 0.0022454261779785156, 0.0023530423641204834, 0.002460658550262451, 0.002568274736404419, 0.0026758909225463867, 0.0027835071086883545, 0.0028911232948303223, 0.00299873948097229, 0.003106355667114258, 0.0032139718532562256, 0.0033215880393981934, 0.003429204225540161, 0.003536820411682129, 0.0036444365978240967, 0.0037520527839660645, 0.0038596689701080322, 0.00396728515625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 11.0, 28.0, 64.0, 146.0, 272.0, 267.0, 136.0, 54.0, 13.0, 10.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1053183525800705, -0.10201152414083481, -0.09870469570159912, -0.09539787471294403, -0.09209104627370834, -0.08878421783447266, -0.08547738939523697, -0.08217056095600128, -0.07886373996734619, -0.0755569115281105, -0.07225008308887482, -0.06894326210021973, -0.06563643366098404, -0.06232960522174835, -0.059022776782512665, -0.05571594834327698, -0.05240911990404129, -0.0491022914648056, -0.045795466750860214, -0.04248863831162453, -0.03918181359767914, -0.03587498515844345, -0.032568156719207764, -0.029261330142617226, -0.025954503566026688, -0.02264767698943615, -0.01934085041284561, -0.016034021973609924, -0.012727195397019386, -0.009420368820428848, -0.006113540381193161, -0.002806713804602623, 0.0005001053214073181, 0.0038069323636591434, 0.007113759405910969, 0.010420586913824081, 0.01372741349041462, 0.017034240067005157, 0.020341068506240845, 0.023647895082831383, 0.02695472165942192, 0.03026154823601246, 0.033568374812603, 0.036875203251838684, 0.04018203169107437, 0.04348885640501976, 0.04679568484425545, 0.050102509558200836, 0.05340933799743652, 0.05671616643667221, 0.0600229911506176, 0.06332981586456299, 0.06663664430379868, 0.06994347274303436, 0.07325030118227005, 0.07655712962150574, 0.07986395061016083, 0.08317077904939651, 0.0864776074886322, 0.08978442847728729, 0.09309125691652298, 0.09639808535575867, 0.09970491379499435, 0.10301174223423004, 0.10631857067346573]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 7.0, 8.0, 6.0, 6.0, 15.0, 7.0, 19.0, 20.0, 12.0, 35.0, 21.0, 29.0, 30.0, 35.0, 30.0, 34.0, 40.0, 44.0, 41.0, 36.0, 44.0, 37.0, 32.0, 38.0, 40.0, 30.0, 42.0, 24.0, 28.0, 36.0, 26.0, 26.0, 21.0, 19.0, 19.0, 10.0, 8.0, 11.0, 6.0, 11.0, 4.0, 3.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.030152440071105957, -0.029292479157447815, -0.028432518243789673, -0.02757255733013153, -0.02671259641647339, -0.025852635502815247, -0.024992674589157104, -0.024132713675498962, -0.02327275276184082, -0.022412791848182678, -0.021552830934524536, -0.020692870020866394, -0.019832909107208252, -0.01897294819355011, -0.018112987279891968, -0.017253026366233826, -0.016393065452575684, -0.015533104538917542, -0.0146731436252594, -0.013813182711601257, -0.012953221797943115, -0.012093260884284973, -0.011233299970626831, -0.010373339056968689, -0.009513378143310547, -0.008653417229652405, -0.007793456315994263, -0.006933495402336121, -0.0060735344886779785, -0.005213573575019836, -0.004353612661361694, -0.0034936517477035522, -0.00263369083404541, -0.001773729920387268, -0.000913769006729126, -5.380809307098389e-05, 0.0008061528205871582, 0.0016661137342453003, 0.0025260746479034424, 0.0033860355615615845, 0.0042459964752197266, 0.005105957388877869, 0.005965918302536011, 0.006825879216194153, 0.007685840129852295, 0.008545801043510437, 0.009405761957168579, 0.010265722870826721, 0.011125683784484863, 0.011985644698143005, 0.012845605611801147, 0.01370556652545929, 0.014565527439117432, 0.015425488352775574, 0.016285449266433716, 0.017145410180091858, 0.01800537109375, 0.018865332007408142, 0.019725292921066284, 0.020585253834724426, 0.02144521474838257, 0.02230517566204071, 0.023165136575698853, 0.024025097489356995, 0.024885058403015137]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 7.0, 2.0, 6.0, 4.0, 5.0, 10.0, 20.0, 26.0, 29.0, 63.0, 86.0, 162.0, 349.0, 743.0, 1865.0, 6327.0, 26652.0, 239053.0, 3529339.0, 348176.0, 30719.0, 6887.0, 2101.0, 791.0, 405.0, 182.0, 97.0, 55.0, 36.0, 27.0, 23.0, 12.0, 3.0, 4.0, 5.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0159759521484375, -0.015469551086425781, -0.014963150024414062, -0.014456748962402344, -0.013950347900390625, -0.013443946838378906, -0.012937545776367188, -0.012431144714355469, -0.01192474365234375, -0.011418342590332031, -0.010911941528320312, -0.010405540466308594, -0.009899139404296875, -0.009392738342285156, -0.008886337280273438, -0.008379936218261719, -0.00787353515625, -0.007367134094238281, -0.0068607330322265625, -0.006354331970214844, -0.005847930908203125, -0.005341529846191406, -0.0048351287841796875, -0.004328727722167969, -0.00382232666015625, -0.0033159255981445312, -0.0028095245361328125, -0.0023031234741210938, -0.001796722412109375, -0.0012903213500976562, -0.0007839202880859375, -0.00027751922607421875, 0.0002288818359375, 0.0007352828979492188, 0.0012416839599609375, 0.0017480850219726562, 0.002254486083984375, 0.0027608871459960938, 0.0032672882080078125, 0.0037736892700195312, 0.00428009033203125, 0.004786491394042969, 0.0052928924560546875, 0.005799293518066406, 0.006305694580078125, 0.006812095642089844, 0.0073184967041015625, 0.007824897766113281, 0.008331298828125, 0.008837699890136719, 0.009344100952148438, 0.009850502014160156, 0.010356903076171875, 0.010863304138183594, 0.011369705200195312, 0.011876106262207031, 0.01238250732421875, 0.012888908386230469, 0.013395309448242188, 0.013901710510253906, 0.014408111572265625, 0.014914512634277344, 0.015420913696289062, 0.01592731475830078, 0.0164337158203125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 7.0, 19.0, 13.0, 25.0, 41.0, 55.0, 70.0, 82.0, 89.0, 104.0, 97.0, 84.0, 97.0, 60.0, 56.0, 44.0, 17.0, 21.0, 8.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0085906982421875, -0.008302807807922363, -0.008014917373657227, -0.00772702693939209, -0.007439136505126953, -0.007151246070861816, -0.00686335563659668, -0.006575465202331543, -0.006287574768066406, -0.0059996843338012695, -0.005711793899536133, -0.005423903465270996, -0.005136013031005859, -0.004848122596740723, -0.004560232162475586, -0.004272341728210449, -0.0039844512939453125, -0.0036965608596801758, -0.003408670425415039, -0.0031207799911499023, -0.0028328895568847656, -0.002544999122619629, -0.002257108688354492, -0.0019692182540893555, -0.0016813278198242188, -0.001393437385559082, -0.0011055469512939453, -0.0008176565170288086, -0.0005297660827636719, -0.00024187564849853516, 4.601478576660156e-05, 0.0003339052200317383, 0.000621795654296875, 0.0009096860885620117, 0.0011975765228271484, 0.0014854669570922852, 0.0017733573913574219, 0.0020612478256225586, 0.0023491382598876953, 0.002637028694152832, 0.0029249191284179688, 0.0032128095626831055, 0.003500699996948242, 0.003788590431213379, 0.004076480865478516, 0.004364371299743652, 0.004652261734008789, 0.004940152168273926, 0.0052280426025390625, 0.005515933036804199, 0.005803823471069336, 0.006091713905334473, 0.006379604339599609, 0.006667494773864746, 0.006955385208129883, 0.0072432756423950195, 0.007531166076660156, 0.007819056510925293, 0.00810694694519043, 0.008394837379455566, 0.008682727813720703, 0.00897061824798584, 0.009258508682250977, 0.009546399116516113, 0.00983428955078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 5.0, 13.0, 24.0, 19.0, 26.0, 37.0, 68.0, 107.0, 134.0, 240.0, 393.0, 662.0, 1282.0, 2773.0, 6284.0, 16729.0, 55310.0, 265138.0, 2883216.0, 805954.0, 109074.0, 28686.0, 10065.0, 3871.0, 1871.0, 942.0, 498.0, 292.0, 176.0, 129.0, 76.0, 57.0, 33.0, 22.0, 22.0, 12.0, 6.0, 12.0, 6.0, 7.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0095367431640625, -0.009204864501953125, -0.00887298583984375, -0.008541107177734375, -0.008209228515625, -0.007877349853515625, -0.00754547119140625, -0.007213592529296875, -0.0068817138671875, -0.006549835205078125, -0.00621795654296875, -0.005886077880859375, -0.00555419921875, -0.005222320556640625, -0.00489044189453125, -0.004558563232421875, -0.0042266845703125, -0.003894805908203125, -0.00356292724609375, -0.003231048583984375, -0.002899169921875, -0.002567291259765625, -0.00223541259765625, -0.001903533935546875, -0.0015716552734375, -0.001239776611328125, -0.00090789794921875, -0.000576019287109375, -0.000244140625, 8.7738037109375e-05, 0.00041961669921875, 0.000751495361328125, 0.0010833740234375, 0.001415252685546875, 0.00174713134765625, 0.002079010009765625, 0.002410888671875, 0.002742767333984375, 0.00307464599609375, 0.003406524658203125, 0.0037384033203125, 0.004070281982421875, 0.00440216064453125, 0.004734039306640625, 0.00506591796875, 0.005397796630859375, 0.00572967529296875, 0.006061553955078125, 0.0063934326171875, 0.006725311279296875, 0.00705718994140625, 0.007389068603515625, 0.007720947265625, 0.008052825927734375, 0.00838470458984375, 0.008716583251953125, 0.0090484619140625, 0.009380340576171875, 0.00971221923828125, 0.010044097900390625, 0.0103759765625, 0.010707855224609375, 0.01103973388671875, 0.011371612548828125, 0.0117034912109375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 6.0, 13.0, 16.0, 16.0, 21.0, 33.0, 36.0, 59.0, 101.0, 127.0, 237.0, 467.0, 819.0, 845.0, 510.0, 265.0, 140.0, 98.0, 75.0, 42.0, 33.0, 25.0, 16.0, 15.0, 11.0, 18.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00862884521484375, -0.008309602737426758, -0.007990360260009766, -0.0076711177825927734, -0.007351875305175781, -0.007032632827758789, -0.006713390350341797, -0.006394147872924805, -0.0060749053955078125, -0.00575566291809082, -0.005436420440673828, -0.005117177963256836, -0.004797935485839844, -0.0044786930084228516, -0.004159450531005859, -0.003840208053588867, -0.003520965576171875, -0.003201723098754883, -0.0028824806213378906, -0.0025632381439208984, -0.0022439956665039062, -0.001924753189086914, -0.0016055107116699219, -0.0012862682342529297, -0.0009670257568359375, -0.0006477832794189453, -0.0003285408020019531, -9.298324584960938e-06, 0.00030994415283203125, 0.0006291866302490234, 0.0009484291076660156, 0.0012676715850830078, 0.0015869140625, 0.0019061565399169922, 0.0022253990173339844, 0.0025446414947509766, 0.0028638839721679688, 0.003183126449584961, 0.003502368927001953, 0.0038216114044189453, 0.0041408538818359375, 0.00446009635925293, 0.004779338836669922, 0.005098581314086914, 0.005417823791503906, 0.0057370662689208984, 0.006056308746337891, 0.006375551223754883, 0.006694793701171875, 0.007014036178588867, 0.007333278656005859, 0.0076525211334228516, 0.007971763610839844, 0.008291006088256836, 0.008610248565673828, 0.00892949104309082, 0.009248733520507812, 0.009567975997924805, 0.009887218475341797, 0.010206460952758789, 0.010525703430175781, 0.010844945907592773, 0.011164188385009766, 0.011483430862426758, 0.01180267333984375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 22.0, 69.0, 166.0, 263.0, 281.0, 123.0, 48.0, 16.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10016127675771713, -0.09642171859741211, -0.09268216788768768, -0.08894260972738266, -0.08520305156707764, -0.08146350085735321, -0.07772394269704819, -0.07398438453674316, -0.07024483382701874, -0.06650527566671371, -0.06276572495698929, -0.059026166796684265, -0.05528660863637924, -0.05154705420136452, -0.04780749976634979, -0.04406794160604477, -0.040328383445739746, -0.03658882901072502, -0.03284927085042, -0.029109716415405273, -0.0253701601177454, -0.021630603820085526, -0.0178910493850708, -0.014151493087410927, -0.010411936789751053, -0.006672380957752466, -0.0029328251257538795, 0.0008067302405834198, 0.004546286538243294, 0.008285842835903168, 0.012025397270917892, 0.015764953568577766, 0.019504502415657043, 0.023244058713316917, 0.02698361501097679, 0.030723169445991516, 0.03446272760629654, 0.038202282041311264, 0.04194183647632599, 0.04568139463663101, 0.04942094907164574, 0.05316050350666046, 0.056900061666965485, 0.06063961610198021, 0.06437917053699493, 0.06811872869729996, 0.07185828685760498, 0.0755978375673294, 0.07933739572763443, 0.08307695388793945, 0.08681650459766388, 0.0905560627579689, 0.09429562091827393, 0.09803517162799835, 0.10177472978830338, 0.1055142879486084, 0.10925383865833282, 0.11299339681863785, 0.11673294752836227, 0.1204725056886673, 0.12421206384897232, 0.12795162200927734, 0.13169117271900177, 0.1354307234287262, 0.13917028903961182]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 1.0, 8.0, 8.0, 9.0, 21.0, 17.0, 25.0, 28.0, 24.0, 37.0, 33.0, 33.0, 43.0, 33.0, 45.0, 51.0, 50.0, 35.0, 40.0, 39.0, 43.0, 33.0, 44.0, 34.0, 35.0, 37.0, 24.0, 35.0, 28.0, 21.0, 17.0, 11.0, 14.0, 10.0, 5.0, 5.0, 6.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.025185585021972656, -0.024384506046772003, -0.0235834289342165, -0.022782351821660995, -0.021981272846460342, -0.02118019387125969, -0.020379116758704185, -0.01957803964614868, -0.01877696067094803, -0.017975881695747375, -0.01717480458319187, -0.016373727470636368, -0.015572648495435715, -0.014771570451557636, -0.013970492407679558, -0.01316941436380148, -0.012368336319923401, -0.011567258276045322, -0.010766180232167244, -0.009965102188289165, -0.009164024144411087, -0.008362946100533009, -0.00756186805665493, -0.006760790012776852, -0.005959711968898773, -0.005158633925020695, -0.004357555881142616, -0.003556477837264538, -0.0027553997933864594, -0.001954321749508381, -0.0011532437056303024, -0.00035216566175222397, 0.0004489123821258545, 0.001249990426003933, 0.0020510684698820114, 0.00285214651376009, 0.0036532245576381683, 0.004454302601516247, 0.005255380645394325, 0.006056458689272404, 0.006857536733150482, 0.007658614777028561, 0.008459692820906639, 0.009260770864784718, 0.010061848908662796, 0.010862926952540874, 0.011664004996418953, 0.012465083040297031, 0.01326616108417511, 0.014067239128053188, 0.014868317171931267, 0.01566939428448677, 0.016470473259687424, 0.017271552234888077, 0.01807262934744358, 0.018873706459999084, 0.019674785435199738, 0.02047586441040039, 0.021276941522955894, 0.0220780186355114, 0.02287909761071205, 0.023680176585912704, 0.02448125369846821, 0.025282330811023712, 0.026083409786224365]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 10.0, 15.0, 24.0, 20.0, 43.0, 79.0, 116.0, 206.0, 396.0, 832.0, 2525.0, 10164.0, 55905.0, 390744.0, 495597.0, 73749.0, 13157.0, 3028.0, 943.0, 436.0, 221.0, 140.0, 76.0, 42.0, 31.0, 10.0, 18.0, 9.0, 8.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0321044921875, -0.031238555908203125, -0.03037261962890625, -0.029506683349609375, -0.0286407470703125, -0.027774810791015625, -0.02690887451171875, -0.026042938232421875, -0.025177001953125, -0.024311065673828125, -0.02344512939453125, -0.022579193115234375, -0.0217132568359375, -0.020847320556640625, -0.01998138427734375, -0.019115447998046875, -0.01824951171875, -0.017383575439453125, -0.01651763916015625, -0.015651702880859375, -0.0147857666015625, -0.013919830322265625, -0.01305389404296875, -0.012187957763671875, -0.011322021484375, -0.010456085205078125, -0.00959014892578125, -0.008724212646484375, -0.0078582763671875, -0.006992340087890625, -0.00612640380859375, -0.005260467529296875, -0.00439453125, -0.003528594970703125, -0.00266265869140625, -0.001796722412109375, -0.0009307861328125, -6.4849853515625e-05, 0.00080108642578125, 0.001667022705078125, 0.002532958984375, 0.003398895263671875, 0.00426483154296875, 0.005130767822265625, 0.0059967041015625, 0.006862640380859375, 0.00772857666015625, 0.008594512939453125, 0.00946044921875, 0.010326385498046875, 0.01119232177734375, 0.012058258056640625, 0.0129241943359375, 0.013790130615234375, 0.01465606689453125, 0.015522003173828125, 0.016387939453125, 0.017253875732421875, 0.01811981201171875, 0.018985748291015625, 0.0198516845703125, 0.020717620849609375, 0.02158355712890625, 0.022449493408203125, 0.0233154296875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 3.0, 13.0, 18.0, 17.0, 23.0, 50.0, 58.0, 58.0, 92.0, 92.0, 88.0, 104.0, 86.0, 77.0, 65.0, 68.0, 32.0, 26.0, 18.0, 6.0, 4.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00846099853515625, -0.00816655158996582, -0.00787210464477539, -0.007577657699584961, -0.007283210754394531, -0.0069887638092041016, -0.006694316864013672, -0.006399869918823242, -0.0061054229736328125, -0.005810976028442383, -0.005516529083251953, -0.0052220821380615234, -0.004927635192871094, -0.004633188247680664, -0.004338741302490234, -0.004044294357299805, -0.003749847412109375, -0.0034554004669189453, -0.0031609535217285156, -0.002866506576538086, -0.0025720596313476562, -0.0022776126861572266, -0.001983165740966797, -0.0016887187957763672, -0.0013942718505859375, -0.0010998249053955078, -0.0008053779602050781, -0.0005109310150146484, -0.00021648406982421875, 7.796287536621094e-05, 0.0003724098205566406, 0.0006668567657470703, 0.0009613037109375, 0.0012557506561279297, 0.0015501976013183594, 0.001844644546508789, 0.0021390914916992188, 0.0024335384368896484, 0.002727985382080078, 0.003022432327270508, 0.0033168792724609375, 0.003611326217651367, 0.003905773162841797, 0.0042002201080322266, 0.004494667053222656, 0.004789113998413086, 0.005083560943603516, 0.005378007888793945, 0.005672454833984375, 0.005966901779174805, 0.006261348724365234, 0.006555795669555664, 0.006850242614746094, 0.0071446895599365234, 0.007439136505126953, 0.007733583450317383, 0.008028030395507812, 0.008322477340698242, 0.008616924285888672, 0.008911371231079102, 0.009205818176269531, 0.009500265121459961, 0.00979471206665039, 0.01008915901184082, 0.01038360595703125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0, 7.0, 3.0, 5.0, 5.0, 13.0, 20.0, 15.0, 37.0, 56.0, 99.0, 190.0, 386.0, 905.0, 2011.0, 5314.0, 15009.0, 48726.0, 191596.0, 529386.0, 184287.0, 47043.0, 14589.0, 5202.0, 1995.0, 848.0, 356.0, 184.0, 92.0, 63.0, 31.0, 19.0, 23.0, 9.0, 3.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01458740234375, -0.01403665542602539, -0.013485908508300781, -0.012935161590576172, -0.012384414672851562, -0.011833667755126953, -0.011282920837402344, -0.010732173919677734, -0.010181427001953125, -0.009630680084228516, -0.009079933166503906, -0.008529186248779297, -0.007978439331054688, -0.007427692413330078, -0.006876945495605469, -0.006326198577880859, -0.00577545166015625, -0.005224704742431641, -0.004673957824707031, -0.004123210906982422, -0.0035724639892578125, -0.003021717071533203, -0.0024709701538085938, -0.0019202232360839844, -0.001369476318359375, -0.0008187294006347656, -0.00026798248291015625, 0.0002827644348144531, 0.0008335113525390625, 0.0013842582702636719, 0.0019350051879882812, 0.0024857521057128906, 0.0030364990234375, 0.0035872459411621094, 0.004137992858886719, 0.004688739776611328, 0.0052394866943359375, 0.005790233612060547, 0.006340980529785156, 0.006891727447509766, 0.007442474365234375, 0.007993221282958984, 0.008543968200683594, 0.009094715118408203, 0.009645462036132812, 0.010196208953857422, 0.010746955871582031, 0.01129770278930664, 0.01184844970703125, 0.01239919662475586, 0.012949943542480469, 0.013500690460205078, 0.014051437377929688, 0.014602184295654297, 0.015152931213378906, 0.015703678131103516, 0.016254425048828125, 0.016805171966552734, 0.017355918884277344, 0.017906665802001953, 0.018457412719726562, 0.019008159637451172, 0.01955890655517578, 0.02010965347290039, 0.020660400390625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 5.0, 7.0, 7.0, 7.0, 14.0, 12.0, 9.0, 18.0, 29.0, 34.0, 25.0, 34.0, 33.0, 37.0, 38.0, 33.0, 42.0, 44.0, 47.0, 44.0, 50.0, 51.0, 42.0, 35.0, 35.0, 31.0, 30.0, 29.0, 22.0, 29.0, 20.0, 14.0, 17.0, 9.0, 11.0, 9.0, 6.0, 12.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.0115966796875, -0.011211633682250977, -0.010826587677001953, -0.01044154167175293, -0.010056495666503906, -0.009671449661254883, -0.00928640365600586, -0.008901357650756836, -0.008516311645507812, -0.008131265640258789, -0.007746219635009766, -0.007361173629760742, -0.006976127624511719, -0.006591081619262695, -0.006206035614013672, -0.0058209896087646484, -0.005435943603515625, -0.0050508975982666016, -0.004665851593017578, -0.004280805587768555, -0.0038957595825195312, -0.003510713577270508, -0.0031256675720214844, -0.002740621566772461, -0.0023555755615234375, -0.001970529556274414, -0.0015854835510253906, -0.0012004375457763672, -0.0008153915405273438, -0.0004303455352783203, -4.5299530029296875e-05, 0.00033974647521972656, 0.00072479248046875, 0.0011098384857177734, 0.0014948844909667969, 0.0018799304962158203, 0.0022649765014648438, 0.002650022506713867, 0.0030350685119628906, 0.003420114517211914, 0.0038051605224609375, 0.004190206527709961, 0.004575252532958984, 0.004960298538208008, 0.005345344543457031, 0.005730390548706055, 0.006115436553955078, 0.0065004825592041016, 0.006885528564453125, 0.0072705745697021484, 0.007655620574951172, 0.008040666580200195, 0.008425712585449219, 0.008810758590698242, 0.009195804595947266, 0.009580850601196289, 0.009965896606445312, 0.010350942611694336, 0.01073598861694336, 0.011121034622192383, 0.011506080627441406, 0.01189112663269043, 0.012276172637939453, 0.012661218643188477, 0.0130462646484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 7.0, 10.0, 21.0, 35.0, 60.0, 93.0, 169.0, 288.0, 462.0, 888.0, 1614.0, 3133.0, 5998.0, 12416.0, 27105.0, 67146.0, 204810.0, 414119.0, 194698.0, 64896.0, 26258.0, 11984.0, 5791.0, 2952.0, 1627.0, 795.0, 479.0, 263.0, 177.0, 95.0, 57.0, 33.0, 23.0, 11.0, 14.0, 6.0, 3.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004261016845703125, -0.00412982702255249, -0.0039986371994018555, -0.0038674473762512207, -0.003736257553100586, -0.003605067729949951, -0.0034738779067993164, -0.0033426880836486816, -0.003211498260498047, -0.003080308437347412, -0.0029491186141967773, -0.0028179287910461426, -0.002686738967895508, -0.002555549144744873, -0.0024243593215942383, -0.0022931694984436035, -0.0021619796752929688, -0.002030789852142334, -0.0018996000289916992, -0.0017684102058410645, -0.0016372203826904297, -0.001506030559539795, -0.0013748407363891602, -0.0012436509132385254, -0.0011124610900878906, -0.0009812712669372559, -0.0008500814437866211, -0.0007188916206359863, -0.0005877017974853516, -0.0004565119743347168, -0.00032532215118408203, -0.00019413232803344727, -6.29425048828125e-05, 6.824731826782227e-05, 0.00019943714141845703, 0.0003306269645690918, 0.00046181678771972656, 0.0005930066108703613, 0.0007241964340209961, 0.0008553862571716309, 0.0009865760803222656, 0.0011177659034729004, 0.0012489557266235352, 0.00138014554977417, 0.0015113353729248047, 0.0016425251960754395, 0.0017737150192260742, 0.001904904842376709, 0.0020360946655273438, 0.0021672844886779785, 0.0022984743118286133, 0.002429664134979248, 0.002560853958129883, 0.0026920437812805176, 0.0028232336044311523, 0.002954423427581787, 0.003085613250732422, 0.0032168030738830566, 0.0033479928970336914, 0.003479182720184326, 0.003610372543334961, 0.0037415623664855957, 0.0038727521896362305, 0.004003942012786865, 0.0041351318359375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 10.0, 10.0, 12.0, 19.0, 14.0, 16.0, 19.0, 30.0, 37.0, 42.0, 34.0, 47.0, 0.0, 49.0, 58.0, 65.0, 61.0, 53.0, 68.0, 44.0, 46.0, 51.0, 43.0, 39.0, 29.0, 27.0, 11.0, 15.0, 0.0, 11.0, 9.0, 8.0, 9.0, 7.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.9669532775878906e-06, -1.911073923110962e-06, -1.8551945686340332e-06, -1.7993152141571045e-06, -1.7434358596801758e-06, -1.687556505203247e-06, -1.6316771507263184e-06, -1.5757977962493896e-06, -1.519918441772461e-06, -1.4640390872955322e-06, -1.4081597328186035e-06, -1.3522803783416748e-06, -1.296401023864746e-06, -1.2405216693878174e-06, -1.1846423149108887e-06, -1.12876296043396e-06, -1.0728836059570312e-06, -1.0170042514801025e-06, -9.611248970031738e-07, -9.052455425262451e-07, -8.493661880493164e-07, -7.934868335723877e-07, -7.37607479095459e-07, -6.817281246185303e-07, -6.258487701416016e-07, -5.699694156646729e-07, -5.140900611877441e-07, -4.5821070671081543e-07, -4.023313522338867e-07, -3.46451997756958e-07, -2.905726432800293e-07, -2.3469328880310059e-07, -1.7881393432617188e-07, -1.2293457984924316e-07, -6.705522537231445e-08, -1.1175870895385742e-08, 4.470348358154297e-08, 1.0058283805847168e-07, 1.564621925354004e-07, 2.123415470123291e-07, 2.682209014892578e-07, 3.241002559661865e-07, 3.7997961044311523e-07, 4.3585896492004395e-07, 4.917383193969727e-07, 5.476176738739014e-07, 6.034970283508301e-07, 6.593763828277588e-07, 7.152557373046875e-07, 7.711350917816162e-07, 8.270144462585449e-07, 8.828938007354736e-07, 9.387731552124023e-07, 9.94652509689331e-07, 1.0505318641662598e-06, 1.1064112186431885e-06, 1.1622905731201172e-06, 1.218169927597046e-06, 1.2740492820739746e-06, 1.3299286365509033e-06, 1.385807991027832e-06, 1.4416873455047607e-06, 1.4975666999816895e-06, 1.5534460544586182e-06, 1.6093254089355469e-06]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 6.0, 6.0, 8.0, 9.0, 25.0, 31.0, 43.0, 68.0, 134.0, 204.0, 414.0, 741.0, 1337.0, 2624.0, 5206.0, 11274.0, 26576.0, 69611.0, 213638.0, 401937.0, 201916.0, 66381.0, 25086.0, 10771.0, 5072.0, 2528.0, 1268.0, 697.0, 390.0, 221.0, 120.0, 75.0, 51.0, 20.0, 23.0, 15.0, 9.0, 4.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0042266845703125, -0.004092395305633545, -0.00395810604095459, -0.0038238167762756348, -0.0036895275115966797, -0.0035552382469177246, -0.0034209489822387695, -0.0032866597175598145, -0.0031523704528808594, -0.0030180811882019043, -0.0028837919235229492, -0.002749502658843994, -0.002615213394165039, -0.002480924129486084, -0.002346634864807129, -0.002212345600128174, -0.0020780563354492188, -0.0019437670707702637, -0.0018094778060913086, -0.0016751885414123535, -0.0015408992767333984, -0.0014066100120544434, -0.0012723207473754883, -0.0011380314826965332, -0.0010037422180175781, -0.000869452953338623, -0.000735163688659668, -0.0006008744239807129, -0.0004665851593017578, -0.00033229589462280273, -0.00019800662994384766, -6.371736526489258e-05, 7.05718994140625e-05, 0.00020486116409301758, 0.00033915042877197266, 0.00047343969345092773, 0.0006077289581298828, 0.0007420182228088379, 0.000876307487487793, 0.001010596752166748, 0.0011448860168457031, 0.0012791752815246582, 0.0014134645462036133, 0.0015477538108825684, 0.0016820430755615234, 0.0018163323402404785, 0.0019506216049194336, 0.0020849108695983887, 0.0022192001342773438, 0.002353489398956299, 0.002487778663635254, 0.002622067928314209, 0.002756357192993164, 0.002890646457672119, 0.0030249357223510742, 0.0031592249870300293, 0.0032935142517089844, 0.0034278035163879395, 0.0035620927810668945, 0.0036963820457458496, 0.0038306713104248047, 0.00396496057510376, 0.004099249839782715, 0.00423353910446167, 0.004367828369140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 4.0, 4.0, 7.0, 11.0, 8.0, 18.0, 24.0, 17.0, 27.0, 35.0, 56.0, 73.0, 69.0, 93.0, 93.0, 90.0, 78.0, 47.0, 45.0, 43.0, 29.0, 31.0, 21.0, 20.0, 15.0, 8.0, 8.0, 11.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004528045654296875, -0.0043808817863464355, -0.004233717918395996, -0.004086554050445557, -0.003939390182495117, -0.0037922263145446777, -0.0036450624465942383, -0.003497898578643799, -0.0033507347106933594, -0.00320357084274292, -0.0030564069747924805, -0.002909243106842041, -0.0027620792388916016, -0.002614915370941162, -0.0024677515029907227, -0.002320587635040283, -0.0021734237670898438, -0.0020262598991394043, -0.0018790960311889648, -0.0017319321632385254, -0.001584768295288086, -0.0014376044273376465, -0.001290440559387207, -0.0011432766914367676, -0.0009961128234863281, -0.0008489489555358887, -0.0007017850875854492, -0.0005546212196350098, -0.0004074573516845703, -0.00026029348373413086, -0.0001131296157836914, 3.403425216674805e-05, 0.0001811981201171875, 0.00032836198806762695, 0.0004755258560180664, 0.0006226897239685059, 0.0007698535919189453, 0.0009170174598693848, 0.0010641813278198242, 0.0012113451957702637, 0.0013585090637207031, 0.0015056729316711426, 0.001652836799621582, 0.0018000006675720215, 0.001947164535522461, 0.0020943284034729004, 0.00224149227142334, 0.0023886561393737793, 0.0025358200073242188, 0.002682983875274658, 0.0028301477432250977, 0.002977311611175537, 0.0031244754791259766, 0.003271639347076416, 0.0034188032150268555, 0.003565967082977295, 0.0037131309509277344, 0.003860294818878174, 0.004007458686828613, 0.004154622554779053, 0.004301786422729492, 0.004448950290679932, 0.004596114158630371, 0.0047432780265808105, 0.00489044189453125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 10.0, 18.0, 47.0, 94.0, 187.0, 247.0, 193.0, 100.0, 56.0, 27.0, 11.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14375555515289307, -0.1405414491891861, -0.13732734322547913, -0.13411323726177216, -0.13089913129806519, -0.12768502533435822, -0.12447091937065125, -0.12125681340694427, -0.1180427074432373, -0.11482860147953033, -0.11161449551582336, -0.1084003895521164, -0.10518628358840942, -0.10197217762470245, -0.09875807166099548, -0.09554396569728851, -0.09232985973358154, -0.08911575376987457, -0.0859016478061676, -0.08268754184246063, -0.07947343587875366, -0.07625932991504669, -0.07304522395133972, -0.06983111798763275, -0.06661700457334518, -0.06340289860963821, -0.060188792645931244, -0.056974686682224274, -0.0537605807185173, -0.05054647475481033, -0.04733236879110336, -0.04411826282739639, -0.04090415686368942, -0.03769005089998245, -0.03447594493627548, -0.03126183897256851, -0.028047733008861542, -0.024833625182509422, -0.021619519218802452, -0.018405413255095482, -0.015191307291388512, -0.011977201327681541, -0.008763095363974571, -0.005548988468945026, -0.002334882505238056, 0.0008792243897914886, 0.004093330353498459, 0.007307436317205429, 0.0105215422809124, 0.01373564824461937, 0.01694975420832634, 0.02016386017203331, 0.02337796613574028, 0.0265920739620924, 0.02980617992579937, 0.03302028775215149, 0.03623439371585846, 0.03944849967956543, 0.0426626056432724, 0.04587671160697937, 0.04909081757068634, 0.05230492353439331, 0.05551902949810028, 0.05873313546180725, 0.06194724142551422]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 9.0, 3.0, 8.0, 3.0, 10.0, 9.0, 12.0, 11.0, 24.0, 21.0, 14.0, 17.0, 17.0, 23.0, 33.0, 25.0, 34.0, 36.0, 28.0, 37.0, 29.0, 37.0, 35.0, 34.0, 35.0, 35.0, 33.0, 46.0, 28.0, 30.0, 33.0, 27.0, 33.0, 23.0, 26.0, 18.0, 18.0, 9.0, 18.0, 12.0, 13.0, 14.0, 8.0, 12.0, 2.0, 9.0, 3.0, 4.0, 1.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.027138233184814453, -0.026266587898135185, -0.025394942611455917, -0.02452329732477665, -0.02365165203809738, -0.022780006751418114, -0.021908361464738846, -0.021036716178059578, -0.02016507089138031, -0.019293425604701042, -0.018421780318021774, -0.017550135031342506, -0.01667848974466324, -0.01580684445798397, -0.014935199171304703, -0.014063553884625435, -0.013191908597946167, -0.012320263311266899, -0.011448618024587631, -0.010576972737908363, -0.009705327451229095, -0.008833682164549828, -0.00796203687787056, -0.007090391591191292, -0.006218746304512024, -0.005347101017832756, -0.004475455731153488, -0.0036038104444742203, -0.0027321651577949524, -0.0018605198711156845, -0.0009888745844364166, -0.00011722929775714874, 0.0007544159889221191, 0.001626061275601387, 0.002497706562280655, 0.003369351848959923, 0.004240997135639191, 0.0051126424223184586, 0.0059842877089977264, 0.006855932995676994, 0.007727578282356262, 0.00859922356903553, 0.009470868855714798, 0.010342514142394066, 0.011214159429073334, 0.012085804715752602, 0.01295745000243187, 0.013829095289111137, 0.014700740575790405, 0.015572385862469673, 0.01644403114914894, 0.01731567643582821, 0.018187321722507477, 0.019058967009186745, 0.019930612295866013, 0.02080225758254528, 0.02167390286922455, 0.022545548155903816, 0.023417193442583084, 0.024288838729262352, 0.02516048401594162, 0.026032129302620888, 0.026903774589300156, 0.027775419875979424, 0.02864706516265869]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 15.0, 13.0, 20.0, 16.0, 30.0, 43.0, 62.0, 107.0, 199.0, 314.0, 804.0, 1896.0, 4994.0, 15772.0, 59481.0, 496162.0, 2996061.0, 534592.0, 59998.0, 15269.0, 4933.0, 1845.0, 755.0, 379.0, 184.0, 104.0, 65.0, 46.0, 34.0, 19.0, 11.0, 11.0, 9.0, 8.0, 3.0, 4.0, 9.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01297760009765625, -0.0125657320022583, -0.012153863906860352, -0.011741995811462402, -0.011330127716064453, -0.010918259620666504, -0.010506391525268555, -0.010094523429870605, -0.009682655334472656, -0.009270787239074707, -0.008858919143676758, -0.008447051048278809, -0.00803518295288086, -0.00762331485748291, -0.007211446762084961, -0.006799578666687012, -0.0063877105712890625, -0.005975842475891113, -0.005563974380493164, -0.005152106285095215, -0.004740238189697266, -0.004328370094299316, -0.003916501998901367, -0.003504633903503418, -0.0030927658081054688, -0.0026808977127075195, -0.0022690296173095703, -0.001857161521911621, -0.0014452934265136719, -0.0010334253311157227, -0.0006215572357177734, -0.00020968914031982422, 0.000202178955078125, 0.0006140470504760742, 0.0010259151458740234, 0.0014377832412719727, 0.0018496513366699219, 0.002261519432067871, 0.0026733875274658203, 0.0030852556228637695, 0.0034971237182617188, 0.003908991813659668, 0.004320859909057617, 0.004732728004455566, 0.005144596099853516, 0.005556464195251465, 0.005968332290649414, 0.006380200386047363, 0.0067920684814453125, 0.007203936576843262, 0.007615804672241211, 0.00802767276763916, 0.00843954086303711, 0.008851408958435059, 0.009263277053833008, 0.009675145149230957, 0.010087013244628906, 0.010498881340026855, 0.010910749435424805, 0.011322617530822754, 0.011734485626220703, 0.012146353721618652, 0.012558221817016602, 0.01297008991241455, 0.0133819580078125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 8.0, 9.0, 17.0, 30.0, 38.0, 39.0, 57.0, 64.0, 65.0, 88.0, 86.0, 82.0, 74.0, 62.0, 80.0, 59.0, 49.0, 31.0, 25.0, 19.0, 12.0, 8.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00803375244140625, -0.007756710052490234, -0.007479667663574219, -0.007202625274658203, -0.0069255828857421875, -0.006648540496826172, -0.006371498107910156, -0.006094455718994141, -0.005817413330078125, -0.005540370941162109, -0.005263328552246094, -0.004986286163330078, -0.0047092437744140625, -0.004432201385498047, -0.004155158996582031, -0.0038781166076660156, -0.00360107421875, -0.0033240318298339844, -0.0030469894409179688, -0.002769947052001953, -0.0024929046630859375, -0.002215862274169922, -0.0019388198852539062, -0.0016617774963378906, -0.001384735107421875, -0.0011076927185058594, -0.0008306503295898438, -0.0005536079406738281, -0.0002765655517578125, 4.76837158203125e-07, 0.00027751922607421875, 0.0005545616149902344, 0.00083160400390625, 0.0011086463928222656, 0.0013856887817382812, 0.0016627311706542969, 0.0019397735595703125, 0.002216815948486328, 0.0024938583374023438, 0.0027709007263183594, 0.003047943115234375, 0.0033249855041503906, 0.0036020278930664062, 0.003879070281982422, 0.0041561126708984375, 0.004433155059814453, 0.004710197448730469, 0.004987239837646484, 0.0052642822265625, 0.005541324615478516, 0.005818367004394531, 0.006095409393310547, 0.0063724517822265625, 0.006649494171142578, 0.006926536560058594, 0.007203578948974609, 0.007480621337890625, 0.007757663726806641, 0.008034706115722656, 0.008311748504638672, 0.008588790893554688, 0.008865833282470703, 0.009142875671386719, 0.009419918060302734, 0.00969696044921875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 6.0, 7.0, 5.0, 15.0, 17.0, 22.0, 35.0, 59.0, 94.0, 169.0, 274.0, 481.0, 833.0, 1706.0, 3612.0, 8035.0, 18815.0, 51190.0, 168915.0, 951568.0, 2463267.0, 377528.0, 93068.0, 31478.0, 12200.0, 5437.0, 2571.0, 1301.0, 680.0, 367.0, 182.0, 147.0, 64.0, 39.0, 31.0, 19.0, 12.0, 7.0, 5.0, 4.0, 0.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00905609130859375, -0.008756875991821289, -0.008457660675048828, -0.008158445358276367, -0.007859230041503906, -0.007560014724731445, -0.007260799407958984, -0.0069615840911865234, -0.0066623687744140625, -0.0063631534576416016, -0.006063938140869141, -0.00576472282409668, -0.005465507507324219, -0.005166292190551758, -0.004867076873779297, -0.004567861557006836, -0.004268646240234375, -0.003969430923461914, -0.003670215606689453, -0.003371000289916992, -0.0030717849731445312, -0.0027725696563720703, -0.0024733543395996094, -0.0021741390228271484, -0.0018749237060546875, -0.0015757083892822266, -0.0012764930725097656, -0.0009772777557373047, -0.0006780624389648438, -0.0003788471221923828, -7.963180541992188e-05, 0.00021958351135253906, 0.000518798828125, 0.0008180141448974609, 0.0011172294616699219, 0.0014164447784423828, 0.0017156600952148438, 0.0020148754119873047, 0.0023140907287597656, 0.0026133060455322266, 0.0029125213623046875, 0.0032117366790771484, 0.0035109519958496094, 0.0038101673126220703, 0.004109382629394531, 0.004408597946166992, 0.004707813262939453, 0.005007028579711914, 0.005306243896484375, 0.005605459213256836, 0.005904674530029297, 0.006203889846801758, 0.006503105163574219, 0.00680232048034668, 0.007101535797119141, 0.0074007511138916016, 0.0076999664306640625, 0.007999181747436523, 0.008298397064208984, 0.008597612380981445, 0.008896827697753906, 0.009196043014526367, 0.009495258331298828, 0.009794473648071289, 0.01009368896484375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 9.0, 5.0, 10.0, 10.0, 15.0, 12.0, 26.0, 34.0, 34.0, 32.0, 62.0, 79.0, 129.0, 133.0, 210.0, 316.0, 470.0, 629.0, 509.0, 386.0, 266.0, 169.0, 121.0, 89.0, 58.0, 59.0, 42.0, 27.0, 29.0, 22.0, 17.0, 16.0, 7.0, 9.0, 4.0, 5.0, 2.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.01025390625, -0.009966850280761719, -0.009679794311523438, -0.009392738342285156, -0.009105682373046875, -0.008818626403808594, -0.008531570434570312, -0.008244514465332031, -0.00795745849609375, -0.007670402526855469, -0.0073833465576171875, -0.007096290588378906, -0.006809234619140625, -0.006522178649902344, -0.0062351226806640625, -0.005948066711425781, -0.0056610107421875, -0.005373954772949219, -0.0050868988037109375, -0.004799842834472656, -0.004512786865234375, -0.004225730895996094, -0.0039386749267578125, -0.0036516189575195312, -0.00336456298828125, -0.0030775070190429688, -0.0027904510498046875, -0.0025033950805664062, -0.002216339111328125, -0.0019292831420898438, -0.0016422271728515625, -0.0013551712036132812, -0.001068115234375, -0.0007810592651367188, -0.0004940032958984375, -0.00020694732666015625, 8.0108642578125e-05, 0.00036716461181640625, 0.0006542205810546875, 0.0009412765502929688, 0.00122833251953125, 0.0015153884887695312, 0.0018024444580078125, 0.0020895004272460938, 0.002376556396484375, 0.0026636123657226562, 0.0029506683349609375, 0.0032377243041992188, 0.0035247802734375, 0.0038118362426757812, 0.0040988922119140625, 0.004385948181152344, 0.004673004150390625, 0.004960060119628906, 0.0052471160888671875, 0.005534172058105469, 0.00582122802734375, 0.006108283996582031, 0.0063953399658203125, 0.006682395935058594, 0.006969451904296875, 0.007256507873535156, 0.0075435638427734375, 0.007830619812011719, 0.00811767578125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 17.0, 28.0, 77.0, 115.0, 176.0, 203.0, 150.0, 116.0, 49.0, 38.0, 16.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11348187178373337, -0.11067906767129898, -0.107876256108284, -0.10507345199584961, -0.10227064788341522, -0.09946784377098083, -0.09666503965854645, -0.09386222809553146, -0.09105942398309708, -0.08825661987066269, -0.0854538083076477, -0.08265100419521332, -0.07984820008277893, -0.07704539597034454, -0.07424259185791016, -0.07143978029489517, -0.06863697618246078, -0.0658341720700264, -0.06303136050701141, -0.060228556394577026, -0.05742575228214264, -0.05462294816970825, -0.051820140331983566, -0.04901733249425888, -0.04621452838182449, -0.043411724269390106, -0.04060891643166542, -0.037806108593940735, -0.03500330448150635, -0.03220050036907196, -0.029397692531347275, -0.02659488655626774, -0.023792080581188202, -0.020989274606108665, -0.01818646863102913, -0.015383662655949593, -0.012580856680870056, -0.00977805070579052, -0.006975244730710983, -0.004172438755631447, -0.0013696327805519104, 0.001433173194527626, 0.0042359791696071625, 0.007038785144686699, 0.009841591119766235, 0.012644397094845772, 0.015447203069925308, 0.018250009045004845, 0.02105281502008438, 0.023855620995163918, 0.026658426970243454, 0.02946123294532299, 0.03226403892040253, 0.035066843032836914, 0.0378696508705616, 0.040672458708286285, 0.04347526282072067, 0.04627806693315506, 0.049080874770879745, 0.05188368260860443, 0.05468648672103882, 0.057489290833473206, 0.06029209867119789, 0.06309490650892258, 0.06589771062135696]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 6.0, 3.0, 5.0, 7.0, 12.0, 11.0, 17.0, 16.0, 18.0, 22.0, 28.0, 31.0, 25.0, 27.0, 35.0, 49.0, 40.0, 44.0, 40.0, 48.0, 46.0, 41.0, 53.0, 38.0, 36.0, 33.0, 35.0, 35.0, 32.0, 29.0, 15.0, 25.0, 22.0, 13.0, 11.0, 11.0, 10.0, 3.0, 3.0, 8.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.030679166316986084, -0.029681259766221046, -0.02868335321545601, -0.02768544666469097, -0.026687540113925934, -0.025689633563160896, -0.02469172701239586, -0.02369382046163082, -0.022695913910865784, -0.021698007360100746, -0.02070010080933571, -0.01970219425857067, -0.018704287707805634, -0.017706381157040596, -0.01670847460627556, -0.01571056805551052, -0.014712661504745483, -0.013714754953980446, -0.012716848403215408, -0.01171894185245037, -0.010721035301685333, -0.009723128750920296, -0.008725222200155258, -0.007727315649390221, -0.006729409098625183, -0.005731502547860146, -0.004733595997095108, -0.0037356894463300705, -0.002737782895565033, -0.0017398763447999954, -0.0007419697940349579, 0.00025593675673007965, 0.0012538433074951172, 0.0022517498582601547, 0.0032496564090251923, 0.00424756295979023, 0.005245469510555267, 0.006243376061320305, 0.007241282612085342, 0.00823918916285038, 0.009237095713615417, 0.010235002264380455, 0.011232908815145493, 0.01223081536591053, 0.013228721916675568, 0.014226628467440605, 0.015224535018205643, 0.01622244156897068, 0.017220348119735718, 0.018218254670500755, 0.019216161221265793, 0.02021406777203083, 0.021211974322795868, 0.022209880873560905, 0.023207787424325943, 0.02420569397509098, 0.025203600525856018, 0.026201507076621056, 0.027199413627386093, 0.02819732017815113, 0.029195226728916168, 0.030193133279681206, 0.031191039830446243, 0.03218894451856613, 0.03318685293197632]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 0.0, 13.0, 15.0, 32.0, 47.0, 96.0, 197.0, 404.0, 1007.0, 3256.0, 14751.0, 90785.0, 522938.0, 349882.0, 52415.0, 9045.0, 2180.0, 774.0, 353.0, 170.0, 69.0, 48.0, 27.0, 14.0, 8.0, 8.0, 8.0, 0.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.030364990234375, -0.029468059539794922, -0.028571128845214844, -0.027674198150634766, -0.026777267456054688, -0.02588033676147461, -0.02498340606689453, -0.024086475372314453, -0.023189544677734375, -0.022292613983154297, -0.02139568328857422, -0.02049875259399414, -0.019601821899414062, -0.018704891204833984, -0.017807960510253906, -0.016911029815673828, -0.01601409912109375, -0.015117168426513672, -0.014220237731933594, -0.013323307037353516, -0.012426376342773438, -0.01152944564819336, -0.010632514953613281, -0.009735584259033203, -0.008838653564453125, -0.007941722869873047, -0.007044792175292969, -0.006147861480712891, -0.0052509307861328125, -0.004354000091552734, -0.0034570693969726562, -0.002560138702392578, -0.0016632080078125, -0.0007662773132324219, 0.00013065338134765625, 0.0010275840759277344, 0.0019245147705078125, 0.0028214454650878906, 0.0037183761596679688, 0.004615306854248047, 0.005512237548828125, 0.006409168243408203, 0.007306098937988281, 0.00820302963256836, 0.009099960327148438, 0.009996891021728516, 0.010893821716308594, 0.011790752410888672, 0.01268768310546875, 0.013584613800048828, 0.014481544494628906, 0.015378475189208984, 0.016275405883789062, 0.01717233657836914, 0.01806926727294922, 0.018966197967529297, 0.019863128662109375, 0.020760059356689453, 0.02165699005126953, 0.02255392074584961, 0.023450851440429688, 0.024347782135009766, 0.025244712829589844, 0.026141643524169922, 0.02703857421875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 10.0, 10.0, 15.0, 19.0, 30.0, 34.0, 52.0, 53.0, 66.0, 67.0, 63.0, 80.0, 74.0, 85.0, 59.0, 54.0, 56.0, 48.0, 31.0, 23.0, 21.0, 20.0, 8.0, 10.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00765228271484375, -0.00739741325378418, -0.007142543792724609, -0.006887674331665039, -0.006632804870605469, -0.0063779354095458984, -0.006123065948486328, -0.005868196487426758, -0.0056133270263671875, -0.005358457565307617, -0.005103588104248047, -0.0048487186431884766, -0.004593849182128906, -0.004338979721069336, -0.004084110260009766, -0.0038292407989501953, -0.003574371337890625, -0.0033195018768310547, -0.0030646324157714844, -0.002809762954711914, -0.0025548934936523438, -0.0023000240325927734, -0.002045154571533203, -0.0017902851104736328, -0.0015354156494140625, -0.0012805461883544922, -0.0010256767272949219, -0.0007708072662353516, -0.0005159378051757812, -0.00026106834411621094, -6.198883056640625e-06, 0.0002486705780029297, 0.0005035400390625, 0.0007584095001220703, 0.0010132789611816406, 0.001268148422241211, 0.0015230178833007812, 0.0017778873443603516, 0.002032756805419922, 0.002287626266479492, 0.0025424957275390625, 0.002797365188598633, 0.003052234649658203, 0.0033071041107177734, 0.0035619735717773438, 0.003816843032836914, 0.004071712493896484, 0.004326581954956055, 0.004581451416015625, 0.004836320877075195, 0.005091190338134766, 0.005346059799194336, 0.005600929260253906, 0.0058557987213134766, 0.006110668182373047, 0.006365537643432617, 0.0066204071044921875, 0.006875276565551758, 0.007130146026611328, 0.0073850154876708984, 0.007639884948730469, 0.007894754409790039, 0.00814962387084961, 0.00840449333190918, 0.00865936279296875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 4.0, 16.0, 12.0, 18.0, 38.0, 65.0, 87.0, 154.0, 236.0, 478.0, 1009.0, 2242.0, 5506.0, 16071.0, 53391.0, 201981.0, 469718.0, 213777.0, 56387.0, 16860.0, 5850.0, 2398.0, 1075.0, 503.0, 245.0, 146.0, 90.0, 56.0, 29.0, 28.0, 23.0, 14.0, 13.0, 3.0, 10.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0155181884765625, -0.014974117279052734, -0.014430046081542969, -0.013885974884033203, -0.013341903686523438, -0.012797832489013672, -0.012253761291503906, -0.01170969009399414, -0.011165618896484375, -0.01062154769897461, -0.010077476501464844, -0.009533405303955078, -0.008989334106445312, -0.008445262908935547, -0.007901191711425781, -0.007357120513916016, -0.00681304931640625, -0.006268978118896484, -0.005724906921386719, -0.005180835723876953, -0.0046367645263671875, -0.004092693328857422, -0.0035486221313476562, -0.0030045509338378906, -0.002460479736328125, -0.0019164085388183594, -0.0013723373413085938, -0.0008282661437988281, -0.0002841949462890625, 0.0002598762512207031, 0.0008039474487304688, 0.0013480186462402344, 0.00189208984375, 0.0024361610412597656, 0.0029802322387695312, 0.003524303436279297, 0.0040683746337890625, 0.004612445831298828, 0.005156517028808594, 0.005700588226318359, 0.006244659423828125, 0.006788730621337891, 0.007332801818847656, 0.007876873016357422, 0.008420944213867188, 0.008965015411376953, 0.009509086608886719, 0.010053157806396484, 0.01059722900390625, 0.011141300201416016, 0.011685371398925781, 0.012229442596435547, 0.012773513793945312, 0.013317584991455078, 0.013861656188964844, 0.01440572738647461, 0.014949798583984375, 0.01549386978149414, 0.016037940979003906, 0.016582012176513672, 0.017126083374023438, 0.017670154571533203, 0.01821422576904297, 0.018758296966552734, 0.0193023681640625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 6.0, 7.0, 9.0, 13.0, 24.0, 23.0, 33.0, 33.0, 30.0, 33.0, 35.0, 41.0, 43.0, 52.0, 43.0, 54.0, 60.0, 55.0, 46.0, 38.0, 38.0, 33.0, 29.0, 36.0, 42.0, 33.0, 21.0, 18.0, 17.0, 11.0, 12.0, 5.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01294708251953125, -0.012468934059143066, -0.011990785598754883, -0.0115126371383667, -0.011034488677978516, -0.010556340217590332, -0.010078191757202148, -0.009600043296813965, -0.009121894836425781, -0.008643746376037598, -0.008165597915649414, -0.0076874494552612305, -0.007209300994873047, -0.006731152534484863, -0.00625300407409668, -0.005774855613708496, -0.0052967071533203125, -0.004818558692932129, -0.004340410232543945, -0.0038622617721557617, -0.003384113311767578, -0.0029059648513793945, -0.002427816390991211, -0.0019496679306030273, -0.0014715194702148438, -0.0009933710098266602, -0.0005152225494384766, -3.707408905029297e-05, 0.0004410743713378906, 0.0009192228317260742, 0.0013973712921142578, 0.0018755197525024414, 0.002353668212890625, 0.0028318166732788086, 0.003309965133666992, 0.0037881135940551758, 0.004266262054443359, 0.004744410514831543, 0.0052225589752197266, 0.00570070743560791, 0.006178855895996094, 0.006657004356384277, 0.007135152816772461, 0.0076133012771606445, 0.008091449737548828, 0.008569598197937012, 0.009047746658325195, 0.009525895118713379, 0.010004043579101562, 0.010482192039489746, 0.01096034049987793, 0.011438488960266113, 0.011916637420654297, 0.01239478588104248, 0.012872934341430664, 0.013351082801818848, 0.013829231262207031, 0.014307379722595215, 0.014785528182983398, 0.015263676643371582, 0.015741825103759766, 0.01621997356414795, 0.016698122024536133, 0.017176270484924316, 0.0176544189453125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 8.0, 15.0, 14.0, 5.0, 18.0, 26.0, 42.0, 84.0, 143.0, 217.0, 359.0, 635.0, 1065.0, 1889.0, 3876.0, 9041.0, 23444.0, 69596.0, 235264.0, 440899.0, 175431.0, 53462.0, 18464.0, 7411.0, 3199.0, 1726.0, 886.0, 499.0, 291.0, 174.0, 115.0, 102.0, 62.0, 33.0, 26.0, 11.0, 8.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00621795654296875, -0.006037116050720215, -0.00585627555847168, -0.0056754350662231445, -0.005494594573974609, -0.005313754081726074, -0.005132913589477539, -0.004952073097229004, -0.004771232604980469, -0.004590392112731934, -0.0044095516204833984, -0.004228711128234863, -0.004047870635986328, -0.003867030143737793, -0.003686189651489258, -0.0035053491592407227, -0.0033245086669921875, -0.0031436681747436523, -0.002962827682495117, -0.002781987190246582, -0.002601146697998047, -0.0024203062057495117, -0.0022394657135009766, -0.0020586252212524414, -0.0018777847290039062, -0.001696944236755371, -0.001516103744506836, -0.0013352632522583008, -0.0011544227600097656, -0.0009735822677612305, -0.0007927417755126953, -0.0006119012832641602, -0.000431060791015625, -0.00025022029876708984, -6.937980651855469e-05, 0.00011146068572998047, 0.0002923011779785156, 0.0004731416702270508, 0.0006539821624755859, 0.0008348226547241211, 0.0010156631469726562, 0.0011965036392211914, 0.0013773441314697266, 0.0015581846237182617, 0.0017390251159667969, 0.001919865608215332, 0.002100706100463867, 0.0022815465927124023, 0.0024623870849609375, 0.0026432275772094727, 0.002824068069458008, 0.003004908561706543, 0.003185749053955078, 0.0033665895462036133, 0.0035474300384521484, 0.0037282705307006836, 0.003909111022949219, 0.004089951515197754, 0.004270792007446289, 0.004451632499694824, 0.004632472991943359, 0.0048133134841918945, 0.00499415397644043, 0.005174994468688965, 0.0053558349609375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 9.0, 3.0, 7.0, 9.0, 17.0, 21.0, 10.0, 23.0, 54.0, 38.0, 46.0, 22.0, 109.0, 58.0, 48.0, 43.0, 49.0, 102.0, 46.0, 53.0, 30.0, 74.0, 37.0, 23.0, 11.0, 21.0, 11.0, 13.0, 2.0, 4.0, 1.0, 1.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-06, -2.310611307621002e-06, -2.2370368242263794e-06, -2.1634623408317566e-06, -2.089887857437134e-06, -2.016313374042511e-06, -1.942738890647888e-06, -1.8691644072532654e-06, -1.7955899238586426e-06, -1.7220154404640198e-06, -1.648440957069397e-06, -1.5748664736747742e-06, -1.5012919902801514e-06, -1.4277175068855286e-06, -1.3541430234909058e-06, -1.280568540096283e-06, -1.2069940567016602e-06, -1.1334195733070374e-06, -1.0598450899124146e-06, -9.862706065177917e-07, -9.126961231231689e-07, -8.391216397285461e-07, -7.655471563339233e-07, -6.919726729393005e-07, -6.183981895446777e-07, -5.448237061500549e-07, -4.7124922275543213e-07, -3.976747393608093e-07, -3.241002559661865e-07, -2.505257725715637e-07, -1.7695128917694092e-07, -1.0337680578231812e-07, -2.9802322387695312e-08, 4.377216100692749e-08, 1.1734664440155029e-07, 1.909211277961731e-07, 2.644956111907959e-07, 3.380700945854187e-07, 4.116445779800415e-07, 4.852190613746643e-07, 5.587935447692871e-07, 6.323680281639099e-07, 7.059425115585327e-07, 7.795169949531555e-07, 8.530914783477783e-07, 9.266659617424011e-07, 1.000240445137024e-06, 1.0738149285316467e-06, 1.1473894119262695e-06, 1.2209638953208923e-06, 1.2945383787155151e-06, 1.368112862110138e-06, 1.4416873455047607e-06, 1.5152618288993835e-06, 1.5888363122940063e-06, 1.6624107956886292e-06, 1.735985279083252e-06, 1.8095597624778748e-06, 1.8831342458724976e-06, 1.9567087292671204e-06, 2.030283212661743e-06, 2.103857696056366e-06, 2.1774321794509888e-06, 2.2510066628456116e-06, 2.3245811462402344e-06]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 4.0, 11.0, 6.0, 9.0, 11.0, 26.0, 40.0, 48.0, 62.0, 130.0, 249.0, 535.0, 1213.0, 2856.0, 7455.0, 24065.0, 97478.0, 419428.0, 377529.0, 84329.0, 21338.0, 6886.0, 2560.0, 1165.0, 543.0, 248.0, 122.0, 83.0, 30.0, 22.0, 19.0, 19.0, 10.0, 4.0, 4.0, 8.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00738525390625, -0.007161140441894531, -0.0069370269775390625, -0.006712913513183594, -0.006488800048828125, -0.006264686584472656, -0.0060405731201171875, -0.005816459655761719, -0.00559234619140625, -0.005368232727050781, -0.0051441192626953125, -0.004920005798339844, -0.004695892333984375, -0.004471778869628906, -0.0042476654052734375, -0.004023551940917969, -0.0037994384765625, -0.0035753250122070312, -0.0033512115478515625, -0.0031270980834960938, -0.002902984619140625, -0.0026788711547851562, -0.0024547576904296875, -0.0022306442260742188, -0.00200653076171875, -0.0017824172973632812, -0.0015583038330078125, -0.0013341903686523438, -0.001110076904296875, -0.0008859634399414062, -0.0006618499755859375, -0.00043773651123046875, -0.000213623046875, 1.049041748046875e-05, 0.0002346038818359375, 0.00045871734619140625, 0.000682830810546875, 0.0009069442749023438, 0.0011310577392578125, 0.0013551712036132812, 0.00157928466796875, 0.0018033981323242188, 0.0020275115966796875, 0.0022516250610351562, 0.002475738525390625, 0.0026998519897460938, 0.0029239654541015625, 0.0031480789184570312, 0.0033721923828125, 0.0035963058471679688, 0.0038204193115234375, 0.004044532775878906, 0.004268646240234375, 0.004492759704589844, 0.0047168731689453125, 0.004940986633300781, 0.00516510009765625, 0.005389213562011719, 0.0056133270263671875, 0.005837440490722656, 0.006061553955078125, 0.006285667419433594, 0.0065097808837890625, 0.006733894348144531, 0.0069580078125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 3.0, 5.0, 3.0, 13.0, 19.0, 37.0, 35.0, 37.0, 36.0, 63.0, 77.0, 84.0, 109.0, 83.0, 78.0, 73.0, 49.0, 53.0, 33.0, 22.0, 20.0, 11.0, 14.0, 6.0, 7.0, 2.0, 2.0, 6.0, 1.0, 5.0, 4.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0058746337890625, -0.005690276622772217, -0.005505919456481934, -0.00532156229019165, -0.005137205123901367, -0.004952847957611084, -0.004768490791320801, -0.004584133625030518, -0.004399776458740234, -0.004215419292449951, -0.004031062126159668, -0.0038467049598693848, -0.0036623477935791016, -0.0034779906272888184, -0.003293633460998535, -0.003109276294708252, -0.0029249191284179688, -0.0027405619621276855, -0.0025562047958374023, -0.002371847629547119, -0.002187490463256836, -0.0020031332969665527, -0.0018187761306762695, -0.0016344189643859863, -0.0014500617980957031, -0.00126570463180542, -0.0010813474655151367, -0.0008969902992248535, -0.0007126331329345703, -0.0005282759666442871, -0.0003439188003540039, -0.0001595616340637207, 2.47955322265625e-05, 0.0002091526985168457, 0.0003935098648071289, 0.0005778670310974121, 0.0007622241973876953, 0.0009465813636779785, 0.0011309385299682617, 0.001315295696258545, 0.0014996528625488281, 0.0016840100288391113, 0.0018683671951293945, 0.0020527243614196777, 0.002237081527709961, 0.002421438694000244, 0.0026057958602905273, 0.0027901530265808105, 0.0029745101928710938, 0.003158867359161377, 0.00334322452545166, 0.0035275816917419434, 0.0037119388580322266, 0.0038962960243225098, 0.004080653190612793, 0.004265010356903076, 0.004449367523193359, 0.004633724689483643, 0.004818081855773926, 0.005002439022064209, 0.005186796188354492, 0.005371153354644775, 0.005555510520935059, 0.005739867687225342, 0.005924224853515625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 9.0, 6.0, 25.0, 90.0, 226.0, 344.0, 199.0, 61.0, 21.0, 8.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22407685220241547, -0.21868209540843964, -0.2132873386144638, -0.20789258182048798, -0.20249783992767334, -0.1971030831336975, -0.19170832633972168, -0.18631356954574585, -0.18091881275177002, -0.1755240559577942, -0.17012929916381836, -0.16473454236984253, -0.1593397855758667, -0.15394504368305206, -0.14855028688907623, -0.1431555300951004, -0.13776077330112457, -0.13236601650714874, -0.1269712597131729, -0.12157651036977768, -0.11618175357580185, -0.11078699678182602, -0.10539224743843079, -0.09999749064445496, -0.09460273385047913, -0.0892079770565033, -0.08381322026252747, -0.07841847091913223, -0.0730237141251564, -0.06762895733118057, -0.06223420426249504, -0.05683945119380951, -0.05144468694925308, -0.04604993015527725, -0.04065517708659172, -0.03526042401790619, -0.02986566722393036, -0.024470912292599678, -0.019076157361268997, -0.013681404292583466, -0.008286647498607635, -0.0028918925672769547, 0.002502862364053726, 0.007897617295384407, 0.013292372226715088, 0.01868712715804577, 0.02408188208937645, 0.02947663515806198, 0.03487139195203781, 0.04026614874601364, 0.04566090181469917, 0.051055654883384705, 0.056450411677360535, 0.061845168471336365, 0.0672399252653122, 0.07263467460870743, 0.07802943140268326, 0.08342418819665909, 0.08881893754005432, 0.09421369433403015, 0.09960845112800598, 0.10500320792198181, 0.11039796471595764, 0.11579271405935287, 0.1211874708533287]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 8.0, 11.0, 3.0, 11.0, 10.0, 12.0, 16.0, 22.0, 21.0, 24.0, 17.0, 29.0, 28.0, 40.0, 31.0, 35.0, 42.0, 39.0, 35.0, 47.0, 53.0, 44.0, 40.0, 27.0, 43.0, 37.0, 25.0, 39.0, 30.0, 27.0, 22.0, 24.0, 16.0, 14.0, 14.0, 12.0, 5.0, 8.0, 8.0, 3.0, 5.0, 6.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03306734561920166, -0.03200966492295265, -0.030951982364058495, -0.029894299805164337, -0.02883661910891533, -0.02777893841266632, -0.026721255853772163, -0.025663573294878006, -0.024605892598628998, -0.02354821190237999, -0.022490529343485832, -0.021432846784591675, -0.020375166088342667, -0.01931748539209366, -0.0182598028331995, -0.017202120274305344, -0.016144439578056335, -0.015086757950484753, -0.01402907632291317, -0.012971394695341587, -0.011913713067770004, -0.010856031440198421, -0.009798349812626839, -0.008740668185055256, -0.007682986557483673, -0.00662530492991209, -0.0055676233023405075, -0.004509941674768925, -0.003452260047197342, -0.002394578419625759, -0.0013368967920541763, -0.00027921516448259354, 0.0007784664630889893, 0.001836148090660572, 0.002893829718232155, 0.003951511345803738, 0.0050091929733753204, 0.006066874600946903, 0.007124556228518486, 0.008182237856090069, 0.009239919483661652, 0.010297601111233234, 0.011355282738804817, 0.0124129643663764, 0.013470645993947983, 0.014528327621519566, 0.015586009249091148, 0.016643691807985306, 0.017701372504234314, 0.018759053200483322, 0.01981673575937748, 0.020874418318271637, 0.021932099014520645, 0.022989779710769653, 0.02404746226966381, 0.025105144828557968, 0.026162825524806976, 0.027220506221055984, 0.028278188779950142, 0.0293358713388443, 0.030393552035093307, 0.031451232731342316, 0.03250891715288162, 0.03356659784913063, 0.03462427854537964]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 6.0, 15.0, 17.0, 21.0, 43.0, 39.0, 92.0, 167.0, 370.0, 754.0, 1654.0, 3719.0, 10137.0, 31269.0, 126682.0, 1203230.0, 2437208.0, 302987.0, 50629.0, 15005.0, 5593.0, 2332.0, 1083.0, 518.0, 279.0, 158.0, 105.0, 53.0, 34.0, 19.0, 13.0, 7.0, 14.0, 12.0, 1.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.014862060546875, -0.014427661895751953, -0.013993263244628906, -0.01355886459350586, -0.013124465942382812, -0.012690067291259766, -0.012255668640136719, -0.011821269989013672, -0.011386871337890625, -0.010952472686767578, -0.010518074035644531, -0.010083675384521484, -0.009649276733398438, -0.00921487808227539, -0.008780479431152344, -0.008346080780029297, -0.00791168212890625, -0.007477283477783203, -0.007042884826660156, -0.006608486175537109, -0.0061740875244140625, -0.005739688873291016, -0.005305290222167969, -0.004870891571044922, -0.004436492919921875, -0.004002094268798828, -0.0035676956176757812, -0.0031332969665527344, -0.0026988983154296875, -0.0022644996643066406, -0.0018301010131835938, -0.0013957023620605469, -0.0009613037109375, -0.0005269050598144531, -9.250640869140625e-05, 0.0003418922424316406, 0.0007762908935546875, 0.0012106895446777344, 0.0016450881958007812, 0.002079486846923828, 0.002513885498046875, 0.002948284149169922, 0.0033826828002929688, 0.0038170814514160156, 0.0042514801025390625, 0.004685878753662109, 0.005120277404785156, 0.005554676055908203, 0.00598907470703125, 0.006423473358154297, 0.006857872009277344, 0.007292270660400391, 0.0077266693115234375, 0.008161067962646484, 0.008595466613769531, 0.009029865264892578, 0.009464263916015625, 0.009898662567138672, 0.010333061218261719, 0.010767459869384766, 0.011201858520507812, 0.01163625717163086, 0.012070655822753906, 0.012505054473876953, 0.012939453125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 7.0, 7.0, 15.0, 16.0, 19.0, 21.0, 38.0, 42.0, 53.0, 69.0, 63.0, 80.0, 93.0, 76.0, 76.0, 73.0, 60.0, 52.0, 35.0, 30.0, 28.0, 22.0, 12.0, 6.0, 4.0, 6.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00774383544921875, -0.007465362548828125, -0.0071868896484375, -0.006908416748046875, -0.00662994384765625, -0.006351470947265625, -0.006072998046875, -0.005794525146484375, -0.00551605224609375, -0.005237579345703125, -0.0049591064453125, -0.004680633544921875, -0.00440216064453125, -0.004123687744140625, -0.00384521484375, -0.003566741943359375, -0.00328826904296875, -0.003009796142578125, -0.0027313232421875, -0.002452850341796875, -0.00217437744140625, -0.001895904541015625, -0.001617431640625, -0.001338958740234375, -0.00106048583984375, -0.000782012939453125, -0.0005035400390625, -0.000225067138671875, 5.340576171875e-05, 0.000331878662109375, 0.0006103515625, 0.000888824462890625, 0.00116729736328125, 0.001445770263671875, 0.0017242431640625, 0.002002716064453125, 0.00228118896484375, 0.002559661865234375, 0.002838134765625, 0.003116607666015625, 0.00339508056640625, 0.003673553466796875, 0.0039520263671875, 0.004230499267578125, 0.00450897216796875, 0.004787445068359375, 0.00506591796875, 0.005344390869140625, 0.00562286376953125, 0.005901336669921875, 0.0061798095703125, 0.006458282470703125, 0.00673675537109375, 0.007015228271484375, 0.007293701171875, 0.007572174072265625, 0.00785064697265625, 0.008129119873046875, 0.0084075927734375, 0.008686065673828125, 0.00896453857421875, 0.009243011474609375, 0.009521484375, 0.009799957275390625, 0.01007843017578125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 9.0, 13.0, 20.0, 18.0, 44.0, 73.0, 132.0, 258.0, 452.0, 858.0, 1775.0, 3767.0, 9744.0, 31789.0, 146227.0, 1630549.0, 2136431.0, 177058.0, 36147.0, 10879.0, 4163.0, 1852.0, 903.0, 497.0, 260.0, 146.0, 91.0, 46.0, 24.0, 24.0, 15.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01485443115234375, -0.014376044273376465, -0.01389765739440918, -0.013419270515441895, -0.01294088363647461, -0.012462496757507324, -0.011984109878540039, -0.011505722999572754, -0.011027336120605469, -0.010548949241638184, -0.010070562362670898, -0.009592175483703613, -0.009113788604736328, -0.008635401725769043, -0.008157014846801758, -0.007678627967834473, -0.0072002410888671875, -0.006721854209899902, -0.006243467330932617, -0.005765080451965332, -0.005286693572998047, -0.004808306694030762, -0.0043299198150634766, -0.0038515329360961914, -0.0033731460571289062, -0.002894759178161621, -0.002416372299194336, -0.0019379854202270508, -0.0014595985412597656, -0.0009812116622924805, -0.0005028247833251953, -2.4437904357910156e-05, 0.000453948974609375, 0.0009323358535766602, 0.0014107227325439453, 0.0018891096115112305, 0.0023674964904785156, 0.0028458833694458008, 0.003324270248413086, 0.003802657127380371, 0.004281044006347656, 0.004759430885314941, 0.0052378177642822266, 0.005716204643249512, 0.006194591522216797, 0.006672978401184082, 0.007151365280151367, 0.007629752159118652, 0.008108139038085938, 0.008586525917053223, 0.009064912796020508, 0.009543299674987793, 0.010021686553955078, 0.010500073432922363, 0.010978460311889648, 0.011456847190856934, 0.011935234069824219, 0.012413620948791504, 0.012892007827758789, 0.013370394706726074, 0.01384878158569336, 0.014327168464660645, 0.01480555534362793, 0.015283942222595215, 0.0157623291015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 2.0, 3.0, 7.0, 9.0, 2.0, 6.0, 5.0, 17.0, 26.0, 30.0, 50.0, 66.0, 69.0, 121.0, 146.0, 228.0, 357.0, 540.0, 740.0, 539.0, 355.0, 210.0, 151.0, 115.0, 68.0, 48.0, 41.0, 25.0, 20.0, 13.0, 11.0, 15.0, 14.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0117645263671875, -0.011377811431884766, -0.010991096496582031, -0.010604381561279297, -0.010217666625976562, -0.009830951690673828, -0.009444236755371094, -0.00905752182006836, -0.008670806884765625, -0.00828409194946289, -0.007897377014160156, -0.007510662078857422, -0.0071239471435546875, -0.006737232208251953, -0.006350517272949219, -0.005963802337646484, -0.00557708740234375, -0.005190372467041016, -0.004803657531738281, -0.004416942596435547, -0.0040302276611328125, -0.003643512725830078, -0.0032567977905273438, -0.0028700828552246094, -0.002483367919921875, -0.0020966529846191406, -0.0017099380493164062, -0.0013232231140136719, -0.0009365081787109375, -0.0005497932434082031, -0.00016307830810546875, 0.00022363662719726562, 0.0006103515625, 0.0009970664978027344, 0.0013837814331054688, 0.0017704963684082031, 0.0021572113037109375, 0.002543926239013672, 0.0029306411743164062, 0.0033173561096191406, 0.003704071044921875, 0.004090785980224609, 0.004477500915527344, 0.004864215850830078, 0.0052509307861328125, 0.005637645721435547, 0.006024360656738281, 0.006411075592041016, 0.00679779052734375, 0.007184505462646484, 0.007571220397949219, 0.007957935333251953, 0.008344650268554688, 0.008731365203857422, 0.009118080139160156, 0.00950479507446289, 0.009891510009765625, 0.01027822494506836, 0.010664939880371094, 0.011051654815673828, 0.011438369750976562, 0.011825084686279297, 0.012211799621582031, 0.012598514556884766, 0.0129852294921875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 10.0, 20.0, 31.0, 61.0, 101.0, 145.0, 165.0, 147.0, 129.0, 76.0, 50.0, 26.0, 10.0, 11.0, 9.0, 2.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09911265224218369, -0.09618844091892242, -0.09326422214508057, -0.0903400108218193, -0.08741579204797745, -0.08449158072471619, -0.08156736195087433, -0.07864315062761307, -0.0757189393043518, -0.07279472798109055, -0.06987050920724869, -0.06694629788398743, -0.06402207911014557, -0.06109786778688431, -0.05817365273833275, -0.05524943768978119, -0.05232522264122963, -0.04940100759267807, -0.04647679254412651, -0.04355257749557495, -0.04062836617231369, -0.03770415112376213, -0.03477993607521057, -0.03185572475194931, -0.0289315078407526, -0.026007292792201042, -0.023083079606294632, -0.020158864557743073, -0.017234649509191513, -0.014310436323285103, -0.011386221274733543, -0.008462008088827133, -0.005537793040275574, -0.0026135786902159452, 0.00031063565984368324, 0.0032348502427339554, 0.00615906435996294, 0.009083278477191925, 0.012007493525743484, 0.014931706711649895, 0.017855921760201454, 0.020780136808753014, 0.023704349994659424, 0.026628565043210983, 0.029552780091762543, 0.032476991415023804, 0.03540121018886566, 0.03832542151212692, 0.04124963656067848, 0.04417385160923004, 0.0470980666577816, 0.05002228170633316, 0.05294649302959442, 0.05587070807814598, 0.05879492312669754, 0.0617191344499588, 0.06464335322380066, 0.06756756454706192, 0.07049178332090378, 0.07341599464416504, 0.0763402134180069, 0.07926442474126816, 0.08218863606452942, 0.08511285483837128, 0.08803706616163254]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 1.0, 6.0, 6.0, 11.0, 19.0, 9.0, 13.0, 14.0, 15.0, 18.0, 9.0, 26.0, 19.0, 31.0, 28.0, 33.0, 30.0, 32.0, 36.0, 37.0, 42.0, 41.0, 38.0, 42.0, 42.0, 42.0, 33.0, 37.0, 43.0, 29.0, 35.0, 32.0, 21.0, 25.0, 18.0, 10.0, 19.0, 10.0, 7.0, 14.0, 9.0, 4.0, 5.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.036873579025268555, -0.03577630594372749, -0.03467903286218643, -0.03358175978064537, -0.03248448669910431, -0.03138721361756325, -0.030289940536022186, -0.029192667454481125, -0.028095394372940063, -0.026998121291399002, -0.02590084820985794, -0.02480357512831688, -0.023706302046775818, -0.022609028965234756, -0.021511755883693695, -0.020414482802152634, -0.019317209720611572, -0.01821993663907051, -0.01712266355752945, -0.016025390475988388, -0.014928117394447327, -0.013830844312906265, -0.012733571231365204, -0.011636298149824142, -0.010539025068283081, -0.00944175198674202, -0.008344478905200958, -0.007247205823659897, -0.0061499327421188354, -0.005052659660577774, -0.003955386579036713, -0.0028581134974956512, -0.0017608404159545898, -0.0006635673344135284, 0.00043370574712753296, 0.0015309788286685944, 0.0026282519102096558, 0.003725524991750717, 0.0048227980732917786, 0.00592007115483284, 0.007017344236373901, 0.008114617317914963, 0.009211890399456024, 0.010309163480997086, 0.011406436562538147, 0.012503709644079208, 0.01360098272562027, 0.014698255807161331, 0.015795528888702393, 0.016892801970243454, 0.017990075051784515, 0.019087348133325577, 0.020184621214866638, 0.0212818942964077, 0.02237916737794876, 0.023476440459489822, 0.024573713541030884, 0.025670986622571945, 0.026768259704113007, 0.027865532785654068, 0.02896280586719513, 0.03006007894873619, 0.031157352030277252, 0.032254625111818314, 0.033351898193359375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 5.0, 3.0, 7.0, 10.0, 20.0, 21.0, 32.0, 56.0, 65.0, 130.0, 153.0, 261.0, 448.0, 785.0, 1319.0, 2542.0, 4982.0, 10217.0, 22181.0, 52157.0, 130621.0, 304028.0, 298255.0, 127627.0, 50542.0, 21661.0, 9955.0, 4669.0, 2560.0, 1327.0, 694.0, 433.0, 287.0, 163.0, 111.0, 66.0, 59.0, 32.0, 18.0, 12.0, 13.0, 14.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01242828369140625, -0.012013792991638184, -0.011599302291870117, -0.01118481159210205, -0.010770320892333984, -0.010355830192565918, -0.009941339492797852, -0.009526848793029785, -0.009112358093261719, -0.008697867393493652, -0.008283376693725586, -0.00786888599395752, -0.007454395294189453, -0.007039904594421387, -0.00662541389465332, -0.006210923194885254, -0.0057964324951171875, -0.005381941795349121, -0.004967451095581055, -0.004552960395812988, -0.004138469696044922, -0.0037239789962768555, -0.003309488296508789, -0.0028949975967407227, -0.0024805068969726562, -0.00206601619720459, -0.0016515254974365234, -0.001237034797668457, -0.0008225440979003906, -0.0004080533981323242, 6.4373016357421875e-06, 0.0004209280014038086, 0.000835418701171875, 0.0012499094009399414, 0.0016644001007080078, 0.0020788908004760742, 0.0024933815002441406, 0.002907872200012207, 0.0033223628997802734, 0.00373685359954834, 0.004151344299316406, 0.004565834999084473, 0.004980325698852539, 0.0053948163986206055, 0.005809307098388672, 0.006223797798156738, 0.006638288497924805, 0.007052779197692871, 0.0074672698974609375, 0.007881760597229004, 0.00829625129699707, 0.008710741996765137, 0.009125232696533203, 0.00953972339630127, 0.009954214096069336, 0.010368704795837402, 0.010783195495605469, 0.011197686195373535, 0.011612176895141602, 0.012026667594909668, 0.012441158294677734, 0.0128556489944458, 0.013270139694213867, 0.013684630393981934, 0.01409912109375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 2.0, 9.0, 9.0, 11.0, 16.0, 15.0, 34.0, 31.0, 37.0, 51.0, 52.0, 47.0, 62.0, 60.0, 72.0, 70.0, 60.0, 49.0, 52.0, 57.0, 42.0, 43.0, 25.0, 28.0, 12.0, 11.0, 9.0, 9.0, 7.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.008087158203125, -0.007824540138244629, -0.007561922073364258, -0.007299304008483887, -0.007036685943603516, -0.0067740678787231445, -0.0065114498138427734, -0.006248831748962402, -0.005986213684082031, -0.00572359561920166, -0.005460977554321289, -0.005198359489440918, -0.004935741424560547, -0.004673123359680176, -0.004410505294799805, -0.004147887229919434, -0.0038852691650390625, -0.0036226511001586914, -0.0033600330352783203, -0.0030974149703979492, -0.002834796905517578, -0.002572178840637207, -0.002309560775756836, -0.002046942710876465, -0.0017843246459960938, -0.0015217065811157227, -0.0012590885162353516, -0.0009964704513549805, -0.0007338523864746094, -0.0004712343215942383, -0.0002086162567138672, 5.4001808166503906e-05, 0.000316619873046875, 0.0005792379379272461, 0.0008418560028076172, 0.0011044740676879883, 0.0013670921325683594, 0.0016297101974487305, 0.0018923282623291016, 0.0021549463272094727, 0.0024175643920898438, 0.002680182456970215, 0.002942800521850586, 0.003205418586730957, 0.003468036651611328, 0.0037306547164916992, 0.00399327278137207, 0.004255890846252441, 0.0045185089111328125, 0.004781126976013184, 0.005043745040893555, 0.005306363105773926, 0.005568981170654297, 0.005831599235534668, 0.006094217300415039, 0.00635683536529541, 0.006619453430175781, 0.006882071495056152, 0.0071446895599365234, 0.0074073076248168945, 0.007669925689697266, 0.007932543754577637, 0.008195161819458008, 0.008457779884338379, 0.00872039794921875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 9.0, 2.0, 6.0, 10.0, 16.0, 20.0, 40.0, 58.0, 110.0, 204.0, 424.0, 855.0, 1960.0, 4588.0, 11420.0, 29426.0, 86862.0, 291155.0, 408835.0, 139417.0, 44525.0, 16728.0, 6630.0, 2742.0, 1264.0, 576.0, 306.0, 149.0, 87.0, 52.0, 21.0, 20.0, 14.0, 11.0, 6.0, 3.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0186767578125, -0.01816082000732422, -0.017644882202148438, -0.017128944396972656, -0.016613006591796875, -0.016097068786621094, -0.015581130981445312, -0.015065193176269531, -0.01454925537109375, -0.014033317565917969, -0.013517379760742188, -0.013001441955566406, -0.012485504150390625, -0.011969566345214844, -0.011453628540039062, -0.010937690734863281, -0.0104217529296875, -0.009905815124511719, -0.009389877319335938, -0.008873939514160156, -0.008358001708984375, -0.007842063903808594, -0.0073261260986328125, -0.006810188293457031, -0.00629425048828125, -0.005778312683105469, -0.0052623748779296875, -0.004746437072753906, -0.004230499267578125, -0.0037145614624023438, -0.0031986236572265625, -0.0026826858520507812, -0.002166748046875, -0.0016508102416992188, -0.0011348724365234375, -0.0006189346313476562, -0.000102996826171875, 0.00041294097900390625, 0.0009288787841796875, 0.0014448165893554688, 0.00196075439453125, 0.0024766921997070312, 0.0029926300048828125, 0.0035085678100585938, 0.004024505615234375, 0.004540443420410156, 0.0050563812255859375, 0.005572319030761719, 0.0060882568359375, 0.006604194641113281, 0.0071201324462890625, 0.007636070251464844, 0.008152008056640625, 0.008667945861816406, 0.009183883666992188, 0.009699821472167969, 0.01021575927734375, 0.010731697082519531, 0.011247634887695312, 0.011763572692871094, 0.012279510498046875, 0.012795448303222656, 0.013311386108398438, 0.013827323913574219, 0.01434326171875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 9.0, 5.0, 9.0, 7.0, 17.0, 16.0, 11.0, 25.0, 20.0, 26.0, 32.0, 41.0, 36.0, 35.0, 43.0, 39.0, 47.0, 49.0, 46.0, 41.0, 53.0, 44.0, 40.0, 32.0, 38.0, 23.0, 26.0, 20.0, 30.0, 24.0, 12.0, 13.0, 17.0, 7.0, 10.0, 9.0, 8.0, 11.0, 3.0, 8.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01549530029296875, -0.014978766441345215, -0.01446223258972168, -0.013945698738098145, -0.01342916488647461, -0.012912631034851074, -0.012396097183227539, -0.011879563331604004, -0.011363029479980469, -0.010846495628356934, -0.010329961776733398, -0.009813427925109863, -0.009296894073486328, -0.008780360221862793, -0.008263826370239258, -0.007747292518615723, -0.0072307586669921875, -0.006714224815368652, -0.006197690963745117, -0.005681157112121582, -0.005164623260498047, -0.004648089408874512, -0.0041315555572509766, -0.0036150217056274414, -0.0030984878540039062, -0.002581954002380371, -0.002065420150756836, -0.0015488862991333008, -0.0010323524475097656, -0.0005158185958862305, 7.152557373046875e-07, 0.0005172491073608398, 0.001033782958984375, 0.0015503168106079102, 0.0020668506622314453, 0.0025833845138549805, 0.0030999183654785156, 0.0036164522171020508, 0.004132986068725586, 0.004649519920349121, 0.005166053771972656, 0.005682587623596191, 0.0061991214752197266, 0.006715655326843262, 0.007232189178466797, 0.007748723030090332, 0.008265256881713867, 0.008781790733337402, 0.009298324584960938, 0.009814858436584473, 0.010331392288208008, 0.010847926139831543, 0.011364459991455078, 0.011880993843078613, 0.012397527694702148, 0.012914061546325684, 0.013430595397949219, 0.013947129249572754, 0.014463663101196289, 0.014980196952819824, 0.01549673080444336, 0.016013264656066895, 0.01652979850769043, 0.017046332359313965, 0.0175628662109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 9.0, 7.0, 8.0, 20.0, 15.0, 15.0, 30.0, 62.0, 97.0, 173.0, 269.0, 576.0, 1017.0, 1986.0, 4036.0, 9038.0, 23314.0, 69938.0, 230108.0, 413934.0, 198251.0, 59618.0, 20370.0, 8031.0, 3662.0, 1835.0, 942.0, 496.0, 286.0, 165.0, 99.0, 41.0, 35.0, 22.0, 14.0, 9.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0039215087890625, -0.00380060076713562, -0.0036796927452087402, -0.0035587847232818604, -0.0034378767013549805, -0.0033169686794281006, -0.0031960606575012207, -0.003075152635574341, -0.002954244613647461, -0.002833336591720581, -0.002712428569793701, -0.0025915205478668213, -0.0024706125259399414, -0.0023497045040130615, -0.0022287964820861816, -0.0021078884601593018, -0.001986980438232422, -0.001866072416305542, -0.0017451643943786621, -0.0016242563724517822, -0.0015033483505249023, -0.0013824403285980225, -0.0012615323066711426, -0.0011406242847442627, -0.0010197162628173828, -0.0008988082408905029, -0.000777900218963623, -0.0006569921970367432, -0.0005360841751098633, -0.0004151761531829834, -0.0002942681312561035, -0.00017336010932922363, -5.245208740234375e-05, 6.845593452453613e-05, 0.00018936395645141602, 0.0003102719783782959, 0.0004311800003051758, 0.0005520880222320557, 0.0006729960441589355, 0.0007939040660858154, 0.0009148120880126953, 0.0010357201099395752, 0.001156628131866455, 0.001277536153793335, 0.0013984441757202148, 0.0015193521976470947, 0.0016402602195739746, 0.0017611682415008545, 0.0018820762634277344, 0.0020029842853546143, 0.002123892307281494, 0.002244800329208374, 0.002365708351135254, 0.002486616373062134, 0.0026075243949890137, 0.0027284324169158936, 0.0028493404388427734, 0.0029702484607696533, 0.003091156482696533, 0.003212064504623413, 0.003332972526550293, 0.003453880548477173, 0.0035747885704040527, 0.0036956965923309326, 0.0038166046142578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 9.0, 2.0, 6.0, 4.0, 12.0, 17.0, 18.0, 18.0, 30.0, 31.0, 49.0, 40.0, 49.0, 50.0, 0.0, 63.0, 58.0, 56.0, 63.0, 61.0, 64.0, 56.0, 33.0, 32.0, 37.0, 28.0, 32.0, 16.0, 17.0, 18.0, 8.0, 4.0, 5.0, 6.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9669532775878906e-06, -1.909211277961731e-06, -1.8514692783355713e-06, -1.7937272787094116e-06, -1.735985279083252e-06, -1.6782432794570923e-06, -1.6205012798309326e-06, -1.562759280204773e-06, -1.5050172805786133e-06, -1.4472752809524536e-06, -1.389533281326294e-06, -1.3317912817001343e-06, -1.2740492820739746e-06, -1.216307282447815e-06, -1.1585652828216553e-06, -1.1008232831954956e-06, -1.043081283569336e-06, -9.853392839431763e-07, -9.275972843170166e-07, -8.698552846908569e-07, -8.121132850646973e-07, -7.543712854385376e-07, -6.966292858123779e-07, -6.388872861862183e-07, -5.811452865600586e-07, -5.234032869338989e-07, -4.6566128730773926e-07, -4.079192876815796e-07, -3.501772880554199e-07, -2.9243528842926025e-07, -2.3469328880310059e-07, -1.7695128917694092e-07, -1.1920928955078125e-07, -6.146728992462158e-08, -3.725290298461914e-09, 5.4016709327697754e-08, 1.1175870895385742e-07, 1.695007085800171e-07, 2.2724270820617676e-07, 2.849847078323364e-07, 3.427267074584961e-07, 4.0046870708465576e-07, 4.5821070671081543e-07, 5.159527063369751e-07, 5.736947059631348e-07, 6.314367055892944e-07, 6.891787052154541e-07, 7.469207048416138e-07, 8.046627044677734e-07, 8.624047040939331e-07, 9.201467037200928e-07, 9.778887033462524e-07, 1.0356307029724121e-06, 1.0933727025985718e-06, 1.1511147022247314e-06, 1.2088567018508911e-06, 1.2665987014770508e-06, 1.3243407011032104e-06, 1.3820827007293701e-06, 1.4398247003555298e-06, 1.4975666999816895e-06, 1.5553086996078491e-06, 1.6130506992340088e-06, 1.6707926988601685e-06, 1.7285346984863281e-06]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 12.0, 4.0, 6.0, 10.0, 20.0, 30.0, 53.0, 55.0, 98.0, 145.0, 221.0, 400.0, 608.0, 1167.0, 2180.0, 4687.0, 11466.0, 31538.0, 96972.0, 282758.0, 372862.0, 161148.0, 50844.0, 17520.0, 7029.0, 3132.0, 1540.0, 791.0, 436.0, 286.0, 181.0, 128.0, 67.0, 49.0, 25.0, 28.0, 14.0, 8.0, 8.0, 8.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0032806396484375, -0.0031683743000030518, -0.0030561089515686035, -0.0029438436031341553, -0.002831578254699707, -0.002719312906265259, -0.0026070475578308105, -0.0024947822093963623, -0.002382516860961914, -0.002270251512527466, -0.0021579861640930176, -0.0020457208156585693, -0.001933455467224121, -0.0018211901187896729, -0.0017089247703552246, -0.0015966594219207764, -0.0014843940734863281, -0.0013721287250518799, -0.0012598633766174316, -0.0011475980281829834, -0.0010353326797485352, -0.0009230673313140869, -0.0008108019828796387, -0.0006985366344451904, -0.0005862712860107422, -0.00047400593757629395, -0.0003617405891418457, -0.00024947524070739746, -0.00013720989227294922, -2.4944543838500977e-05, 8.732080459594727e-05, 0.0001995861530303955, 0.00031185150146484375, 0.000424116849899292, 0.0005363821983337402, 0.0006486475467681885, 0.0007609128952026367, 0.000873178243637085, 0.0009854435920715332, 0.0010977089405059814, 0.0012099742889404297, 0.001322239637374878, 0.0014345049858093262, 0.0015467703342437744, 0.0016590356826782227, 0.001771301031112671, 0.0018835663795471191, 0.0019958317279815674, 0.0021080970764160156, 0.002220362424850464, 0.002332627773284912, 0.0024448931217193604, 0.0025571584701538086, 0.002669423818588257, 0.002781689167022705, 0.0028939545154571533, 0.0030062198638916016, 0.00311848521232605, 0.003230750560760498, 0.0033430159091949463, 0.0034552812576293945, 0.0035675466060638428, 0.003679811954498291, 0.0037920773029327393, 0.0039043426513671875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 6.0, 11.0, 7.0, 13.0, 28.0, 17.0, 25.0, 32.0, 33.0, 48.0, 62.0, 68.0, 64.0, 69.0, 79.0, 89.0, 57.0, 45.0, 48.0, 44.0, 28.0, 27.0, 19.0, 15.0, 9.0, 8.0, 13.0, 10.0, 2.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00319671630859375, -0.0030927956104278564, -0.002988874912261963, -0.0028849542140960693, -0.0027810335159301758, -0.0026771128177642822, -0.0025731921195983887, -0.002469271421432495, -0.0023653507232666016, -0.002261430025100708, -0.0021575093269348145, -0.002053588628768921, -0.0019496679306030273, -0.0018457472324371338, -0.0017418265342712402, -0.0016379058361053467, -0.0015339851379394531, -0.0014300644397735596, -0.001326143741607666, -0.0012222230434417725, -0.001118302345275879, -0.0010143816471099854, -0.0009104609489440918, -0.0008065402507781982, -0.0007026195526123047, -0.0005986988544464111, -0.0004947781562805176, -0.000390857458114624, -0.00028693675994873047, -0.00018301606178283691, -7.909536361694336e-05, 2.4825334548950195e-05, 0.00012874603271484375, 0.0002326667308807373, 0.00033658742904663086, 0.0004405081272125244, 0.000544428825378418, 0.0006483495235443115, 0.0007522702217102051, 0.0008561909198760986, 0.0009601116180419922, 0.0010640323162078857, 0.0011679530143737793, 0.0012718737125396729, 0.0013757944107055664, 0.00147971510887146, 0.0015836358070373535, 0.001687556505203247, 0.0017914772033691406, 0.0018953979015350342, 0.0019993185997009277, 0.0021032392978668213, 0.002207159996032715, 0.0023110806941986084, 0.002415001392364502, 0.0025189220905303955, 0.002622842788696289, 0.0027267634868621826, 0.002830684185028076, 0.0029346048831939697, 0.0030385255813598633, 0.003142446279525757, 0.0032463669776916504, 0.003350287675857544, 0.0034542083740234375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 6.0, 5.0, 10.0, 31.0, 24.0, 47.0, 85.0, 111.0, 134.0, 147.0, 143.0, 91.0, 63.0, 32.0, 36.0, 11.0, 8.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05696502700448036, -0.05472085624933243, -0.052476685494184494, -0.05023251473903656, -0.047988343983888626, -0.04574417322874069, -0.04350000247359276, -0.041255831718444824, -0.03901166096329689, -0.036767490208148956, -0.03452331945300102, -0.03227914869785309, -0.030034977942705154, -0.02779080718755722, -0.025546636432409286, -0.023302465677261353, -0.02105829492211342, -0.018814124166965485, -0.01656995341181755, -0.014325782656669617, -0.012081611901521683, -0.009837441146373749, -0.007593270391225815, -0.005349099636077881, -0.003104928880929947, -0.0008607581257820129, 0.001383412629365921, 0.003627583384513855, 0.005871754139661789, 0.008115924894809723, 0.010360095649957657, 0.01260426640510559, 0.014848440885543823, 0.017092611640691757, 0.01933678239583969, 0.021580953150987625, 0.02382512390613556, 0.026069294661283493, 0.028313465416431427, 0.03055763617157936, 0.032801806926727295, 0.03504597768187523, 0.03729014843702316, 0.0395343191921711, 0.04177848994731903, 0.044022660702466965, 0.0462668314576149, 0.04851100221276283, 0.05075517296791077, 0.0529993437230587, 0.055243514478206635, 0.05748768523335457, 0.0597318559885025, 0.061976026743650436, 0.06422019749879837, 0.066464364528656, 0.06870853900909424, 0.07095271348953247, 0.0731968805193901, 0.07544104754924774, 0.07768522202968597, 0.0799293965101242, 0.08217356353998184, 0.08441773056983948, 0.08666190505027771]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 8.0, 10.0, 10.0, 12.0, 16.0, 19.0, 30.0, 36.0, 26.0, 47.0, 47.0, 52.0, 47.0, 59.0, 53.0, 58.0, 65.0, 45.0, 44.0, 46.0, 34.0, 29.0, 29.0, 31.0, 25.0, 21.0, 25.0, 13.0, 16.0, 7.0, 12.0, 4.0, 8.0, 5.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03862154483795166, -0.037302106618881226, -0.03598267212510109, -0.03466323763132095, -0.03334379941225052, -0.032024361193180084, -0.030704926699399948, -0.029385490342974663, -0.028066053986549377, -0.026746617630124092, -0.025427181273698807, -0.02410774491727352, -0.022788308560848236, -0.02146887220442295, -0.020149435847997665, -0.01882999949157238, -0.017510563135147095, -0.01619112677872181, -0.014871690422296524, -0.013552254065871239, -0.012232817709445953, -0.010913381353020668, -0.009593944996595383, -0.008274508640170097, -0.006955072283744812, -0.005635635927319527, -0.004316199570894241, -0.002996763214468956, -0.0016773268580436707, -0.0003578905016183853, 0.0009615458548069, 0.0022809822112321854, 0.0036004185676574707, 0.004919854924082756, 0.006239291280508041, 0.007558727636933327, 0.008878163993358612, 0.010197600349783897, 0.011517036706209183, 0.012836473062634468, 0.014155909419059753, 0.015475345775485039, 0.016794782131910324, 0.01811421848833561, 0.019433654844760895, 0.02075309120118618, 0.022072527557611465, 0.02339196391403675, 0.024711400270462036, 0.02603083662688732, 0.027350272983312607, 0.028669709339737892, 0.029989145696163177, 0.03130858391523361, 0.03262801840901375, 0.033947452902793884, 0.03526689112186432, 0.03658632934093475, 0.03790576383471489, 0.039225198328495026, 0.04054463654756546, 0.041864074766635895, 0.04318350926041603, 0.04450294375419617, 0.0458223819732666]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 13.0, 8.0, 16.0, 40.0, 66.0, 134.0, 285.0, 650.0, 1445.0, 4019.0, 13965.0, 57201.0, 568861.0, 2852867.0, 616712.0, 58417.0, 12847.0, 3945.0, 1492.0, 655.0, 303.0, 146.0, 77.0, 40.0, 29.0, 7.0, 17.0, 4.0, 10.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0134124755859375, -0.012942075729370117, -0.012471675872802734, -0.012001276016235352, -0.011530876159667969, -0.011060476303100586, -0.010590076446533203, -0.01011967658996582, -0.009649276733398438, -0.009178876876831055, -0.008708477020263672, -0.008238077163696289, -0.007767677307128906, -0.0072972774505615234, -0.006826877593994141, -0.006356477737426758, -0.005886077880859375, -0.005415678024291992, -0.004945278167724609, -0.0044748783111572266, -0.004004478454589844, -0.003534078598022461, -0.003063678741455078, -0.0025932788848876953, -0.0021228790283203125, -0.0016524791717529297, -0.0011820793151855469, -0.0007116794586181641, -0.00024127960205078125, 0.00022912025451660156, 0.0006995201110839844, 0.0011699199676513672, 0.00164031982421875, 0.002110719680786133, 0.0025811195373535156, 0.0030515193939208984, 0.0035219192504882812, 0.003992319107055664, 0.004462718963623047, 0.00493311882019043, 0.0054035186767578125, 0.005873918533325195, 0.006344318389892578, 0.006814718246459961, 0.007285118103027344, 0.0077555179595947266, 0.00822591781616211, 0.008696317672729492, 0.009166717529296875, 0.009637117385864258, 0.01010751724243164, 0.010577917098999023, 0.011048316955566406, 0.011518716812133789, 0.011989116668701172, 0.012459516525268555, 0.012929916381835938, 0.01340031623840332, 0.013870716094970703, 0.014341115951538086, 0.014811515808105469, 0.015281915664672852, 0.015752315521240234, 0.016222715377807617, 0.016693115234375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 7.0, 8.0, 14.0, 12.0, 31.0, 27.0, 43.0, 47.0, 64.0, 55.0, 76.0, 70.0, 77.0, 69.0, 76.0, 65.0, 70.0, 41.0, 34.0, 20.0, 29.0, 24.0, 17.0, 7.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006801605224609375, -0.006524264812469482, -0.00624692440032959, -0.005969583988189697, -0.005692243576049805, -0.005414903163909912, -0.0051375627517700195, -0.004860222339630127, -0.004582881927490234, -0.004305541515350342, -0.004028201103210449, -0.0037508606910705566, -0.003473520278930664, -0.0031961798667907715, -0.002918839454650879, -0.0026414990425109863, -0.0023641586303710938, -0.002086818218231201, -0.0018094778060913086, -0.001532137393951416, -0.0012547969818115234, -0.0009774565696716309, -0.0007001161575317383, -0.0004227757453918457, -0.00014543533325195312, 0.00013190507888793945, 0.00040924549102783203, 0.0006865859031677246, 0.0009639263153076172, 0.0012412667274475098, 0.0015186071395874023, 0.001795947551727295, 0.0020732879638671875, 0.00235062837600708, 0.0026279687881469727, 0.0029053092002868652, 0.003182649612426758, 0.0034599900245666504, 0.003737330436706543, 0.0040146708488464355, 0.004292011260986328, 0.004569351673126221, 0.004846692085266113, 0.005124032497406006, 0.0054013729095458984, 0.005678713321685791, 0.005956053733825684, 0.006233394145965576, 0.006510734558105469, 0.006788074970245361, 0.007065415382385254, 0.0073427557945251465, 0.007620096206665039, 0.007897436618804932, 0.008174777030944824, 0.008452117443084717, 0.00872945785522461, 0.009006798267364502, 0.009284138679504395, 0.009561479091644287, 0.00983881950378418, 0.010116159915924072, 0.010393500328063965, 0.010670840740203857, 0.01094818115234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 7.0, 12.0, 26.0, 36.0, 70.0, 109.0, 198.0, 337.0, 629.0, 1297.0, 2821.0, 6922.0, 22046.0, 95851.0, 929592.0, 2851825.0, 222325.0, 40954.0, 11238.0, 4260.0, 1765.0, 928.0, 453.0, 242.0, 148.0, 87.0, 42.0, 27.0, 12.0, 13.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0174713134765625, -0.017014265060424805, -0.01655721664428711, -0.016100168228149414, -0.01564311981201172, -0.015186071395874023, -0.014729022979736328, -0.014271974563598633, -0.013814926147460938, -0.013357877731323242, -0.012900829315185547, -0.012443780899047852, -0.011986732482910156, -0.011529684066772461, -0.011072635650634766, -0.01061558723449707, -0.010158538818359375, -0.00970149040222168, -0.009244441986083984, -0.008787393569946289, -0.008330345153808594, -0.007873296737670898, -0.007416248321533203, -0.006959199905395508, -0.0065021514892578125, -0.006045103073120117, -0.005588054656982422, -0.0051310062408447266, -0.004673957824707031, -0.004216909408569336, -0.0037598609924316406, -0.0033028125762939453, -0.00284576416015625, -0.0023887157440185547, -0.0019316673278808594, -0.001474618911743164, -0.0010175704956054688, -0.0005605220794677734, -0.00010347366333007812, 0.0003535747528076172, 0.0008106231689453125, 0.0012676715850830078, 0.0017247200012207031, 0.0021817684173583984, 0.0026388168334960938, 0.003095865249633789, 0.0035529136657714844, 0.00400996208190918, 0.004467010498046875, 0.00492405891418457, 0.005381107330322266, 0.005838155746459961, 0.006295204162597656, 0.0067522525787353516, 0.007209300994873047, 0.007666349411010742, 0.008123397827148438, 0.008580446243286133, 0.009037494659423828, 0.009494543075561523, 0.009951591491699219, 0.010408639907836914, 0.01086568832397461, 0.011322736740112305, 0.01177978515625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 14.0, 10.0, 15.0, 20.0, 18.0, 30.0, 47.0, 55.0, 77.0, 109.0, 152.0, 250.0, 403.0, 611.0, 698.0, 495.0, 341.0, 205.0, 132.0, 95.0, 81.0, 55.0, 46.0, 30.0, 18.0, 10.0, 8.0, 8.0, 11.0, 5.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.014068603515625, -0.013680219650268555, -0.01329183578491211, -0.012903451919555664, -0.012515068054199219, -0.012126684188842773, -0.011738300323486328, -0.011349916458129883, -0.010961532592773438, -0.010573148727416992, -0.010184764862060547, -0.009796380996704102, -0.009407997131347656, -0.009019613265991211, -0.008631229400634766, -0.00824284553527832, -0.007854461669921875, -0.00746607780456543, -0.007077693939208984, -0.006689310073852539, -0.006300926208496094, -0.0059125423431396484, -0.005524158477783203, -0.005135774612426758, -0.0047473907470703125, -0.004359006881713867, -0.003970623016357422, -0.0035822391510009766, -0.0031938552856445312, -0.002805471420288086, -0.0024170875549316406, -0.0020287036895751953, -0.00164031982421875, -0.0012519359588623047, -0.0008635520935058594, -0.00047516822814941406, -8.678436279296875e-05, 0.00030159950256347656, 0.0006899833679199219, 0.0010783672332763672, 0.0014667510986328125, 0.0018551349639892578, 0.002243518829345703, 0.0026319026947021484, 0.0030202865600585938, 0.003408670425415039, 0.0037970542907714844, 0.00418543815612793, 0.004573822021484375, 0.00496220588684082, 0.005350589752197266, 0.005738973617553711, 0.006127357482910156, 0.0065157413482666016, 0.006904125213623047, 0.007292509078979492, 0.0076808929443359375, 0.008069276809692383, 0.008457660675048828, 0.008846044540405273, 0.009234428405761719, 0.009622812271118164, 0.01001119613647461, 0.010399580001831055, 0.0107879638671875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 12.0, 24.0, 51.0, 138.0, 222.0, 245.0, 178.0, 64.0, 39.0, 17.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1357591301202774, -0.13093794882297516, -0.12611675262451172, -0.12129556387662888, -0.11647437512874603, -0.11165319383144379, -0.10683200508356094, -0.1020108163356781, -0.09718962758779526, -0.09236843883991241, -0.08754725009202957, -0.08272606134414673, -0.07790488004684448, -0.07308368384838104, -0.0682625025510788, -0.06344131380319595, -0.05862012505531311, -0.05379893630743027, -0.048977747559547424, -0.04415656253695488, -0.03933537378907204, -0.034514185041189194, -0.0296929981559515, -0.024871811270713806, -0.020050622522830963, -0.015229434706270695, -0.010408246889710426, -0.005587059073150158, -0.0007658712565898895, 0.0040553174912929535, 0.008876504376530647, 0.013697691261768341, 0.01851886510848999, 0.023340053856372833, 0.028161240741610527, 0.03298242762684822, 0.037803616374731064, 0.04262480512261391, 0.04744599014520645, 0.052267178893089294, 0.05708836764097214, 0.06190955638885498, 0.06673074513673782, 0.07155193388462067, 0.07637311518192291, 0.08119431138038635, 0.0860154926776886, 0.09083668142557144, 0.09565787017345428, 0.10047905892133713, 0.10530024766921997, 0.11012143641710281, 0.11494262516498566, 0.1197638064622879, 0.12458499521017075, 0.1294061839580536, 0.13422736525535583, 0.13904854655265808, 0.14386974275112152, 0.14869092404842377, 0.1535121202468872, 0.15833330154418945, 0.1631544977426529, 0.16797567903995514, 0.17279687523841858]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 5.0, 9.0, 6.0, 10.0, 9.0, 12.0, 21.0, 15.0, 11.0, 22.0, 21.0, 29.0, 27.0, 42.0, 34.0, 41.0, 41.0, 33.0, 53.0, 44.0, 53.0, 48.0, 36.0, 41.0, 33.0, 37.0, 36.0, 37.0, 29.0, 20.0, 26.0, 16.0, 19.0, 12.0, 16.0, 8.0, 12.0, 11.0, 9.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.044017016887664795, -0.04279964789748192, -0.04158227890729904, -0.040364913642406464, -0.03914754465222359, -0.03793017566204071, -0.03671281039714813, -0.035495441406965256, -0.03427807241678238, -0.0330607034265995, -0.031843334436416626, -0.030625969171524048, -0.02940860018134117, -0.028191231191158295, -0.026973864063620567, -0.02575649693608284, -0.024539127945899963, -0.023321758955717087, -0.02210439182817936, -0.020887024700641632, -0.019669655710458755, -0.01845228672027588, -0.01723491959273815, -0.016017552465200424, -0.014800183475017548, -0.013582815416157246, -0.012365447357296944, -0.011148079298436642, -0.00993071123957634, -0.008713343180716038, -0.007495975121855736, -0.006278607062995434, -0.005061239004135132, -0.00384387094527483, -0.002626502886414528, -0.001409134827554226, -0.00019176676869392395, 0.001025601290166378, 0.00224296934902668, 0.003460337407886982, 0.004677705466747284, 0.005895073525607586, 0.007112441584467888, 0.00832980964332819, 0.009547177702188492, 0.010764545761048794, 0.011981913819909096, 0.013199281878769398, 0.0144166499376297, 0.015634018927812576, 0.016851386055350304, 0.01806875318288803, 0.019286122173070908, 0.020503491163253784, 0.02172085829079151, 0.02293822541832924, 0.024155594408512115, 0.025372963398694992, 0.02659033052623272, 0.027807697653770447, 0.029025066643953323, 0.0302424356341362, 0.03145980089902878, 0.032677169889211655, 0.03389453887939453]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 7.0, 18.0, 21.0, 34.0, 50.0, 70.0, 106.0, 167.0, 261.0, 461.0, 896.0, 1774.0, 3731.0, 8332.0, 19317.0, 46848.0, 115137.0, 256073.0, 310517.0, 166201.0, 68286.0, 28044.0, 11880.0, 5271.0, 2365.0, 1150.0, 628.0, 371.0, 175.0, 109.0, 82.0, 46.0, 30.0, 20.0, 20.0, 13.0, 11.0, 8.0, 4.0, 5.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0100250244140625, -0.0096818208694458, -0.009338617324829102, -0.008995413780212402, -0.008652210235595703, -0.008309006690979004, -0.007965803146362305, -0.0076225996017456055, -0.007279396057128906, -0.006936192512512207, -0.006592988967895508, -0.006249785423278809, -0.005906581878662109, -0.00556337833404541, -0.005220174789428711, -0.004876971244812012, -0.0045337677001953125, -0.004190564155578613, -0.003847360610961914, -0.003504157066345215, -0.0031609535217285156, -0.0028177499771118164, -0.002474546432495117, -0.002131342887878418, -0.0017881393432617188, -0.0014449357986450195, -0.0011017322540283203, -0.0007585287094116211, -0.0004153251647949219, -7.212162017822266e-05, 0.00027108192443847656, 0.0006142854690551758, 0.000957489013671875, 0.0013006925582885742, 0.0016438961029052734, 0.0019870996475219727, 0.002330303192138672, 0.002673506736755371, 0.0030167102813720703, 0.0033599138259887695, 0.0037031173706054688, 0.004046320915222168, 0.004389524459838867, 0.004732728004455566, 0.005075931549072266, 0.005419135093688965, 0.005762338638305664, 0.006105542182922363, 0.0064487457275390625, 0.006791949272155762, 0.007135152816772461, 0.00747835636138916, 0.00782155990600586, 0.008164763450622559, 0.008507966995239258, 0.008851170539855957, 0.009194374084472656, 0.009537577629089355, 0.009880781173706055, 0.010223984718322754, 0.010567188262939453, 0.010910391807556152, 0.011253595352172852, 0.01159679889678955, 0.01194000244140625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 8.0, 12.0, 12.0, 11.0, 18.0, 21.0, 25.0, 26.0, 41.0, 48.0, 37.0, 53.0, 63.0, 76.0, 72.0, 58.0, 62.0, 61.0, 55.0, 56.0, 49.0, 38.0, 27.0, 34.0, 14.0, 9.0, 4.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007503509521484375, -0.0072217583656311035, -0.006940007209777832, -0.0066582560539245605, -0.006376504898071289, -0.006094753742218018, -0.005813002586364746, -0.005531251430511475, -0.005249500274658203, -0.004967749118804932, -0.00468599796295166, -0.004404246807098389, -0.004122495651245117, -0.0038407444953918457, -0.0035589933395385742, -0.0032772421836853027, -0.0029954910278320312, -0.0027137398719787598, -0.0024319887161254883, -0.002150237560272217, -0.0018684864044189453, -0.0015867352485656738, -0.0013049840927124023, -0.0010232329368591309, -0.0007414817810058594, -0.0004597306251525879, -0.0001779794692993164, 0.00010377168655395508, 0.00038552284240722656, 0.000667273998260498, 0.0009490251541137695, 0.001230776309967041, 0.0015125274658203125, 0.001794278621673584, 0.0020760297775268555, 0.002357780933380127, 0.0026395320892333984, 0.00292128324508667, 0.0032030344009399414, 0.003484785556793213, 0.0037665367126464844, 0.004048287868499756, 0.004330039024353027, 0.004611790180206299, 0.00489354133605957, 0.005175292491912842, 0.005457043647766113, 0.005738794803619385, 0.006020545959472656, 0.006302297115325928, 0.006584048271179199, 0.006865799427032471, 0.007147550582885742, 0.007429301738739014, 0.007711052894592285, 0.007992804050445557, 0.008274555206298828, 0.0085563063621521, 0.008838057518005371, 0.009119808673858643, 0.009401559829711914, 0.009683310985565186, 0.009965062141418457, 0.010246813297271729, 0.010528564453125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 17.0, 31.0, 44.0, 94.0, 191.0, 406.0, 890.0, 2331.0, 7327.0, 25924.0, 99673.0, 362724.0, 399743.0, 108855.0, 28187.0, 7855.0, 2546.0, 936.0, 390.0, 166.0, 105.0, 43.0, 28.0, 14.0, 14.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015411376953125, -0.014930248260498047, -0.014449119567871094, -0.01396799087524414, -0.013486862182617188, -0.013005733489990234, -0.012524604797363281, -0.012043476104736328, -0.011562347412109375, -0.011081218719482422, -0.010600090026855469, -0.010118961334228516, -0.009637832641601562, -0.00915670394897461, -0.008675575256347656, -0.008194446563720703, -0.00771331787109375, -0.007232189178466797, -0.006751060485839844, -0.006269931793212891, -0.0057888031005859375, -0.005307674407958984, -0.004826545715332031, -0.004345417022705078, -0.003864288330078125, -0.003383159637451172, -0.0029020309448242188, -0.0024209022521972656, -0.0019397735595703125, -0.0014586448669433594, -0.0009775161743164062, -0.0004963874816894531, -1.52587890625e-05, 0.0004658699035644531, 0.0009469985961914062, 0.0014281272888183594, 0.0019092559814453125, 0.0023903846740722656, 0.0028715133666992188, 0.003352642059326172, 0.003833770751953125, 0.004314899444580078, 0.004796028137207031, 0.005277156829833984, 0.0057582855224609375, 0.006239414215087891, 0.006720542907714844, 0.007201671600341797, 0.00768280029296875, 0.008163928985595703, 0.008645057678222656, 0.00912618637084961, 0.009607315063476562, 0.010088443756103516, 0.010569572448730469, 0.011050701141357422, 0.011531829833984375, 0.012012958526611328, 0.012494087219238281, 0.012975215911865234, 0.013456344604492188, 0.01393747329711914, 0.014418601989746094, 0.014899730682373047, 0.015380859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 1.0, 6.0, 8.0, 15.0, 12.0, 23.0, 23.0, 23.0, 29.0, 38.0, 32.0, 42.0, 49.0, 35.0, 51.0, 44.0, 48.0, 43.0, 45.0, 64.0, 39.0, 37.0, 45.0, 38.0, 38.0, 20.0, 26.0, 27.0, 20.0, 16.0, 13.0, 7.0, 6.0, 7.0, 9.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0186920166015625, -0.018146038055419922, -0.017600059509277344, -0.017054080963134766, -0.016508102416992188, -0.01596212387084961, -0.015416145324707031, -0.014870166778564453, -0.014324188232421875, -0.013778209686279297, -0.013232231140136719, -0.01268625259399414, -0.012140274047851562, -0.011594295501708984, -0.011048316955566406, -0.010502338409423828, -0.00995635986328125, -0.009410381317138672, -0.008864402770996094, -0.008318424224853516, -0.0077724456787109375, -0.007226467132568359, -0.006680488586425781, -0.006134510040283203, -0.005588531494140625, -0.005042552947998047, -0.004496574401855469, -0.003950595855712891, -0.0034046173095703125, -0.0028586387634277344, -0.0023126602172851562, -0.0017666816711425781, -0.001220703125, -0.0006747245788574219, -0.00012874603271484375, 0.0004172325134277344, 0.0009632110595703125, 0.0015091896057128906, 0.0020551681518554688, 0.002601146697998047, 0.003147125244140625, 0.003693103790283203, 0.004239082336425781, 0.004785060882568359, 0.0053310394287109375, 0.005877017974853516, 0.006422996520996094, 0.006968975067138672, 0.00751495361328125, 0.008060932159423828, 0.008606910705566406, 0.009152889251708984, 0.009698867797851562, 0.01024484634399414, 0.010790824890136719, 0.011336803436279297, 0.011882781982421875, 0.012428760528564453, 0.012974739074707031, 0.01352071762084961, 0.014066696166992188, 0.014612674713134766, 0.015158653259277344, 0.015704631805419922, 0.0162506103515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 8.0, 17.0, 30.0, 52.0, 105.0, 192.0, 442.0, 870.0, 2350.0, 6314.0, 21327.0, 83667.0, 342205.0, 443031.0, 108747.0, 26562.0, 7771.0, 2721.0, 1071.0, 542.0, 253.0, 123.0, 68.0, 29.0, 18.0, 16.0, 6.0, 1.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0037708282470703125, -0.0036568641662597656, -0.0035429000854492188, -0.003428936004638672, -0.003314971923828125, -0.003201007843017578, -0.0030870437622070312, -0.0029730796813964844, -0.0028591156005859375, -0.0027451515197753906, -0.0026311874389648438, -0.002517223358154297, -0.00240325927734375, -0.002289295196533203, -0.0021753311157226562, -0.0020613670349121094, -0.0019474029541015625, -0.0018334388732910156, -0.0017194747924804688, -0.0016055107116699219, -0.001491546630859375, -0.0013775825500488281, -0.0012636184692382812, -0.0011496543884277344, -0.0010356903076171875, -0.0009217262268066406, -0.0008077621459960938, -0.0006937980651855469, -0.000579833984375, -0.0004658699035644531, -0.00035190582275390625, -0.00023794174194335938, -0.0001239776611328125, -1.0013580322265625e-05, 0.00010395050048828125, 0.00021791458129882812, 0.000331878662109375, 0.0004458427429199219, 0.0005598068237304688, 0.0006737709045410156, 0.0007877349853515625, 0.0009016990661621094, 0.0010156631469726562, 0.0011296272277832031, 0.00124359130859375, 0.0013575553894042969, 0.0014715194702148438, 0.0015854835510253906, 0.0016994476318359375, 0.0018134117126464844, 0.0019273757934570312, 0.002041339874267578, 0.002155303955078125, 0.002269268035888672, 0.0023832321166992188, 0.0024971961975097656, 0.0026111602783203125, 0.0027251243591308594, 0.0028390884399414062, 0.002953052520751953, 0.0030670166015625, 0.003180980682373047, 0.0032949447631835938, 0.0034089088439941406, 0.0035228729248046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 0.0, 6.0, 14.0, 23.0, 18.0, 0.0, 28.0, 23.0, 24.0, 0.0, 36.0, 45.0, 79.0, 60.0, 0.0, 59.0, 62.0, 66.0, 0.0, 67.0, 70.0, 44.0, 44.0, 0.0, 41.0, 36.0, 28.0, 28.0, 0.0, 29.0, 12.0, 18.0, 0.0, 15.0, 5.0, 5.0, 6.0, 0.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.430511474609375e-06, -1.383945345878601e-06, -1.3373792171478271e-06, -1.2908130884170532e-06, -1.2442469596862793e-06, -1.1976808309555054e-06, -1.1511147022247314e-06, -1.1045485734939575e-06, -1.0579824447631836e-06, -1.0114163160324097e-06, -9.648501873016357e-07, -9.182840585708618e-07, -8.717179298400879e-07, -8.25151801109314e-07, -7.7858567237854e-07, -7.320195436477661e-07, -6.854534149169922e-07, -6.388872861862183e-07, -5.923211574554443e-07, -5.457550287246704e-07, -4.991888999938965e-07, -4.5262277126312256e-07, -4.0605664253234863e-07, -3.594905138015747e-07, -3.129243850708008e-07, -2.6635825634002686e-07, -2.1979212760925293e-07, -1.73225998878479e-07, -1.2665987014770508e-07, -8.009374141693115e-08, -3.3527612686157227e-08, 1.30385160446167e-08, 5.960464477539063e-08, 1.0617077350616455e-07, 1.5273690223693848e-07, 1.993030309677124e-07, 2.4586915969848633e-07, 2.9243528842926025e-07, 3.390014171600342e-07, 3.855675458908081e-07, 4.3213367462158203e-07, 4.78699803352356e-07, 5.252659320831299e-07, 5.718320608139038e-07, 6.183981895446777e-07, 6.649643182754517e-07, 7.115304470062256e-07, 7.580965757369995e-07, 8.046627044677734e-07, 8.512288331985474e-07, 8.977949619293213e-07, 9.443610906600952e-07, 9.909272193908691e-07, 1.037493348121643e-06, 1.084059476852417e-06, 1.130625605583191e-06, 1.1771917343139648e-06, 1.2237578630447388e-06, 1.2703239917755127e-06, 1.3168901205062866e-06, 1.3634562492370605e-06, 1.4100223779678345e-06, 1.4565885066986084e-06, 1.5031546354293823e-06, 1.5497207641601562e-06]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 15.0, 26.0, 34.0, 94.0, 213.0, 462.0, 1221.0, 3754.0, 13544.0, 63470.0, 310347.0, 502958.0, 118942.0, 24084.0, 6118.0, 1946.0, 747.0, 305.0, 126.0, 63.0, 39.0, 15.0, 11.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.004428863525390625, -0.004306495189666748, -0.004184126853942871, -0.004061758518218994, -0.003939390182495117, -0.0038170218467712402, -0.0036946535110473633, -0.0035722851753234863, -0.0034499168395996094, -0.0033275485038757324, -0.0032051801681518555, -0.0030828118324279785, -0.0029604434967041016, -0.0028380751609802246, -0.0027157068252563477, -0.0025933384895324707, -0.0024709701538085938, -0.002348601818084717, -0.00222623348236084, -0.002103865146636963, -0.001981496810913086, -0.001859128475189209, -0.001736760139465332, -0.001614391803741455, -0.0014920234680175781, -0.0013696551322937012, -0.0012472867965698242, -0.0011249184608459473, -0.0010025501251220703, -0.0008801817893981934, -0.0007578134536743164, -0.0006354451179504395, -0.0005130767822265625, -0.00039070844650268555, -0.0002683401107788086, -0.00014597177505493164, -2.3603439331054688e-05, 9.876489639282227e-05, 0.00022113323211669922, 0.00034350156784057617, 0.0004658699035644531, 0.0005882382392883301, 0.000710606575012207, 0.000832974910736084, 0.0009553432464599609, 0.0010777115821838379, 0.0012000799179077148, 0.0013224482536315918, 0.0014448165893554688, 0.0015671849250793457, 0.0016895532608032227, 0.0018119215965270996, 0.0019342899322509766, 0.0020566582679748535, 0.0021790266036987305, 0.0023013949394226074, 0.0024237632751464844, 0.0025461316108703613, 0.0026684999465942383, 0.0027908682823181152, 0.002913236618041992, 0.003035604953765869, 0.003157973289489746, 0.003280341625213623, 0.0034027099609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 1.0, 2.0, 5.0, 7.0, 6.0, 13.0, 22.0, 18.0, 30.0, 39.0, 46.0, 55.0, 73.0, 91.0, 114.0, 106.0, 72.0, 58.0, 67.0, 38.0, 33.0, 31.0, 18.0, 11.0, 14.0, 8.0, 11.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.004852294921875, -0.004716813564300537, -0.004581332206726074, -0.004445850849151611, -0.0043103694915771484, -0.0041748881340026855, -0.004039406776428223, -0.0039039254188537598, -0.003768444061279297, -0.003632962703704834, -0.003497481346130371, -0.003361999988555908, -0.0032265186309814453, -0.0030910372734069824, -0.0029555559158325195, -0.0028200745582580566, -0.0026845932006835938, -0.002549111843109131, -0.002413630485534668, -0.002278149127960205, -0.002142667770385742, -0.0020071864128112793, -0.0018717050552368164, -0.0017362236976623535, -0.0016007423400878906, -0.0014652609825134277, -0.0013297796249389648, -0.001194298267364502, -0.001058816909790039, -0.0009233355522155762, -0.0007878541946411133, -0.0006523728370666504, -0.0005168914794921875, -0.0003814101219177246, -0.0002459287643432617, -0.00011044740676879883, 2.5033950805664062e-05, 0.00016051530838012695, 0.00029599666595458984, 0.00043147802352905273, 0.0005669593811035156, 0.0007024407386779785, 0.0008379220962524414, 0.0009734034538269043, 0.0011088848114013672, 0.00124436616897583, 0.001379847526550293, 0.0015153288841247559, 0.0016508102416992188, 0.0017862915992736816, 0.0019217729568481445, 0.0020572543144226074, 0.0021927356719970703, 0.002328217029571533, 0.002463698387145996, 0.002599179744720459, 0.002734661102294922, 0.0028701424598693848, 0.0030056238174438477, 0.0031411051750183105, 0.0032765865325927734, 0.0034120678901672363, 0.0035475492477416992, 0.003683030605316162, 0.003818511962890625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 14.0, 20.0, 44.0, 83.0, 123.0, 174.0, 186.0, 142.0, 97.0, 47.0, 28.0, 15.0, 9.0, 6.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04296469688415527, -0.040269721299409866, -0.03757474571466446, -0.034879766404628754, -0.03218479081988335, -0.02948981523513794, -0.026794839650392532, -0.024099862203001976, -0.02140488661825657, -0.018709911033511162, -0.016014933586120605, -0.013319958001375198, -0.010624981485307217, -0.007930004969239235, -0.005235029384493828, -0.0025400519371032715, 0.00015492364764213562, 0.0028498999308794737, 0.005544876214116812, 0.008239852264523506, 0.010934828780591488, 0.01362980529665947, 0.016324780881404877, 0.019019758328795433, 0.02171473391354084, 0.024409709498286247, 0.027104686945676804, 0.02979966253042221, 0.03249463811516762, 0.035189613699913025, 0.03788459300994873, 0.04057956859469414, 0.043274544179439545, 0.04596951976418495, 0.04866449534893036, 0.051359474658966064, 0.05405445024371147, 0.05674942582845688, 0.059444401413202286, 0.06213937699794769, 0.0648343563079834, 0.0675293356180191, 0.07022430747747421, 0.07291928678750992, 0.07561425864696503, 0.07830923795700073, 0.08100421726703644, 0.08369918912649155, 0.08639416098594666, 0.08908914029598236, 0.09178411215543747, 0.09447909146547318, 0.09717406332492828, 0.09986904263496399, 0.1025640219449997, 0.1052589938044548, 0.10795397311449051, 0.11064895242452621, 0.11334392428398132, 0.11603890359401703, 0.11873387545347214, 0.12142885476350784, 0.12412382662296295, 0.12681880593299866, 0.12951378524303436]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 3.0, 4.0, 5.0, 7.0, 8.0, 13.0, 7.0, 16.0, 16.0, 16.0, 15.0, 17.0, 23.0, 21.0, 25.0, 21.0, 25.0, 40.0, 35.0, 38.0, 47.0, 35.0, 45.0, 43.0, 49.0, 39.0, 40.0, 32.0, 35.0, 36.0, 26.0, 25.0, 29.0, 20.0, 22.0, 17.0, 11.0, 15.0, 13.0, 10.0, 14.0, 5.0, 10.0, 10.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.03336894512176514, -0.03234583139419556, -0.03132271766662598, -0.030299600213766098, -0.029276486486196518, -0.028253372758626938, -0.02723025716841221, -0.02620714157819748, -0.0251840278506279, -0.02416091412305832, -0.02313779853284359, -0.02211468294262886, -0.02109156921505928, -0.0200684554874897, -0.01904533989727497, -0.01802222430706024, -0.01699911057949066, -0.01597599685192108, -0.014952881261706352, -0.013929766602814198, -0.012906651943922043, -0.011883537285029888, -0.010860422626137733, -0.009837307967245579, -0.008814193308353424, -0.007791078649461269, -0.006767963990569115, -0.00574484933167696, -0.004721734672784805, -0.0036986200138926506, -0.002675505355000496, -0.0016523906961083412, -0.0006292760372161865, 0.00039383862167596817, 0.0014169532805681229, 0.0024400679394602776, 0.0034631825983524323, 0.004486297257244587, 0.005509411916136742, 0.006532526575028896, 0.007555641233921051, 0.008578755892813206, 0.00960187055170536, 0.010624985210597515, 0.01164809986948967, 0.012671214528381824, 0.01369432918727398, 0.014717443846166134, 0.01574055850505829, 0.01676367223262787, 0.017786787822842598, 0.018809903413057327, 0.019833017140626907, 0.020856130868196487, 0.021879246458411217, 0.022902362048625946, 0.023925475776195526, 0.024948589503765106, 0.025971705093979836, 0.026994820684194565, 0.028017934411764145, 0.029041048139333725, 0.030064163729548454, 0.031087279319763184, 0.032110393047332764]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 9.0, 16.0, 35.0, 41.0, 45.0, 79.0, 124.0, 203.0, 329.0, 682.0, 2299.0, 14189.0, 184671.0, 3006496.0, 936635.0, 40893.0, 5124.0, 1233.0, 484.0, 258.0, 141.0, 94.0, 59.0, 41.0, 23.0, 25.0, 9.0, 8.0, 6.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0235748291015625, -0.022754430770874023, -0.021934032440185547, -0.02111363410949707, -0.020293235778808594, -0.019472837448120117, -0.01865243911743164, -0.017832040786743164, -0.017011642456054688, -0.01619124412536621, -0.015370845794677734, -0.014550447463989258, -0.013730049133300781, -0.012909650802612305, -0.012089252471923828, -0.011268854141235352, -0.010448455810546875, -0.009628057479858398, -0.008807659149169922, -0.007987260818481445, -0.007166862487792969, -0.006346464157104492, -0.005526065826416016, -0.004705667495727539, -0.0038852691650390625, -0.003064870834350586, -0.0022444725036621094, -0.0014240741729736328, -0.0006036758422851562, 0.0002167224884033203, 0.0010371208190917969, 0.0018575191497802734, 0.00267791748046875, 0.0034983158111572266, 0.004318714141845703, 0.00513911247253418, 0.005959510803222656, 0.006779909133911133, 0.007600307464599609, 0.008420705795288086, 0.009241104125976562, 0.010061502456665039, 0.010881900787353516, 0.011702299118041992, 0.012522697448730469, 0.013343095779418945, 0.014163494110107422, 0.014983892440795898, 0.015804290771484375, 0.01662468910217285, 0.017445087432861328, 0.018265485763549805, 0.01908588409423828, 0.019906282424926758, 0.020726680755615234, 0.02154707908630371, 0.022367477416992188, 0.023187875747680664, 0.02400827407836914, 0.024828672409057617, 0.025649070739746094, 0.02646946907043457, 0.027289867401123047, 0.028110265731811523, 0.0289306640625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 14.0, 15.0, 19.0, 20.0, 36.0, 33.0, 54.0, 41.0, 58.0, 77.0, 65.0, 78.0, 82.0, 58.0, 59.0, 63.0, 38.0, 38.0, 48.0, 28.0, 24.0, 14.0, 12.0, 3.0, 2.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006931304931640625, -0.006663501262664795, -0.006395697593688965, -0.006127893924713135, -0.005860090255737305, -0.005592286586761475, -0.0053244829177856445, -0.0050566792488098145, -0.004788875579833984, -0.004521071910858154, -0.004253268241882324, -0.003985464572906494, -0.003717660903930664, -0.003449857234954834, -0.003182053565979004, -0.002914249897003174, -0.0026464462280273438, -0.0023786425590515137, -0.0021108388900756836, -0.0018430352210998535, -0.0015752315521240234, -0.0013074278831481934, -0.0010396242141723633, -0.0007718205451965332, -0.0005040168762207031, -0.00023621320724487305, 3.159046173095703e-05, 0.0002993941307067871, 0.0005671977996826172, 0.0008350014686584473, 0.0011028051376342773, 0.0013706088066101074, 0.0016384124755859375, 0.0019062161445617676, 0.0021740198135375977, 0.0024418234825134277, 0.002709627151489258, 0.002977430820465088, 0.003245234489440918, 0.003513038158416748, 0.003780841827392578, 0.004048645496368408, 0.004316449165344238, 0.004584252834320068, 0.0048520565032958984, 0.0051198601722717285, 0.005387663841247559, 0.005655467510223389, 0.005923271179199219, 0.006191074848175049, 0.006458878517150879, 0.006726682186126709, 0.006994485855102539, 0.007262289524078369, 0.007530093193054199, 0.007797896862030029, 0.00806570053100586, 0.00833350419998169, 0.00860130786895752, 0.00886911153793335, 0.00913691520690918, 0.00940471887588501, 0.00967252254486084, 0.00994032621383667, 0.0102081298828125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 10.0, 19.0, 35.0, 48.0, 95.0, 182.0, 367.0, 706.0, 2031.0, 7289.0, 51164.0, 1592447.0, 2458445.0, 68506.0, 8877.0, 2319.0, 856.0, 411.0, 222.0, 88.0, 62.0, 28.0, 30.0, 15.0, 7.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0261993408203125, -0.025382041931152344, -0.024564743041992188, -0.02374744415283203, -0.022930145263671875, -0.02211284637451172, -0.021295547485351562, -0.020478248596191406, -0.01966094970703125, -0.018843650817871094, -0.018026351928710938, -0.01720905303955078, -0.016391754150390625, -0.015574455261230469, -0.014757156372070312, -0.013939857482910156, -0.01312255859375, -0.012305259704589844, -0.011487960815429688, -0.010670661926269531, -0.009853363037109375, -0.009036064147949219, -0.008218765258789062, -0.007401466369628906, -0.00658416748046875, -0.005766868591308594, -0.0049495697021484375, -0.004132270812988281, -0.003314971923828125, -0.0024976730346679688, -0.0016803741455078125, -0.0008630752563476562, -4.57763671875e-05, 0.0007715225219726562, 0.0015888214111328125, 0.0024061203002929688, 0.003223419189453125, 0.004040718078613281, 0.0048580169677734375, 0.005675315856933594, 0.00649261474609375, 0.007309913635253906, 0.008127212524414062, 0.008944511413574219, 0.009761810302734375, 0.010579109191894531, 0.011396408081054688, 0.012213706970214844, 0.013031005859375, 0.013848304748535156, 0.014665603637695312, 0.015482902526855469, 0.016300201416015625, 0.01711750030517578, 0.017934799194335938, 0.018752098083496094, 0.01956939697265625, 0.020386695861816406, 0.021203994750976562, 0.02202129364013672, 0.022838592529296875, 0.02365589141845703, 0.024473190307617188, 0.025290489196777344, 0.0261077880859375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 3.0, 5.0, 6.0, 7.0, 14.0, 19.0, 26.0, 28.0, 42.0, 64.0, 86.0, 122.0, 173.0, 216.0, 280.0, 381.0, 438.0, 461.0, 386.0, 320.0, 255.0, 185.0, 133.0, 103.0, 78.0, 50.0, 52.0, 31.0, 26.0, 23.0, 15.0, 9.0, 9.0, 4.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011810302734375, -0.011312484741210938, -0.010814666748046875, -0.010316848754882812, -0.00981903076171875, -0.009321212768554688, -0.008823394775390625, -0.008325576782226562, -0.0078277587890625, -0.0073299407958984375, -0.006832122802734375, -0.0063343048095703125, -0.00583648681640625, -0.0053386688232421875, -0.004840850830078125, -0.0043430328369140625, -0.00384521484375, -0.0033473968505859375, -0.002849578857421875, -0.0023517608642578125, -0.00185394287109375, -0.0013561248779296875, -0.000858306884765625, -0.0003604888916015625, 0.0001373291015625, 0.0006351470947265625, 0.001132965087890625, 0.0016307830810546875, 0.00212860107421875, 0.0026264190673828125, 0.003124237060546875, 0.0036220550537109375, 0.004119873046875, 0.0046176910400390625, 0.005115509033203125, 0.0056133270263671875, 0.00611114501953125, 0.0066089630126953125, 0.007106781005859375, 0.0076045989990234375, 0.0081024169921875, 0.008600234985351562, 0.009098052978515625, 0.009595870971679688, 0.01009368896484375, 0.010591506958007812, 0.011089324951171875, 0.011587142944335938, 0.0120849609375, 0.012582778930664062, 0.013080596923828125, 0.013578414916992188, 0.01407623291015625, 0.014574050903320312, 0.015071868896484375, 0.015569686889648438, 0.0160675048828125, 0.016565322875976562, 0.017063140869140625, 0.017560958862304688, 0.01805877685546875, 0.018556594848632812, 0.019054412841796875, 0.019552230834960938, 0.020050048828125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 9.0, 13.0, 31.0, 52.0, 166.0, 325.0, 246.0, 75.0, 37.0, 15.0, 10.0, 8.0, 3.0, 5.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4731270670890808, -0.4598137140274048, -0.44650033116340637, -0.43318697810173035, -0.41987359523773193, -0.4065602421760559, -0.3932468891143799, -0.37993350625038147, -0.36662012338638306, -0.35330677032470703, -0.3399933874607086, -0.3266800343990326, -0.3133666515350342, -0.30005329847335815, -0.28673994541168213, -0.2734265625476837, -0.2601132094860077, -0.24679984152317047, -0.23348647356033325, -0.22017312049865723, -0.2068597376346588, -0.1935463845729828, -0.18023301661014557, -0.16691964864730835, -0.15360628068447113, -0.1402929127216339, -0.1269795447587967, -0.11366618424654007, -0.10035281628370285, -0.08703944832086563, -0.07372608780860901, -0.06041271984577179, -0.04709935188293457, -0.03378598392009735, -0.02047261968255043, -0.0071592554450035095, 0.00615411251783371, 0.01946748048067093, 0.03278084099292755, 0.04609420895576477, 0.05940757691860199, 0.07272094488143921, 0.08603431284427643, 0.09934767335653305, 0.11266104131937027, 0.12597441673278809, 0.1392877697944641, 0.15260113775730133, 0.16591450572013855, 0.17922787368297577, 0.192541241645813, 0.205854594707489, 0.21916797757148743, 0.23248133063316345, 0.24579469859600067, 0.2591080665588379, 0.2724214196205139, 0.28573477268218994, 0.29904815554618835, 0.3123615086078644, 0.3256748914718628, 0.3389882445335388, 0.35230159759521484, 0.36561498045921326, 0.37892836332321167]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 0.0, 3.0, 4.0, 6.0, 2.0, 11.0, 10.0, 9.0, 15.0, 12.0, 22.0, 33.0, 31.0, 39.0, 37.0, 41.0, 52.0, 59.0, 79.0, 49.0, 70.0, 47.0, 56.0, 53.0, 45.0, 44.0, 31.0, 22.0, 29.0, 25.0, 12.0, 12.0, 11.0, 11.0, 5.0, 3.0, 8.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.09200793504714966, -0.08866562694311142, -0.08532331883907318, -0.08198101073503494, -0.0786387026309967, -0.07529638707637787, -0.07195407897233963, -0.06861177086830139, -0.06526946276426315, -0.061927154660224915, -0.058584846556186676, -0.05524253472685814, -0.0519002266228199, -0.04855791851878166, -0.045215606689453125, -0.041873298585414886, -0.03853099048137665, -0.03518868237733841, -0.03184637427330017, -0.028504062443971634, -0.025161754339933395, -0.021819446235895157, -0.01847713626921177, -0.015134826302528381, -0.011792518198490143, -0.00845020916312933, -0.0051079001277685165, -0.0017655910924077034, 0.0015767179429531097, 0.004919026046991348, 0.008261336013674736, 0.011603645980358124, 0.014945954084396362, 0.0182882621884346, 0.02163057215511799, 0.024972882121801376, 0.028315190225839615, 0.03165749832987785, 0.03499981015920639, 0.03834211826324463, 0.04168442636728287, 0.045026734471321106, 0.048369042575359344, 0.05171135440468788, 0.05505366250872612, 0.05839597061276436, 0.061738282442092896, 0.06508059054613113, 0.06842289865016937, 0.07176520675420761, 0.07510751485824585, 0.07844982296228409, 0.08179213106632233, 0.08513444662094116, 0.0884767547249794, 0.09181906282901764, 0.09516137093305588, 0.09850367903709412, 0.10184598714113235, 0.1051882952451706, 0.10853061079978943, 0.11187291145324707, 0.1152152270078659, 0.11855753511190414, 0.12189984321594238]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 5.0, 4.0, 11.0, 13.0, 18.0, 18.0, 29.0, 51.0, 67.0, 101.0, 159.0, 259.0, 472.0, 964.0, 2203.0, 7198.0, 42072.0, 593646.0, 363761.0, 28118.0, 5631.0, 1856.0, 773.0, 421.0, 257.0, 129.0, 92.0, 67.0, 43.0, 32.0, 18.0, 12.0, 10.0, 5.0, 7.0, 4.0, 6.0, 2.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0228271484375, -0.02200913429260254, -0.021191120147705078, -0.020373106002807617, -0.019555091857910156, -0.018737077713012695, -0.017919063568115234, -0.017101049423217773, -0.016283035278320312, -0.015465021133422852, -0.01464700698852539, -0.01382899284362793, -0.013010978698730469, -0.012192964553833008, -0.011374950408935547, -0.010556936264038086, -0.009738922119140625, -0.008920907974243164, -0.008102893829345703, -0.007284879684448242, -0.006466865539550781, -0.00564885139465332, -0.004830837249755859, -0.0040128231048583984, -0.0031948089599609375, -0.0023767948150634766, -0.0015587806701660156, -0.0007407665252685547, 7.724761962890625e-05, 0.0008952617645263672, 0.0017132759094238281, 0.002531290054321289, 0.00334930419921875, 0.004167318344116211, 0.004985332489013672, 0.005803346633911133, 0.006621360778808594, 0.007439374923706055, 0.008257389068603516, 0.009075403213500977, 0.009893417358398438, 0.010711431503295898, 0.01152944564819336, 0.01234745979309082, 0.013165473937988281, 0.013983488082885742, 0.014801502227783203, 0.015619516372680664, 0.016437530517578125, 0.017255544662475586, 0.018073558807373047, 0.018891572952270508, 0.01970958709716797, 0.02052760124206543, 0.02134561538696289, 0.02216362953186035, 0.022981643676757812, 0.023799657821655273, 0.024617671966552734, 0.025435686111450195, 0.026253700256347656, 0.027071714401245117, 0.027889728546142578, 0.02870774269104004, 0.0295257568359375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 10.0, 9.0, 11.0, 25.0, 22.0, 26.0, 37.0, 49.0, 55.0, 73.0, 75.0, 86.0, 70.0, 81.0, 69.0, 68.0, 48.0, 42.0, 37.0, 35.0, 17.0, 10.0, 10.0, 8.0, 7.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01442718505859375, -0.01389920711517334, -0.01337122917175293, -0.01284325122833252, -0.01231527328491211, -0.0117872953414917, -0.011259317398071289, -0.010731339454650879, -0.010203361511230469, -0.009675383567810059, -0.009147405624389648, -0.008619427680969238, -0.008091449737548828, -0.007563471794128418, -0.007035493850708008, -0.006507515907287598, -0.0059795379638671875, -0.005451560020446777, -0.004923582077026367, -0.004395604133605957, -0.003867626190185547, -0.0033396482467651367, -0.0028116703033447266, -0.0022836923599243164, -0.0017557144165039062, -0.001227736473083496, -0.0006997585296630859, -0.00017178058624267578, 0.0003561973571777344, 0.0008841753005981445, 0.0014121532440185547, 0.0019401311874389648, 0.002468109130859375, 0.002996087074279785, 0.0035240650177001953, 0.0040520429611206055, 0.004580020904541016, 0.005107998847961426, 0.005635976791381836, 0.006163954734802246, 0.006691932678222656, 0.007219910621643066, 0.0077478885650634766, 0.008275866508483887, 0.008803844451904297, 0.009331822395324707, 0.009859800338745117, 0.010387778282165527, 0.010915756225585938, 0.011443734169006348, 0.011971712112426758, 0.012499690055847168, 0.013027667999267578, 0.013555645942687988, 0.014083623886108398, 0.014611601829528809, 0.015139579772949219, 0.01566755771636963, 0.01619553565979004, 0.01672351360321045, 0.01725149154663086, 0.01777946949005127, 0.01830744743347168, 0.01883542537689209, 0.0193634033203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 8.0, 7.0, 13.0, 21.0, 20.0, 29.0, 51.0, 57.0, 74.0, 124.0, 159.0, 298.0, 863.0, 4145.0, 53338.0, 944849.0, 39489.0, 3383.0, 787.0, 289.0, 158.0, 112.0, 72.0, 61.0, 34.0, 24.0, 21.0, 20.0, 7.0, 8.0, 8.0, 2.0, 6.0, 3.0, 7.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.034454345703125, -0.033509254455566406, -0.03256416320800781, -0.03161907196044922, -0.030673980712890625, -0.02972888946533203, -0.028783798217773438, -0.027838706970214844, -0.02689361572265625, -0.025948524475097656, -0.025003433227539062, -0.02405834197998047, -0.023113250732421875, -0.02216815948486328, -0.021223068237304688, -0.020277976989746094, -0.0193328857421875, -0.018387794494628906, -0.017442703247070312, -0.01649761199951172, -0.015552520751953125, -0.014607429504394531, -0.013662338256835938, -0.012717247009277344, -0.01177215576171875, -0.010827064514160156, -0.009881973266601562, -0.008936882019042969, -0.007991790771484375, -0.007046699523925781, -0.0061016082763671875, -0.005156517028808594, -0.00421142578125, -0.0032663345336914062, -0.0023212432861328125, -0.0013761520385742188, -0.000431060791015625, 0.0005140304565429688, 0.0014591217041015625, 0.0024042129516601562, 0.00334930419921875, 0.004294395446777344, 0.0052394866943359375, 0.006184577941894531, 0.007129669189453125, 0.008074760437011719, 0.009019851684570312, 0.009964942932128906, 0.0109100341796875, 0.011855125427246094, 0.012800216674804688, 0.013745307922363281, 0.014690399169921875, 0.01563549041748047, 0.016580581665039062, 0.017525672912597656, 0.01847076416015625, 0.019415855407714844, 0.020360946655273438, 0.02130603790283203, 0.022251129150390625, 0.02319622039794922, 0.024141311645507812, 0.025086402893066406, 0.026031494140625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 8.0, 6.0, 12.0, 17.0, 21.0, 25.0, 28.0, 30.0, 29.0, 46.0, 54.0, 72.0, 65.0, 75.0, 64.0, 51.0, 65.0, 54.0, 48.0, 50.0, 33.0, 29.0, 34.0, 17.0, 20.0, 15.0, 11.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0399169921875, -0.038826704025268555, -0.03773641586303711, -0.036646127700805664, -0.03555583953857422, -0.03446555137634277, -0.03337526321411133, -0.03228497505187988, -0.031194686889648438, -0.030104398727416992, -0.029014110565185547, -0.0279238224029541, -0.026833534240722656, -0.02574324607849121, -0.024652957916259766, -0.02356266975402832, -0.022472381591796875, -0.02138209342956543, -0.020291805267333984, -0.01920151710510254, -0.018111228942871094, -0.01702094078063965, -0.015930652618408203, -0.014840364456176758, -0.013750076293945312, -0.012659788131713867, -0.011569499969482422, -0.010479211807250977, -0.009388923645019531, -0.008298635482788086, -0.007208347320556641, -0.006118059158325195, -0.00502777099609375, -0.003937482833862305, -0.0028471946716308594, -0.001756906509399414, -0.0006666183471679688, 0.00042366981506347656, 0.0015139579772949219, 0.002604246139526367, 0.0036945343017578125, 0.004784822463989258, 0.005875110626220703, 0.0069653987884521484, 0.008055686950683594, 0.009145975112915039, 0.010236263275146484, 0.01132655143737793, 0.012416839599609375, 0.01350712776184082, 0.014597415924072266, 0.01568770408630371, 0.016777992248535156, 0.0178682804107666, 0.018958568572998047, 0.020048856735229492, 0.021139144897460938, 0.022229433059692383, 0.023319721221923828, 0.024410009384155273, 0.02550029754638672, 0.026590585708618164, 0.02768087387084961, 0.028771162033081055, 0.0298614501953125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 8.0, 2.0, 8.0, 7.0, 18.0, 11.0, 26.0, 32.0, 35.0, 48.0, 85.0, 85.0, 147.0, 216.0, 383.0, 715.0, 1287.0, 2640.0, 6122.0, 17085.0, 64907.0, 362534.0, 480496.0, 78717.0, 19959.0, 6898.0, 2912.0, 1391.0, 730.0, 378.0, 221.0, 126.0, 95.0, 62.0, 45.0, 28.0, 22.0, 15.0, 14.0, 10.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.002506256103515625, -0.0024326741695404053, -0.0023590922355651855, -0.002285510301589966, -0.002211928367614746, -0.0021383464336395264, -0.0020647644996643066, -0.001991182565689087, -0.0019176006317138672, -0.0018440186977386475, -0.0017704367637634277, -0.001696854829788208, -0.0016232728958129883, -0.0015496909618377686, -0.0014761090278625488, -0.001402527093887329, -0.0013289451599121094, -0.0012553632259368896, -0.00118178129196167, -0.0011081993579864502, -0.0010346174240112305, -0.0009610354900360107, -0.000887453556060791, -0.0008138716220855713, -0.0007402896881103516, -0.0006667077541351318, -0.0005931258201599121, -0.0005195438861846924, -0.00044596195220947266, -0.00037238001823425293, -0.0002987980842590332, -0.00022521615028381348, -0.00015163421630859375, -7.805228233337402e-05, -4.470348358154297e-06, 6.911158561706543e-05, 0.00014269351959228516, 0.00021627545356750488, 0.0002898573875427246, 0.00036343932151794434, 0.00043702125549316406, 0.0005106031894683838, 0.0005841851234436035, 0.0006577670574188232, 0.000731348991394043, 0.0008049309253692627, 0.0008785128593444824, 0.0009520947933197021, 0.0010256767272949219, 0.0010992586612701416, 0.0011728405952453613, 0.001246422529220581, 0.0013200044631958008, 0.0013935863971710205, 0.0014671683311462402, 0.00154075026512146, 0.0016143321990966797, 0.0016879141330718994, 0.0017614960670471191, 0.0018350780010223389, 0.0019086599349975586, 0.0019822418689727783, 0.002055823802947998, 0.0021294057369232178, 0.0022029876708984375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 0.0, 7.0, 0.0, 5.0, 12.0, 0.0, 14.0, 28.0, 0.0, 18.0, 36.0, 0.0, 33.0, 46.0, 0.0, 55.0, 0.0, 72.0, 70.0, 0.0, 73.0, 91.0, 0.0, 68.0, 58.0, 0.0, 57.0, 0.0, 51.0, 40.0, 0.0, 48.0, 31.0, 0.0, 28.0, 16.0, 0.0, 10.0, 10.0, 0.0, 8.0, 0.0, 8.0, 2.0, 0.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2135133147239685e-06, -1.1753290891647339e-06, -1.1371448636054993e-06, -1.0989606380462646e-06, -1.06077641248703e-06, -1.0225921869277954e-06, -9.844079613685608e-07, -9.462237358093262e-07, -9.080395102500916e-07, -8.698552846908569e-07, -8.316710591316223e-07, -7.934868335723877e-07, -7.553026080131531e-07, -7.171183824539185e-07, -6.789341568946838e-07, -6.407499313354492e-07, -6.025657057762146e-07, -5.6438148021698e-07, -5.261972546577454e-07, -4.880130290985107e-07, -4.498288035392761e-07, -4.116445779800415e-07, -3.734603524208069e-07, -3.3527612686157227e-07, -2.9709190130233765e-07, -2.5890767574310303e-07, -2.207234501838684e-07, -1.825392246246338e-07, -1.4435499906539917e-07, -1.0617077350616455e-07, -6.798654794692993e-08, -2.9802322387695312e-08, 8.381903171539307e-09, 4.6566128730773926e-08, 8.475035429000854e-08, 1.2293457984924316e-07, 1.6111880540847778e-07, 1.993030309677124e-07, 2.3748725652694702e-07, 2.7567148208618164e-07, 3.1385570764541626e-07, 3.520399332046509e-07, 3.902241587638855e-07, 4.284083843231201e-07, 4.6659260988235474e-07, 5.047768354415894e-07, 5.42961061000824e-07, 5.811452865600586e-07, 6.193295121192932e-07, 6.575137376785278e-07, 6.956979632377625e-07, 7.338821887969971e-07, 7.720664143562317e-07, 8.102506399154663e-07, 8.484348654747009e-07, 8.866190910339355e-07, 9.248033165931702e-07, 9.629875421524048e-07, 1.0011717677116394e-06, 1.039355993270874e-06, 1.0775402188301086e-06, 1.1157244443893433e-06, 1.1539086699485779e-06, 1.1920928955078125e-06]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 10.0, 11.0, 18.0, 21.0, 63.0, 89.0, 149.0, 352.0, 798.0, 2802.0, 17995.0, 779617.0, 234564.0, 8857.0, 1815.0, 638.0, 351.0, 178.0, 76.0, 43.0, 30.0, 26.0, 12.0, 7.0, 8.0, 8.0, 5.0, 5.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00489044189453125, -0.004666686058044434, -0.004442930221557617, -0.004219174385070801, -0.003995418548583984, -0.003771662712097168, -0.0035479068756103516, -0.003324151039123535, -0.0031003952026367188, -0.0028766393661499023, -0.002652883529663086, -0.0024291276931762695, -0.002205371856689453, -0.0019816160202026367, -0.0017578601837158203, -0.001534104347229004, -0.0013103485107421875, -0.001086592674255371, -0.0008628368377685547, -0.0006390810012817383, -0.0004153251647949219, -0.00019156932830810547, 3.218650817871094e-05, 0.00025594234466552734, 0.00047969818115234375, 0.0007034540176391602, 0.0009272098541259766, 0.001150965690612793, 0.0013747215270996094, 0.0015984773635864258, 0.0018222332000732422, 0.0020459890365600586, 0.002269744873046875, 0.0024935007095336914, 0.002717256546020508, 0.0029410123825073242, 0.0031647682189941406, 0.003388524055480957, 0.0036122798919677734, 0.00383603572845459, 0.004059791564941406, 0.004283547401428223, 0.004507303237915039, 0.0047310590744018555, 0.004954814910888672, 0.005178570747375488, 0.005402326583862305, 0.005626082420349121, 0.0058498382568359375, 0.006073594093322754, 0.00629734992980957, 0.006521105766296387, 0.006744861602783203, 0.0069686174392700195, 0.007192373275756836, 0.007416129112243652, 0.007639884948730469, 0.007863640785217285, 0.008087396621704102, 0.008311152458190918, 0.008534908294677734, 0.00875866413116455, 0.008982419967651367, 0.009206175804138184, 0.009429931640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 5.0, 6.0, 3.0, 4.0, 10.0, 8.0, 20.0, 18.0, 31.0, 28.0, 33.0, 31.0, 46.0, 53.0, 78.0, 57.0, 79.0, 74.0, 62.0, 53.0, 43.0, 39.0, 36.0, 32.0, 21.0, 22.0, 19.0, 14.0, 14.0, 12.0, 5.0, 5.0, 4.0, 8.0, 5.0, 3.0, 5.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0029659271240234375, -0.0028659403324127197, -0.002765953540802002, -0.002665966749191284, -0.0025659799575805664, -0.0024659931659698486, -0.002366006374359131, -0.002266019582748413, -0.0021660327911376953, -0.0020660459995269775, -0.0019660592079162598, -0.001866072416305542, -0.0017660856246948242, -0.0016660988330841064, -0.0015661120414733887, -0.001466125249862671, -0.0013661384582519531, -0.0012661516666412354, -0.0011661648750305176, -0.0010661780834197998, -0.000966191291809082, -0.0008662045001983643, -0.0007662177085876465, -0.0006662309169769287, -0.0005662441253662109, -0.00046625733375549316, -0.0003662705421447754, -0.0002662837505340576, -0.00016629695892333984, -6.631016731262207e-05, 3.36766242980957e-05, 0.00013366341590881348, 0.00023365020751953125, 0.000333636999130249, 0.0004336237907409668, 0.0005336105823516846, 0.0006335973739624023, 0.0007335841655731201, 0.0008335709571838379, 0.0009335577487945557, 0.0010335445404052734, 0.0011335313320159912, 0.001233518123626709, 0.0013335049152374268, 0.0014334917068481445, 0.0015334784984588623, 0.00163346529006958, 0.0017334520816802979, 0.0018334388732910156, 0.0019334256649017334, 0.002033412456512451, 0.002133399248123169, 0.0022333860397338867, 0.0023333728313446045, 0.0024333596229553223, 0.00253334641456604, 0.002633333206176758, 0.0027333199977874756, 0.0028333067893981934, 0.002933293581008911, 0.003033280372619629, 0.0031332671642303467, 0.0032332539558410645, 0.0033332407474517822, 0.0034332275390625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 3.0, 7.0, 3.0, 9.0, 18.0, 36.0, 88.0, 137.0, 219.0, 199.0, 118.0, 71.0, 35.0, 24.0, 14.0, 5.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12021695822477341, -0.11591017246246338, -0.11160339415073395, -0.10729660838842392, -0.10298983007669449, -0.09868304431438446, -0.09437626600265503, -0.090069480240345, -0.08576269447803497, -0.08145590871572495, -0.07714913040399551, -0.07284234464168549, -0.06853556632995605, -0.06422878056764603, -0.0599219985306263, -0.05561521649360657, -0.051308438181877136, -0.04700165614485741, -0.04269487410783768, -0.03838808834552765, -0.03408131003379822, -0.02977452613413334, -0.02546774223446846, -0.02116096019744873, -0.016854178160429, -0.012547396123409271, -0.008240613155066967, -0.003933830186724663, 0.00037295185029506683, 0.0046797338873147964, 0.008986517786979675, 0.013293299823999405, 0.017600074410438538, 0.021906856447458267, 0.026213638484477997, 0.030520422384142876, 0.034827202558517456, 0.039133988320827484, 0.043440770357847214, 0.04774755239486694, 0.05205433443188667, 0.0563611164689064, 0.06066789850592613, 0.06497468054294586, 0.06928146630525589, 0.07358824461698532, 0.07789503037929535, 0.08220180869102478, 0.08650859445333481, 0.09081538021564484, 0.09512215852737427, 0.0994289442896843, 0.10373572260141373, 0.10804250836372375, 0.11234928667545319, 0.11665607243776321, 0.12096285820007324, 0.12526963651180267, 0.1295764297246933, 0.13388320803642273, 0.13818998634815216, 0.1424967646598816, 0.14680355787277222, 0.15111033618450165, 0.15541711449623108]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 2.0, 6.0, 7.0, 7.0, 10.0, 8.0, 6.0, 8.0, 17.0, 18.0, 31.0, 21.0, 22.0, 31.0, 26.0, 35.0, 41.0, 37.0, 35.0, 36.0, 52.0, 51.0, 61.0, 42.0, 41.0, 41.0, 39.0, 39.0, 28.0, 27.0, 29.0, 20.0, 20.0, 18.0, 14.0, 16.0, 19.0, 10.0, 5.0, 3.0, 5.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07492536306381226, -0.07257053256034851, -0.07021570205688477, -0.06786087155342102, -0.06550604104995728, -0.06315120309591293, -0.06079637259244919, -0.05844154208898544, -0.0560867115855217, -0.05373188108205795, -0.05137705057859421, -0.049022216349840164, -0.04666738584637642, -0.044312555342912674, -0.04195772111415863, -0.039602890610694885, -0.03724806010723114, -0.034893229603767395, -0.03253839910030365, -0.030183564871549606, -0.02782873436808586, -0.025473903864622116, -0.023119071498513222, -0.020764239132404327, -0.018409408628940582, -0.016054578125476837, -0.013699745759367943, -0.011344914324581623, -0.008990082889795303, -0.006635251455008984, -0.004280420020222664, -0.0019255876541137695, 0.0004292428493499756, 0.0027840742841362953, 0.005138905718922615, 0.007493737153708935, 0.009848568588495255, 0.012203400023281574, 0.014558231458067894, 0.01691306382417679, 0.019267894327640533, 0.02162272483110428, 0.023977557197213173, 0.026332389563322067, 0.028687220066785812, 0.031042050570249557, 0.0333968847990036, 0.035751715302467346, 0.03810654580593109, 0.040461376309394836, 0.04281620681285858, 0.045171041041612625, 0.04752587154507637, 0.049880702048540115, 0.05223553627729416, 0.054590366780757904, 0.05694519728422165, 0.059300027787685394, 0.06165485829114914, 0.06400968879461288, 0.06636452674865723, 0.06871935725212097, 0.07107418775558472, 0.07342901825904846, 0.07578384876251221]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 0.0, 2.0, 2.0, 8.0, 8.0, 3.0, 6.0, 5.0, 10.0, 7.0, 9.0, 14.0, 26.0, 27.0, 43.0, 39.0, 75.0, 176.0, 276.0, 57.0, 42.0, 27.0, 28.0, 24.0, 13.0, 18.0, 16.0, 10.0, 7.0, 3.0, 2.0, 4.0, 5.0, 5.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015838623046875, -0.015275239944458008, -0.014711856842041016, -0.014148473739624023, -0.013585090637207031, -0.013021707534790039, -0.012458324432373047, -0.011894941329956055, -0.011331558227539062, -0.01076817512512207, -0.010204792022705078, -0.009641408920288086, -0.009078025817871094, -0.008514642715454102, -0.00795125961303711, -0.007387876510620117, -0.006824493408203125, -0.006261110305786133, -0.005697727203369141, -0.0051343441009521484, -0.004570960998535156, -0.004007577896118164, -0.003444194793701172, -0.0028808116912841797, -0.0023174285888671875, -0.0017540454864501953, -0.0011906623840332031, -0.0006272792816162109, -6.389617919921875e-05, 0.0004994869232177734, 0.0010628700256347656, 0.0016262531280517578, 0.00218963623046875, 0.002753019332885742, 0.0033164024353027344, 0.0038797855377197266, 0.004443168640136719, 0.005006551742553711, 0.005569934844970703, 0.006133317947387695, 0.0066967010498046875, 0.00726008415222168, 0.007823467254638672, 0.008386850357055664, 0.008950233459472656, 0.009513616561889648, 0.01007699966430664, 0.010640382766723633, 0.011203765869140625, 0.011767148971557617, 0.01233053207397461, 0.012893915176391602, 0.013457298278808594, 0.014020681381225586, 0.014584064483642578, 0.01514744758605957, 0.015710830688476562, 0.016274213790893555, 0.016837596893310547, 0.01740097999572754, 0.01796436309814453, 0.018527746200561523, 0.019091129302978516, 0.019654512405395508, 0.0202178955078125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 9.0, 13.0, 19.0, 33.0, 58.0, 123.0, 230.0, 745.0, 5064.0, 8331503.0, 47778.0, 2144.0, 492.0, 168.0, 82.0, 43.0, 23.0, 16.0, 9.0, 10.0, 6.0, 7.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062177058309316635, -0.05932721868157387, -0.0564773827791214, -0.05362754315137863, -0.050777703523635864, -0.0479278638958931, -0.04507802426815033, -0.04222818836569786, -0.03937834873795509, -0.036528509110212326, -0.03367867320775986, -0.03082883358001709, -0.027978993952274323, -0.025129154324531555, -0.022279316559433937, -0.01942947879433632, -0.01657963916659355, -0.013729800470173359, -0.010879961773753166, -0.008030123077332973, -0.005180284380912781, -0.002330445684492588, 0.0005193930119276047, 0.0033692307770252228, 0.00621907040476799, 0.009068909101188183, 0.011918747797608376, 0.014768586494028568, 0.01761842519044876, 0.02046826481819153, 0.023318102583289146, 0.026167940348386765, 0.029017776250839233, 0.031867615878582, 0.03471745550632477, 0.03756729140877724, 0.040417131036520004, 0.04326697066426277, 0.04611680656671524, 0.04896664619445801, 0.051816485822200775, 0.05466632544994354, 0.05751616507768631, 0.06036600098013878, 0.06321583688259125, 0.06606567651033401, 0.06891551613807678, 0.07176535576581955, 0.07461519539356232, 0.07746503502130508, 0.08031487464904785, 0.08316471427679062, 0.08601455390453339, 0.08886438608169556, 0.09171422570943832, 0.09456406533718109, 0.09741390496492386, 0.10026374459266663, 0.1031135842204094, 0.10596342384815216, 0.10881325602531433, 0.1116630956530571, 0.11451293528079987, 0.11736277490854263, 0.1202126145362854]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 3.0, 3.0, 5.0, 7.0, 5.0, 5.0, 8.0, 18.0, 19.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09243899583816528, -0.09023238718509674, -0.0880257710814476, -0.08581916242837906, -0.08361254632472992, -0.08140593767166138, -0.07919932901859283, -0.0769927129149437, -0.07478610426187515, -0.07257949560880661, -0.07037287950515747, -0.06816627085208893, -0.06595965474843979, -0.06375304609537125, -0.061546433717012405, -0.059339821338653564, -0.057133208960294724, -0.05492659658193588, -0.05271998420357704, -0.0505133718252182, -0.04830676317214966, -0.04610015079379082, -0.043893538415431976, -0.041686926037073135, -0.039480313658714294, -0.037273701280355453, -0.03506708890199661, -0.03286048024892807, -0.03065386787056923, -0.028447255492210388, -0.026240643113851547, -0.024034030735492706, -0.021827418357133865, -0.019620805978775024, -0.017414195463061333, -0.015207583084702492, -0.013000971637666225, -0.010794360190629959, -0.008587747812271118, -0.006381136365234852, -0.0041745249181985855, -0.0019679132383316755, 0.00023869844153523445, 0.002445310354232788, 0.004651921801269054, 0.006858533248305321, 0.009065145626664162, 0.011271757073700428, 0.013478368520736694, 0.015684980899095535, 0.017891591414809227, 0.020098203793168068, 0.02230481430888176, 0.0245114266872406, 0.02671803906559944, 0.028924651443958282, 0.031131261959671974, 0.033337872475385666, 0.03554448485374451, 0.03775109723210335, 0.03995770961046219, 0.04216431826353073, 0.04437093436717987, 0.04657754302024841, 0.048784155398607254]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 1.0, 9.0, 9.0, 11.0, 12.0, 23.0, 24.0, 29.0, 37.0, 31.0, 52.0, 48.0, 82.0, 84.0, 82.0, 79.0, 54.0, 51.0, 67.0, 54.0, 41.0, 19.0, 15.0, 19.0, 19.0, 12.0, 5.0, 3.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01226806640625, -0.011773824691772461, -0.011279582977294922, -0.010785341262817383, -0.010291099548339844, -0.009796857833862305, -0.009302616119384766, -0.008808374404907227, -0.008314132690429688, -0.007819890975952148, -0.007325649261474609, -0.00683140754699707, -0.006337165832519531, -0.005842924118041992, -0.005348682403564453, -0.004854440689086914, -0.004360198974609375, -0.003865957260131836, -0.003371715545654297, -0.002877473831176758, -0.0023832321166992188, -0.0018889904022216797, -0.0013947486877441406, -0.0009005069732666016, -0.0004062652587890625, 8.797645568847656e-05, 0.0005822181701660156, 0.0010764598846435547, 0.0015707015991210938, 0.002064943313598633, 0.002559185028076172, 0.003053426742553711, 0.00354766845703125, 0.004041910171508789, 0.004536151885986328, 0.005030393600463867, 0.005524635314941406, 0.006018877029418945, 0.006513118743896484, 0.0070073604583740234, 0.0075016021728515625, 0.007995843887329102, 0.00849008560180664, 0.00898432731628418, 0.009478569030761719, 0.009972810745239258, 0.010467052459716797, 0.010961294174194336, 0.011455535888671875, 0.011949777603149414, 0.012444019317626953, 0.012938261032104492, 0.013432502746582031, 0.01392674446105957, 0.01442098617553711, 0.014915227890014648, 0.015409469604492188, 0.015903711318969727, 0.016397953033447266, 0.016892194747924805, 0.017386436462402344, 0.017880678176879883, 0.018374919891357422, 0.01886916160583496, 0.0193634033203125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 9.0, 9.0, 15.0, 12.0, 5.0, 23.0, 30.0, 38.0, 58.0, 100.0, 135.0, 215.0, 323.0, 466.0, 769.0, 1262.0, 2168.0, 3741.0, 6971.0, 14322.0, 32591.0, 97509.0, 211876.0, 90753.0, 31386.0, 13571.0, 6803.0, 3635.0, 2116.0, 1194.0, 725.0, 438.0, 352.0, 197.0, 133.0, 102.0, 55.0, 47.0, 23.0, 28.0, 20.0, 9.0, 8.0, 6.0, 6.0, 5.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0], "bins": [-0.07318115234375, -0.07092761993408203, -0.06867408752441406, -0.0664205551147461, -0.06416702270507812, -0.061913490295410156, -0.05965995788574219, -0.05740642547607422, -0.05515289306640625, -0.05289936065673828, -0.05064582824707031, -0.048392295837402344, -0.046138763427734375, -0.043885231018066406, -0.04163169860839844, -0.03937816619873047, -0.0371246337890625, -0.03487110137939453, -0.03261756896972656, -0.030364036560058594, -0.028110504150390625, -0.025856971740722656, -0.023603439331054688, -0.02134990692138672, -0.01909637451171875, -0.01684284210205078, -0.014589309692382812, -0.012335777282714844, -0.010082244873046875, -0.007828712463378906, -0.0055751800537109375, -0.0033216476440429688, -0.001068115234375, 0.0011854171752929688, 0.0034389495849609375, 0.005692481994628906, 0.007946014404296875, 0.010199546813964844, 0.012453079223632812, 0.014706611633300781, 0.01696014404296875, 0.01921367645263672, 0.021467208862304688, 0.023720741271972656, 0.025974273681640625, 0.028227806091308594, 0.030481338500976562, 0.03273487091064453, 0.0349884033203125, 0.03724193572998047, 0.03949546813964844, 0.041749000549316406, 0.044002532958984375, 0.046256065368652344, 0.04850959777832031, 0.05076313018798828, 0.05301666259765625, 0.05527019500732422, 0.05752372741699219, 0.059777259826660156, 0.062030792236328125, 0.0642843246459961, 0.06653785705566406, 0.06879138946533203, 0.071044921875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 6.0, 11.0, 10.0, 10.0, 13.0, 18.0, 16.0, 16.0, 28.0, 27.0, 26.0, 26.0, 32.0, 40.0, 35.0, 37.0, 45.0, 40.0, 57.0, 28.0, 46.0, 39.0, 28.0, 42.0, 39.0, 40.0, 31.0, 33.0, 25.0, 20.0, 25.0, 20.0, 22.0, 8.0, 21.0, 13.0, 4.0, 7.0, 3.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00696563720703125, -0.006744086742401123, -0.006522536277770996, -0.006300985813140869, -0.006079435348510742, -0.005857884883880615, -0.005636334419250488, -0.005414783954620361, -0.005193233489990234, -0.004971683025360107, -0.0047501325607299805, -0.0045285820960998535, -0.0043070316314697266, -0.0040854811668396, -0.0038639307022094727, -0.0036423802375793457, -0.0034208297729492188, -0.003199279308319092, -0.002977728843688965, -0.002756178379058838, -0.002534627914428711, -0.002313077449798584, -0.002091526985168457, -0.00186997652053833, -0.0016484260559082031, -0.0014268755912780762, -0.0012053251266479492, -0.0009837746620178223, -0.0007622241973876953, -0.0005406737327575684, -0.0003191232681274414, -9.757280349731445e-05, 0.0001239776611328125, 0.00034552812576293945, 0.0005670785903930664, 0.0007886290550231934, 0.0010101795196533203, 0.0012317299842834473, 0.0014532804489135742, 0.0016748309135437012, 0.0018963813781738281, 0.002117931842803955, 0.002339482307434082, 0.002561032772064209, 0.002782583236694336, 0.003004133701324463, 0.00322568416595459, 0.003447234630584717, 0.0036687850952148438, 0.0038903355598449707, 0.004111886024475098, 0.004333436489105225, 0.0045549869537353516, 0.0047765374183654785, 0.0049980878829956055, 0.005219638347625732, 0.005441188812255859, 0.005662739276885986, 0.005884289741516113, 0.00610584020614624, 0.006327390670776367, 0.006548941135406494, 0.006770491600036621, 0.006992042064666748, 0.007213592529296875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 2.0, 0.0, 7.0, 9.0, 8.0, 14.0, 13.0, 22.0, 20.0, 33.0, 56.0, 41.0, 47.0, 37.0, 43.0, 36.0, 27.0, 11.0, 14.0, 9.0, 10.0, 8.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.026083093136548996, -0.025294704362750053, -0.02450631558895111, -0.023717928677797318, -0.022929539903998375, -0.022141151130199432, -0.02135276235640049, -0.020564373582601547, -0.019775984808802605, -0.018987596035003662, -0.01819920726120472, -0.017410818487405777, -0.016622431576251984, -0.01583404280245304, -0.015045654028654099, -0.014257265254855156, -0.013468877412378788, -0.012680488638579845, -0.011892100796103477, -0.011103712022304535, -0.010315323248505592, -0.00952693447470665, -0.008738546632230282, -0.00795015785843134, -0.007161769550293684, -0.006373381242156029, -0.005584992468357086, -0.004796604160219431, -0.004008215852081776, -0.003219827078282833, -0.002431438770145178, -0.0016430499963462353, -0.00085466168820858, -6.627320544794202e-05, 0.000722115277312696, 0.001510503701865673, 0.002298892242833972, 0.003087280783802271, 0.003875669091939926, 0.004664057865738869, 0.005452446173876524, 0.006240834482014179, 0.007029223255813122, 0.00781761109828949, 0.008605999872088432, 0.009394388645887375, 0.010182777419686317, 0.01097116619348526, 0.011759554035961628, 0.01254794280976057, 0.013336330652236938, 0.014124719426035881, 0.014913108199834824, 0.015701496973633766, 0.01648988574743271, 0.017278272658586502, 0.018066661432385445, 0.018855050206184387, 0.01964343897998333, 0.020431827753782272, 0.021220214664936066, 0.022008603438735008, 0.02279699221253395, 0.023585380986332893, 0.024373769760131836]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 4.0, 4.0, 6.0, 6.0, 7.0, 13.0, 6.0, 6.0, 7.0, 11.0, 24.0, 39.0, 53.0, 53.0, 77.0, 42.0, 32.0, 18.0, 13.0, 9.0, 6.0, 6.0, 9.0, 5.0, 10.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03322523832321167, -0.032107096165418625, -0.03098895214498043, -0.029870808124542236, -0.02875266596674919, -0.027634523808956146, -0.026516379788517952, -0.025398235768079758, -0.024280093610286713, -0.023161951452493668, -0.022043807432055473, -0.02092566341161728, -0.019807521253824234, -0.01868937909603119, -0.017571235075592995, -0.0164530910551548, -0.015334948897361755, -0.014216805808246136, -0.013098662719130516, -0.011980519630014896, -0.010862376540899277, -0.009744233451783657, -0.008626090362668037, -0.007507947273552418, -0.006389804184436798, -0.0052716610953211784, -0.004153518006205559, -0.003035374917089939, -0.0019172318279743195, -0.0007990887388586998, 0.00031905435025691986, 0.0014371974393725395, 0.002555340528488159, 0.003673483617603779, 0.0047916267067193985, 0.005909769795835018, 0.007027912884950638, 0.008146055974066257, 0.009264199063181877, 0.010382342152297497, 0.011500485241413116, 0.012618628330528736, 0.013736771419644356, 0.014854914508759975, 0.015973057597875595, 0.01709119975566864, 0.018209343776106834, 0.01932748779654503, 0.020445629954338074, 0.02156377211213112, 0.022681916132569313, 0.023800060153007507, 0.024918202310800552, 0.026036344468593597, 0.02715448848903179, 0.028272632509469986, 0.02939077466726303, 0.030508916825056076, 0.03162705898284912, 0.032745204865932465, 0.03386334702372551, 0.034981489181518555, 0.0360996350646019, 0.03721777722239494, 0.03833591938018799]}, "eval/loss": 8.365464210510254, "eval/bleu": 0.0, "eval/runtime": 3715.1655, "eval/samples_per_second": 3.973, "eval/steps_per_second": 0.993} \ No newline at end of file